{ "best_metric": null, "best_model_checkpoint": null, "epoch": 1.0, "global_step": 8324, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, "learning_rate": 2e-08, "loss": 2.894, "step": 1 }, { "epoch": 0.0, "learning_rate": 4e-08, "loss": 3.0019, "step": 2 }, { "epoch": 0.0, "learning_rate": 6.000000000000001e-08, "loss": 2.81, "step": 3 }, { "epoch": 0.0, "learning_rate": 8e-08, "loss": 2.7314, "step": 4 }, { "epoch": 0.0, "learning_rate": 1.0000000000000001e-07, "loss": 2.783, "step": 5 }, { "epoch": 0.0, "learning_rate": 1.2000000000000002e-07, "loss": 3.076, "step": 6 }, { "epoch": 0.0, "learning_rate": 1.4e-07, "loss": 2.8474, "step": 7 }, { "epoch": 0.0, "learning_rate": 1.6e-07, "loss": 2.93, "step": 8 }, { "epoch": 0.0, "learning_rate": 1.8e-07, "loss": 2.8097, "step": 9 }, { "epoch": 0.0, "learning_rate": 2.0000000000000002e-07, "loss": 3.0645, "step": 10 }, { "epoch": 0.0, "learning_rate": 2.2e-07, "loss": 2.7881, "step": 11 }, { "epoch": 0.0, "learning_rate": 2.4000000000000003e-07, "loss": 2.8377, "step": 12 }, { "epoch": 0.0, "learning_rate": 2.6e-07, "loss": 2.874, "step": 13 }, { "epoch": 0.0, "learning_rate": 2.8e-07, "loss": 2.9909, "step": 14 }, { "epoch": 0.0, "learning_rate": 3.0000000000000004e-07, "loss": 2.7501, "step": 15 }, { "epoch": 0.0, "learning_rate": 3.2e-07, "loss": 2.8209, "step": 16 }, { "epoch": 0.0, "learning_rate": 3.4000000000000003e-07, "loss": 2.8401, "step": 17 }, { "epoch": 0.0, "learning_rate": 3.6e-07, "loss": 2.9457, "step": 18 }, { "epoch": 0.0, "learning_rate": 3.8e-07, "loss": 2.6964, "step": 19 }, { "epoch": 0.0, "learning_rate": 4.0000000000000003e-07, "loss": 2.73, "step": 20 }, { "epoch": 0.0, "learning_rate": 4.2000000000000006e-07, "loss": 2.8011, "step": 21 }, { "epoch": 0.0, "learning_rate": 4.4e-07, "loss": 2.8686, "step": 22 }, { "epoch": 0.0, "learning_rate": 4.6000000000000004e-07, "loss": 2.6424, "step": 23 }, { "epoch": 0.0, "learning_rate": 4.800000000000001e-07, "loss": 2.9452, "step": 24 }, { "epoch": 0.0, "learning_rate": 5.000000000000001e-07, "loss": 2.8218, "step": 25 }, { "epoch": 0.0, "learning_rate": 5.2e-07, "loss": 2.674, "step": 26 }, { "epoch": 0.0, "learning_rate": 5.4e-07, "loss": 2.7029, "step": 27 }, { "epoch": 0.0, "learning_rate": 5.6e-07, "loss": 2.8422, "step": 28 }, { "epoch": 0.0, "learning_rate": 5.800000000000001e-07, "loss": 2.8927, "step": 29 }, { "epoch": 0.0, "learning_rate": 6.000000000000001e-07, "loss": 2.795, "step": 30 }, { "epoch": 0.0, "learning_rate": 6.200000000000001e-07, "loss": 2.7053, "step": 31 }, { "epoch": 0.0, "learning_rate": 6.4e-07, "loss": 2.9824, "step": 32 }, { "epoch": 0.0, "learning_rate": 6.6e-07, "loss": 2.787, "step": 33 }, { "epoch": 0.0, "learning_rate": 6.800000000000001e-07, "loss": 2.7714, "step": 34 }, { "epoch": 0.0, "learning_rate": 7.000000000000001e-07, "loss": 2.6498, "step": 35 }, { "epoch": 0.0, "learning_rate": 7.2e-07, "loss": 2.7993, "step": 36 }, { "epoch": 0.0, "learning_rate": 7.4e-07, "loss": 2.9047, "step": 37 }, { "epoch": 0.0, "learning_rate": 7.6e-07, "loss": 2.8935, "step": 38 }, { "epoch": 0.0, "learning_rate": 7.8e-07, "loss": 2.9095, "step": 39 }, { "epoch": 0.0, "learning_rate": 8.000000000000001e-07, "loss": 2.8189, "step": 40 }, { "epoch": 0.0, "learning_rate": 8.200000000000001e-07, "loss": 2.8549, "step": 41 }, { "epoch": 0.01, "learning_rate": 8.400000000000001e-07, "loss": 2.6603, "step": 42 }, { "epoch": 0.01, "learning_rate": 8.6e-07, "loss": 2.7025, "step": 43 }, { "epoch": 0.01, "learning_rate": 8.8e-07, "loss": 2.8764, "step": 44 }, { "epoch": 0.01, "learning_rate": 9.000000000000001e-07, "loss": 2.862, "step": 45 }, { "epoch": 0.01, "learning_rate": 9.200000000000001e-07, "loss": 3.036, "step": 46 }, { "epoch": 0.01, "learning_rate": 9.400000000000001e-07, "loss": 2.6515, "step": 47 }, { "epoch": 0.01, "learning_rate": 9.600000000000001e-07, "loss": 2.7183, "step": 48 }, { "epoch": 0.01, "learning_rate": 9.800000000000001e-07, "loss": 2.9047, "step": 49 }, { "epoch": 0.01, "learning_rate": 1.0000000000000002e-06, "loss": 2.7998, "step": 50 }, { "epoch": 0.01, "learning_rate": 1.02e-06, "loss": 2.7848, "step": 51 }, { "epoch": 0.01, "learning_rate": 1.04e-06, "loss": 2.7999, "step": 52 }, { "epoch": 0.01, "learning_rate": 1.06e-06, "loss": 2.8986, "step": 53 }, { "epoch": 0.01, "learning_rate": 1.08e-06, "loss": 2.8251, "step": 54 }, { "epoch": 0.01, "learning_rate": 1.1e-06, "loss": 2.9027, "step": 55 }, { "epoch": 0.01, "learning_rate": 1.12e-06, "loss": 2.8808, "step": 56 }, { "epoch": 0.01, "learning_rate": 1.14e-06, "loss": 2.91, "step": 57 }, { "epoch": 0.01, "learning_rate": 1.1600000000000001e-06, "loss": 2.7331, "step": 58 }, { "epoch": 0.01, "learning_rate": 1.1800000000000001e-06, "loss": 2.7588, "step": 59 }, { "epoch": 0.01, "learning_rate": 1.2000000000000002e-06, "loss": 2.7667, "step": 60 }, { "epoch": 0.01, "learning_rate": 1.2200000000000002e-06, "loss": 2.9032, "step": 61 }, { "epoch": 0.01, "learning_rate": 1.2400000000000002e-06, "loss": 2.7458, "step": 62 }, { "epoch": 0.01, "learning_rate": 1.26e-06, "loss": 2.5394, "step": 63 }, { "epoch": 0.01, "learning_rate": 1.28e-06, "loss": 3.0551, "step": 64 }, { "epoch": 0.01, "learning_rate": 1.3e-06, "loss": 2.7652, "step": 65 }, { "epoch": 0.01, "learning_rate": 1.32e-06, "loss": 2.8989, "step": 66 }, { "epoch": 0.01, "learning_rate": 1.34e-06, "loss": 2.813, "step": 67 }, { "epoch": 0.01, "learning_rate": 1.3600000000000001e-06, "loss": 2.975, "step": 68 }, { "epoch": 0.01, "learning_rate": 1.3800000000000001e-06, "loss": 2.5782, "step": 69 }, { "epoch": 0.01, "learning_rate": 1.4000000000000001e-06, "loss": 2.793, "step": 70 }, { "epoch": 0.01, "learning_rate": 1.42e-06, "loss": 2.8399, "step": 71 }, { "epoch": 0.01, "learning_rate": 1.44e-06, "loss": 2.855, "step": 72 }, { "epoch": 0.01, "learning_rate": 1.46e-06, "loss": 2.8153, "step": 73 }, { "epoch": 0.01, "learning_rate": 1.48e-06, "loss": 2.861, "step": 74 }, { "epoch": 0.01, "learning_rate": 1.5e-06, "loss": 3.0008, "step": 75 }, { "epoch": 0.01, "learning_rate": 1.52e-06, "loss": 2.6967, "step": 76 }, { "epoch": 0.01, "learning_rate": 1.54e-06, "loss": 2.7379, "step": 77 }, { "epoch": 0.01, "learning_rate": 1.56e-06, "loss": 2.7266, "step": 78 }, { "epoch": 0.01, "learning_rate": 1.5800000000000001e-06, "loss": 2.7166, "step": 79 }, { "epoch": 0.01, "learning_rate": 1.6000000000000001e-06, "loss": 2.7693, "step": 80 }, { "epoch": 0.01, "learning_rate": 1.6200000000000002e-06, "loss": 2.6919, "step": 81 }, { "epoch": 0.01, "learning_rate": 1.6400000000000002e-06, "loss": 2.7995, "step": 82 }, { "epoch": 0.01, "learning_rate": 1.6600000000000002e-06, "loss": 2.9599, "step": 83 }, { "epoch": 0.01, "learning_rate": 1.6800000000000002e-06, "loss": 2.7051, "step": 84 }, { "epoch": 0.01, "learning_rate": 1.7000000000000002e-06, "loss": 2.7666, "step": 85 }, { "epoch": 0.01, "learning_rate": 1.72e-06, "loss": 2.8841, "step": 86 }, { "epoch": 0.01, "learning_rate": 1.74e-06, "loss": 2.7936, "step": 87 }, { "epoch": 0.01, "learning_rate": 1.76e-06, "loss": 2.7436, "step": 88 }, { "epoch": 0.01, "learning_rate": 1.7800000000000001e-06, "loss": 2.8614, "step": 89 }, { "epoch": 0.01, "learning_rate": 1.8000000000000001e-06, "loss": 2.975, "step": 90 }, { "epoch": 0.01, "learning_rate": 1.8200000000000002e-06, "loss": 2.8066, "step": 91 }, { "epoch": 0.01, "learning_rate": 1.8400000000000002e-06, "loss": 2.7571, "step": 92 }, { "epoch": 0.01, "learning_rate": 1.8600000000000002e-06, "loss": 2.6997, "step": 93 }, { "epoch": 0.01, "learning_rate": 1.8800000000000002e-06, "loss": 2.8759, "step": 94 }, { "epoch": 0.01, "learning_rate": 1.9000000000000002e-06, "loss": 3.0306, "step": 95 }, { "epoch": 0.01, "learning_rate": 1.9200000000000003e-06, "loss": 2.7032, "step": 96 }, { "epoch": 0.01, "learning_rate": 1.94e-06, "loss": 2.8026, "step": 97 }, { "epoch": 0.01, "learning_rate": 1.9600000000000003e-06, "loss": 2.6355, "step": 98 }, { "epoch": 0.01, "learning_rate": 1.98e-06, "loss": 2.6331, "step": 99 }, { "epoch": 0.01, "learning_rate": 2.0000000000000003e-06, "loss": 2.7794, "step": 100 }, { "epoch": 0.01, "learning_rate": 2.02e-06, "loss": 2.7938, "step": 101 }, { "epoch": 0.01, "learning_rate": 2.04e-06, "loss": 3.0001, "step": 102 }, { "epoch": 0.01, "learning_rate": 2.06e-06, "loss": 2.7975, "step": 103 }, { "epoch": 0.01, "learning_rate": 2.08e-06, "loss": 2.7868, "step": 104 }, { "epoch": 0.01, "learning_rate": 2.1000000000000002e-06, "loss": 2.8132, "step": 105 }, { "epoch": 0.01, "learning_rate": 2.12e-06, "loss": 2.7565, "step": 106 }, { "epoch": 0.01, "learning_rate": 2.1400000000000003e-06, "loss": 2.7994, "step": 107 }, { "epoch": 0.01, "learning_rate": 2.16e-06, "loss": 2.8481, "step": 108 }, { "epoch": 0.01, "learning_rate": 2.1800000000000003e-06, "loss": 2.6668, "step": 109 }, { "epoch": 0.01, "learning_rate": 2.2e-06, "loss": 3.0088, "step": 110 }, { "epoch": 0.01, "learning_rate": 2.2200000000000003e-06, "loss": 3.011, "step": 111 }, { "epoch": 0.01, "learning_rate": 2.24e-06, "loss": 2.8221, "step": 112 }, { "epoch": 0.01, "learning_rate": 2.2600000000000004e-06, "loss": 2.7214, "step": 113 }, { "epoch": 0.01, "learning_rate": 2.28e-06, "loss": 2.792, "step": 114 }, { "epoch": 0.01, "learning_rate": 2.3000000000000004e-06, "loss": 2.6355, "step": 115 }, { "epoch": 0.01, "learning_rate": 2.3200000000000002e-06, "loss": 2.8261, "step": 116 }, { "epoch": 0.01, "learning_rate": 2.3400000000000005e-06, "loss": 2.7254, "step": 117 }, { "epoch": 0.01, "learning_rate": 2.3600000000000003e-06, "loss": 2.7874, "step": 118 }, { "epoch": 0.01, "learning_rate": 2.38e-06, "loss": 2.6549, "step": 119 }, { "epoch": 0.01, "learning_rate": 2.4000000000000003e-06, "loss": 2.6885, "step": 120 }, { "epoch": 0.01, "learning_rate": 2.42e-06, "loss": 2.7787, "step": 121 }, { "epoch": 0.01, "learning_rate": 2.4400000000000004e-06, "loss": 2.974, "step": 122 }, { "epoch": 0.01, "learning_rate": 2.46e-06, "loss": 2.6929, "step": 123 }, { "epoch": 0.01, "learning_rate": 2.4800000000000004e-06, "loss": 2.8407, "step": 124 }, { "epoch": 0.02, "learning_rate": 2.5e-06, "loss": 2.911, "step": 125 }, { "epoch": 0.02, "learning_rate": 2.52e-06, "loss": 2.6967, "step": 126 }, { "epoch": 0.02, "learning_rate": 2.5400000000000002e-06, "loss": 2.9059, "step": 127 }, { "epoch": 0.02, "learning_rate": 2.56e-06, "loss": 2.834, "step": 128 }, { "epoch": 0.02, "learning_rate": 2.5800000000000003e-06, "loss": 2.6788, "step": 129 }, { "epoch": 0.02, "learning_rate": 2.6e-06, "loss": 2.8869, "step": 130 }, { "epoch": 0.02, "learning_rate": 2.6200000000000003e-06, "loss": 2.7719, "step": 131 }, { "epoch": 0.02, "learning_rate": 2.64e-06, "loss": 2.8594, "step": 132 }, { "epoch": 0.02, "learning_rate": 2.6600000000000004e-06, "loss": 2.6831, "step": 133 }, { "epoch": 0.02, "learning_rate": 2.68e-06, "loss": 2.7681, "step": 134 }, { "epoch": 0.02, "learning_rate": 2.7000000000000004e-06, "loss": 2.605, "step": 135 }, { "epoch": 0.02, "learning_rate": 2.7200000000000002e-06, "loss": 2.8285, "step": 136 }, { "epoch": 0.02, "learning_rate": 2.7400000000000004e-06, "loss": 2.7449, "step": 137 }, { "epoch": 0.02, "learning_rate": 2.7600000000000003e-06, "loss": 2.7741, "step": 138 }, { "epoch": 0.02, "learning_rate": 2.7800000000000005e-06, "loss": 2.6963, "step": 139 }, { "epoch": 0.02, "learning_rate": 2.8000000000000003e-06, "loss": 2.8074, "step": 140 }, { "epoch": 0.02, "learning_rate": 2.82e-06, "loss": 2.9003, "step": 141 }, { "epoch": 0.02, "learning_rate": 2.84e-06, "loss": 2.6186, "step": 142 }, { "epoch": 0.02, "learning_rate": 2.86e-06, "loss": 2.689, "step": 143 }, { "epoch": 0.02, "learning_rate": 2.88e-06, "loss": 2.6509, "step": 144 }, { "epoch": 0.02, "learning_rate": 2.9e-06, "loss": 2.5075, "step": 145 }, { "epoch": 0.02, "learning_rate": 2.92e-06, "loss": 2.8706, "step": 146 }, { "epoch": 0.02, "learning_rate": 2.9400000000000002e-06, "loss": 2.6303, "step": 147 }, { "epoch": 0.02, "learning_rate": 2.96e-06, "loss": 2.7687, "step": 148 }, { "epoch": 0.02, "learning_rate": 2.9800000000000003e-06, "loss": 2.6951, "step": 149 }, { "epoch": 0.02, "learning_rate": 3e-06, "loss": 3.0126, "step": 150 }, { "epoch": 0.02, "learning_rate": 3.0200000000000003e-06, "loss": 2.7296, "step": 151 }, { "epoch": 0.02, "learning_rate": 3.04e-06, "loss": 2.6615, "step": 152 }, { "epoch": 0.02, "learning_rate": 3.0600000000000003e-06, "loss": 2.8486, "step": 153 }, { "epoch": 0.02, "learning_rate": 3.08e-06, "loss": 2.6163, "step": 154 }, { "epoch": 0.02, "learning_rate": 3.1000000000000004e-06, "loss": 2.5788, "step": 155 }, { "epoch": 0.02, "learning_rate": 3.12e-06, "loss": 2.851, "step": 156 }, { "epoch": 0.02, "learning_rate": 3.1400000000000004e-06, "loss": 2.7258, "step": 157 }, { "epoch": 0.02, "learning_rate": 3.1600000000000002e-06, "loss": 2.8291, "step": 158 }, { "epoch": 0.02, "learning_rate": 3.1800000000000005e-06, "loss": 2.7279, "step": 159 }, { "epoch": 0.02, "learning_rate": 3.2000000000000003e-06, "loss": 2.9104, "step": 160 }, { "epoch": 0.02, "learning_rate": 3.2200000000000005e-06, "loss": 2.6855, "step": 161 }, { "epoch": 0.02, "learning_rate": 3.2400000000000003e-06, "loss": 2.7472, "step": 162 }, { "epoch": 0.02, "learning_rate": 3.2600000000000006e-06, "loss": 2.8647, "step": 163 }, { "epoch": 0.02, "learning_rate": 3.2800000000000004e-06, "loss": 2.9263, "step": 164 }, { "epoch": 0.02, "learning_rate": 3.3000000000000006e-06, "loss": 2.6979, "step": 165 }, { "epoch": 0.02, "learning_rate": 3.3200000000000004e-06, "loss": 2.7195, "step": 166 }, { "epoch": 0.02, "learning_rate": 3.3400000000000006e-06, "loss": 2.8101, "step": 167 }, { "epoch": 0.02, "learning_rate": 3.3600000000000004e-06, "loss": 2.7477, "step": 168 }, { "epoch": 0.02, "learning_rate": 3.3800000000000007e-06, "loss": 2.8066, "step": 169 }, { "epoch": 0.02, "learning_rate": 3.4000000000000005e-06, "loss": 2.7861, "step": 170 }, { "epoch": 0.02, "learning_rate": 3.4200000000000007e-06, "loss": 2.8053, "step": 171 }, { "epoch": 0.02, "learning_rate": 3.44e-06, "loss": 2.7382, "step": 172 }, { "epoch": 0.02, "learning_rate": 3.46e-06, "loss": 2.6885, "step": 173 }, { "epoch": 0.02, "learning_rate": 3.48e-06, "loss": 2.7424, "step": 174 }, { "epoch": 0.02, "learning_rate": 3.5e-06, "loss": 2.7374, "step": 175 }, { "epoch": 0.02, "learning_rate": 3.52e-06, "loss": 2.7216, "step": 176 }, { "epoch": 0.02, "learning_rate": 3.54e-06, "loss": 2.8457, "step": 177 }, { "epoch": 0.02, "learning_rate": 3.5600000000000002e-06, "loss": 2.7685, "step": 178 }, { "epoch": 0.02, "learning_rate": 3.58e-06, "loss": 2.8715, "step": 179 }, { "epoch": 0.02, "learning_rate": 3.6000000000000003e-06, "loss": 2.7292, "step": 180 }, { "epoch": 0.02, "learning_rate": 3.62e-06, "loss": 2.9648, "step": 181 }, { "epoch": 0.02, "learning_rate": 3.6400000000000003e-06, "loss": 2.7378, "step": 182 }, { "epoch": 0.02, "learning_rate": 3.66e-06, "loss": 2.9837, "step": 183 }, { "epoch": 0.02, "learning_rate": 3.6800000000000003e-06, "loss": 2.8348, "step": 184 }, { "epoch": 0.02, "learning_rate": 3.7e-06, "loss": 2.8113, "step": 185 }, { "epoch": 0.02, "learning_rate": 3.7200000000000004e-06, "loss": 2.8178, "step": 186 }, { "epoch": 0.02, "learning_rate": 3.74e-06, "loss": 2.8594, "step": 187 }, { "epoch": 0.02, "learning_rate": 3.7600000000000004e-06, "loss": 2.7789, "step": 188 }, { "epoch": 0.02, "learning_rate": 3.7800000000000002e-06, "loss": 2.7139, "step": 189 }, { "epoch": 0.02, "learning_rate": 3.8000000000000005e-06, "loss": 2.7585, "step": 190 }, { "epoch": 0.02, "learning_rate": 3.820000000000001e-06, "loss": 2.8334, "step": 191 }, { "epoch": 0.02, "learning_rate": 3.8400000000000005e-06, "loss": 2.6522, "step": 192 }, { "epoch": 0.02, "learning_rate": 3.86e-06, "loss": 2.6804, "step": 193 }, { "epoch": 0.02, "learning_rate": 3.88e-06, "loss": 2.6061, "step": 194 }, { "epoch": 0.02, "learning_rate": 3.900000000000001e-06, "loss": 2.6389, "step": 195 }, { "epoch": 0.02, "learning_rate": 3.920000000000001e-06, "loss": 2.6688, "step": 196 }, { "epoch": 0.02, "learning_rate": 3.94e-06, "loss": 2.6974, "step": 197 }, { "epoch": 0.02, "learning_rate": 3.96e-06, "loss": 2.7438, "step": 198 }, { "epoch": 0.02, "learning_rate": 3.980000000000001e-06, "loss": 2.818, "step": 199 }, { "epoch": 0.02, "learning_rate": 4.000000000000001e-06, "loss": 2.5431, "step": 200 }, { "epoch": 0.02, "learning_rate": 4.0200000000000005e-06, "loss": 2.7117, "step": 201 }, { "epoch": 0.02, "learning_rate": 4.04e-06, "loss": 2.7474, "step": 202 }, { "epoch": 0.02, "learning_rate": 4.060000000000001e-06, "loss": 2.6124, "step": 203 }, { "epoch": 0.02, "learning_rate": 4.08e-06, "loss": 2.8398, "step": 204 }, { "epoch": 0.02, "learning_rate": 4.1e-06, "loss": 2.6281, "step": 205 }, { "epoch": 0.02, "learning_rate": 4.12e-06, "loss": 2.6267, "step": 206 }, { "epoch": 0.02, "learning_rate": 4.14e-06, "loss": 2.7716, "step": 207 }, { "epoch": 0.02, "learning_rate": 4.16e-06, "loss": 2.7426, "step": 208 }, { "epoch": 0.03, "learning_rate": 4.18e-06, "loss": 2.9914, "step": 209 }, { "epoch": 0.03, "learning_rate": 4.2000000000000004e-06, "loss": 2.7598, "step": 210 }, { "epoch": 0.03, "learning_rate": 4.22e-06, "loss": 2.6267, "step": 211 }, { "epoch": 0.03, "learning_rate": 4.24e-06, "loss": 2.6901, "step": 212 }, { "epoch": 0.03, "learning_rate": 4.26e-06, "loss": 2.9535, "step": 213 }, { "epoch": 0.03, "learning_rate": 4.2800000000000005e-06, "loss": 2.7835, "step": 214 }, { "epoch": 0.03, "learning_rate": 4.3e-06, "loss": 2.641, "step": 215 }, { "epoch": 0.03, "learning_rate": 4.32e-06, "loss": 2.8062, "step": 216 }, { "epoch": 0.03, "learning_rate": 4.34e-06, "loss": 2.7327, "step": 217 }, { "epoch": 0.03, "learning_rate": 4.360000000000001e-06, "loss": 2.6462, "step": 218 }, { "epoch": 0.03, "learning_rate": 4.38e-06, "loss": 2.7658, "step": 219 }, { "epoch": 0.03, "learning_rate": 4.4e-06, "loss": 2.5678, "step": 220 }, { "epoch": 0.03, "learning_rate": 4.42e-06, "loss": 2.8125, "step": 221 }, { "epoch": 0.03, "learning_rate": 4.440000000000001e-06, "loss": 2.7126, "step": 222 }, { "epoch": 0.03, "learning_rate": 4.4600000000000005e-06, "loss": 2.6183, "step": 223 }, { "epoch": 0.03, "learning_rate": 4.48e-06, "loss": 2.6963, "step": 224 }, { "epoch": 0.03, "learning_rate": 4.5e-06, "loss": 2.6586, "step": 225 }, { "epoch": 0.03, "learning_rate": 4.520000000000001e-06, "loss": 2.741, "step": 226 }, { "epoch": 0.03, "learning_rate": 4.540000000000001e-06, "loss": 2.8272, "step": 227 }, { "epoch": 0.03, "learning_rate": 4.56e-06, "loss": 2.878, "step": 228 }, { "epoch": 0.03, "learning_rate": 4.58e-06, "loss": 2.8037, "step": 229 }, { "epoch": 0.03, "learning_rate": 4.600000000000001e-06, "loss": 2.678, "step": 230 }, { "epoch": 0.03, "learning_rate": 4.620000000000001e-06, "loss": 2.6924, "step": 231 }, { "epoch": 0.03, "learning_rate": 4.6400000000000005e-06, "loss": 2.739, "step": 232 }, { "epoch": 0.03, "learning_rate": 4.66e-06, "loss": 2.8372, "step": 233 }, { "epoch": 0.03, "learning_rate": 4.680000000000001e-06, "loss": 2.7128, "step": 234 }, { "epoch": 0.03, "learning_rate": 4.7e-06, "loss": 2.722, "step": 235 }, { "epoch": 0.03, "learning_rate": 4.7200000000000005e-06, "loss": 2.7681, "step": 236 }, { "epoch": 0.03, "learning_rate": 4.74e-06, "loss": 2.6312, "step": 237 }, { "epoch": 0.03, "learning_rate": 4.76e-06, "loss": 2.5889, "step": 238 }, { "epoch": 0.03, "learning_rate": 4.78e-06, "loss": 2.6731, "step": 239 }, { "epoch": 0.03, "learning_rate": 4.800000000000001e-06, "loss": 2.6796, "step": 240 }, { "epoch": 0.03, "learning_rate": 4.8200000000000004e-06, "loss": 2.7552, "step": 241 }, { "epoch": 0.03, "learning_rate": 4.84e-06, "loss": 2.944, "step": 242 }, { "epoch": 0.03, "learning_rate": 4.86e-06, "loss": 2.8513, "step": 243 }, { "epoch": 0.03, "learning_rate": 4.880000000000001e-06, "loss": 2.6528, "step": 244 }, { "epoch": 0.03, "learning_rate": 4.9000000000000005e-06, "loss": 2.961, "step": 245 }, { "epoch": 0.03, "learning_rate": 4.92e-06, "loss": 2.5977, "step": 246 }, { "epoch": 0.03, "learning_rate": 4.94e-06, "loss": 2.7888, "step": 247 }, { "epoch": 0.03, "learning_rate": 4.960000000000001e-06, "loss": 2.5123, "step": 248 }, { "epoch": 0.03, "learning_rate": 4.980000000000001e-06, "loss": 2.8207, "step": 249 }, { "epoch": 0.03, "learning_rate": 5e-06, "loss": 2.8229, "step": 250 }, { "epoch": 0.03, "learning_rate": 5.02e-06, "loss": 2.8254, "step": 251 }, { "epoch": 0.03, "learning_rate": 5.04e-06, "loss": 2.7459, "step": 252 }, { "epoch": 0.03, "learning_rate": 5.060000000000001e-06, "loss": 2.504, "step": 253 }, { "epoch": 0.03, "learning_rate": 5.0800000000000005e-06, "loss": 2.8549, "step": 254 }, { "epoch": 0.03, "learning_rate": 5.1e-06, "loss": 2.9212, "step": 255 }, { "epoch": 0.03, "learning_rate": 5.12e-06, "loss": 2.7519, "step": 256 }, { "epoch": 0.03, "learning_rate": 5.140000000000001e-06, "loss": 2.7328, "step": 257 }, { "epoch": 0.03, "learning_rate": 5.1600000000000006e-06, "loss": 2.9336, "step": 258 }, { "epoch": 0.03, "learning_rate": 5.18e-06, "loss": 2.8143, "step": 259 }, { "epoch": 0.03, "learning_rate": 5.2e-06, "loss": 2.7595, "step": 260 }, { "epoch": 0.03, "learning_rate": 5.220000000000001e-06, "loss": 2.8413, "step": 261 }, { "epoch": 0.03, "learning_rate": 5.240000000000001e-06, "loss": 2.8455, "step": 262 }, { "epoch": 0.03, "learning_rate": 5.2600000000000005e-06, "loss": 2.8666, "step": 263 }, { "epoch": 0.03, "learning_rate": 5.28e-06, "loss": 2.706, "step": 264 }, { "epoch": 0.03, "learning_rate": 5.300000000000001e-06, "loss": 2.7563, "step": 265 }, { "epoch": 0.03, "learning_rate": 5.320000000000001e-06, "loss": 2.8858, "step": 266 }, { "epoch": 0.03, "learning_rate": 5.3400000000000005e-06, "loss": 2.7714, "step": 267 }, { "epoch": 0.03, "learning_rate": 5.36e-06, "loss": 2.6696, "step": 268 }, { "epoch": 0.03, "learning_rate": 5.380000000000001e-06, "loss": 2.7685, "step": 269 }, { "epoch": 0.03, "learning_rate": 5.400000000000001e-06, "loss": 2.8218, "step": 270 }, { "epoch": 0.03, "learning_rate": 5.420000000000001e-06, "loss": 2.6513, "step": 271 }, { "epoch": 0.03, "learning_rate": 5.4400000000000004e-06, "loss": 2.5531, "step": 272 }, { "epoch": 0.03, "learning_rate": 5.460000000000001e-06, "loss": 2.6738, "step": 273 }, { "epoch": 0.03, "learning_rate": 5.480000000000001e-06, "loss": 2.6684, "step": 274 }, { "epoch": 0.03, "learning_rate": 5.500000000000001e-06, "loss": 2.5771, "step": 275 }, { "epoch": 0.03, "learning_rate": 5.5200000000000005e-06, "loss": 2.7887, "step": 276 }, { "epoch": 0.03, "learning_rate": 5.540000000000001e-06, "loss": 2.6957, "step": 277 }, { "epoch": 0.03, "learning_rate": 5.560000000000001e-06, "loss": 2.7742, "step": 278 }, { "epoch": 0.03, "learning_rate": 5.580000000000001e-06, "loss": 2.8841, "step": 279 }, { "epoch": 0.03, "learning_rate": 5.600000000000001e-06, "loss": 2.6455, "step": 280 }, { "epoch": 0.03, "learning_rate": 5.620000000000001e-06, "loss": 2.6645, "step": 281 }, { "epoch": 0.03, "learning_rate": 5.64e-06, "loss": 2.7753, "step": 282 }, { "epoch": 0.03, "learning_rate": 5.66e-06, "loss": 2.9213, "step": 283 }, { "epoch": 0.03, "learning_rate": 5.68e-06, "loss": 2.7834, "step": 284 }, { "epoch": 0.03, "learning_rate": 5.7e-06, "loss": 2.6396, "step": 285 }, { "epoch": 0.03, "learning_rate": 5.72e-06, "loss": 2.8196, "step": 286 }, { "epoch": 0.03, "learning_rate": 5.74e-06, "loss": 2.661, "step": 287 }, { "epoch": 0.03, "learning_rate": 5.76e-06, "loss": 2.6563, "step": 288 }, { "epoch": 0.03, "learning_rate": 5.78e-06, "loss": 2.6019, "step": 289 }, { "epoch": 0.03, "learning_rate": 5.8e-06, "loss": 2.7255, "step": 290 }, { "epoch": 0.03, "learning_rate": 5.82e-06, "loss": 2.7526, "step": 291 }, { "epoch": 0.04, "learning_rate": 5.84e-06, "loss": 2.7014, "step": 292 }, { "epoch": 0.04, "learning_rate": 5.86e-06, "loss": 2.8109, "step": 293 }, { "epoch": 0.04, "learning_rate": 5.8800000000000005e-06, "loss": 2.7619, "step": 294 }, { "epoch": 0.04, "learning_rate": 5.9e-06, "loss": 2.7368, "step": 295 }, { "epoch": 0.04, "learning_rate": 5.92e-06, "loss": 2.8128, "step": 296 }, { "epoch": 0.04, "learning_rate": 5.94e-06, "loss": 2.7018, "step": 297 }, { "epoch": 0.04, "learning_rate": 5.9600000000000005e-06, "loss": 2.7541, "step": 298 }, { "epoch": 0.04, "learning_rate": 5.98e-06, "loss": 2.7203, "step": 299 }, { "epoch": 0.04, "learning_rate": 6e-06, "loss": 2.7399, "step": 300 }, { "epoch": 0.04, "learning_rate": 6.02e-06, "loss": 2.7455, "step": 301 }, { "epoch": 0.04, "learning_rate": 6.040000000000001e-06, "loss": 2.6941, "step": 302 }, { "epoch": 0.04, "learning_rate": 6.0600000000000004e-06, "loss": 2.9303, "step": 303 }, { "epoch": 0.04, "learning_rate": 6.08e-06, "loss": 2.7382, "step": 304 }, { "epoch": 0.04, "learning_rate": 6.1e-06, "loss": 2.7882, "step": 305 }, { "epoch": 0.04, "learning_rate": 6.120000000000001e-06, "loss": 2.6581, "step": 306 }, { "epoch": 0.04, "learning_rate": 6.1400000000000005e-06, "loss": 2.7062, "step": 307 }, { "epoch": 0.04, "learning_rate": 6.16e-06, "loss": 2.602, "step": 308 }, { "epoch": 0.04, "learning_rate": 6.18e-06, "loss": 2.6892, "step": 309 }, { "epoch": 0.04, "learning_rate": 6.200000000000001e-06, "loss": 2.5565, "step": 310 }, { "epoch": 0.04, "learning_rate": 6.220000000000001e-06, "loss": 2.8248, "step": 311 }, { "epoch": 0.04, "learning_rate": 6.24e-06, "loss": 2.6882, "step": 312 }, { "epoch": 0.04, "learning_rate": 6.26e-06, "loss": 2.6782, "step": 313 }, { "epoch": 0.04, "learning_rate": 6.280000000000001e-06, "loss": 2.6754, "step": 314 }, { "epoch": 0.04, "learning_rate": 6.300000000000001e-06, "loss": 2.8579, "step": 315 }, { "epoch": 0.04, "learning_rate": 6.3200000000000005e-06, "loss": 2.6539, "step": 316 }, { "epoch": 0.04, "learning_rate": 6.34e-06, "loss": 2.5563, "step": 317 }, { "epoch": 0.04, "learning_rate": 6.360000000000001e-06, "loss": 2.6639, "step": 318 }, { "epoch": 0.04, "learning_rate": 6.380000000000001e-06, "loss": 2.6467, "step": 319 }, { "epoch": 0.04, "learning_rate": 6.4000000000000006e-06, "loss": 2.7478, "step": 320 }, { "epoch": 0.04, "learning_rate": 6.42e-06, "loss": 2.4947, "step": 321 }, { "epoch": 0.04, "learning_rate": 6.440000000000001e-06, "loss": 2.5668, "step": 322 }, { "epoch": 0.04, "learning_rate": 6.460000000000001e-06, "loss": 2.7168, "step": 323 }, { "epoch": 0.04, "learning_rate": 6.480000000000001e-06, "loss": 2.8168, "step": 324 }, { "epoch": 0.04, "learning_rate": 6.5000000000000004e-06, "loss": 2.7267, "step": 325 }, { "epoch": 0.04, "learning_rate": 6.520000000000001e-06, "loss": 2.6155, "step": 326 }, { "epoch": 0.04, "learning_rate": 6.540000000000001e-06, "loss": 2.5881, "step": 327 }, { "epoch": 0.04, "learning_rate": 6.560000000000001e-06, "loss": 2.5912, "step": 328 }, { "epoch": 0.04, "learning_rate": 6.5800000000000005e-06, "loss": 2.7586, "step": 329 }, { "epoch": 0.04, "learning_rate": 6.600000000000001e-06, "loss": 2.7013, "step": 330 }, { "epoch": 0.04, "learning_rate": 6.620000000000001e-06, "loss": 2.5506, "step": 331 }, { "epoch": 0.04, "learning_rate": 6.640000000000001e-06, "loss": 2.9118, "step": 332 }, { "epoch": 0.04, "learning_rate": 6.660000000000001e-06, "loss": 2.7971, "step": 333 }, { "epoch": 0.04, "learning_rate": 6.680000000000001e-06, "loss": 2.7011, "step": 334 }, { "epoch": 0.04, "learning_rate": 6.700000000000001e-06, "loss": 2.6823, "step": 335 }, { "epoch": 0.04, "learning_rate": 6.720000000000001e-06, "loss": 2.6775, "step": 336 }, { "epoch": 0.04, "learning_rate": 6.740000000000001e-06, "loss": 2.6323, "step": 337 }, { "epoch": 0.04, "learning_rate": 6.760000000000001e-06, "loss": 2.6911, "step": 338 }, { "epoch": 0.04, "learning_rate": 6.780000000000001e-06, "loss": 2.7132, "step": 339 }, { "epoch": 0.04, "learning_rate": 6.800000000000001e-06, "loss": 2.7473, "step": 340 }, { "epoch": 0.04, "learning_rate": 6.820000000000001e-06, "loss": 2.6943, "step": 341 }, { "epoch": 0.04, "learning_rate": 6.8400000000000014e-06, "loss": 2.7517, "step": 342 }, { "epoch": 0.04, "learning_rate": 6.860000000000001e-06, "loss": 2.7072, "step": 343 }, { "epoch": 0.04, "learning_rate": 6.88e-06, "loss": 2.7432, "step": 344 }, { "epoch": 0.04, "learning_rate": 6.9e-06, "loss": 2.8832, "step": 345 }, { "epoch": 0.04, "learning_rate": 6.92e-06, "loss": 2.852, "step": 346 }, { "epoch": 0.04, "learning_rate": 6.9400000000000005e-06, "loss": 2.619, "step": 347 }, { "epoch": 0.04, "learning_rate": 6.96e-06, "loss": 2.8233, "step": 348 }, { "epoch": 0.04, "learning_rate": 6.98e-06, "loss": 2.8981, "step": 349 }, { "epoch": 0.04, "learning_rate": 7e-06, "loss": 2.7773, "step": 350 }, { "epoch": 0.04, "learning_rate": 7.0200000000000006e-06, "loss": 2.7274, "step": 351 }, { "epoch": 0.04, "learning_rate": 7.04e-06, "loss": 2.8148, "step": 352 }, { "epoch": 0.04, "learning_rate": 7.06e-06, "loss": 2.6504, "step": 353 }, { "epoch": 0.04, "learning_rate": 7.08e-06, "loss": 2.5703, "step": 354 }, { "epoch": 0.04, "learning_rate": 7.100000000000001e-06, "loss": 2.6483, "step": 355 }, { "epoch": 0.04, "learning_rate": 7.1200000000000004e-06, "loss": 2.6792, "step": 356 }, { "epoch": 0.04, "learning_rate": 7.14e-06, "loss": 2.679, "step": 357 }, { "epoch": 0.04, "learning_rate": 7.16e-06, "loss": 2.8833, "step": 358 }, { "epoch": 0.04, "learning_rate": 7.180000000000001e-06, "loss": 2.6336, "step": 359 }, { "epoch": 0.04, "learning_rate": 7.2000000000000005e-06, "loss": 2.6633, "step": 360 }, { "epoch": 0.04, "learning_rate": 7.22e-06, "loss": 2.717, "step": 361 }, { "epoch": 0.04, "learning_rate": 7.24e-06, "loss": 2.554, "step": 362 }, { "epoch": 0.04, "learning_rate": 7.260000000000001e-06, "loss": 2.6725, "step": 363 }, { "epoch": 0.04, "learning_rate": 7.280000000000001e-06, "loss": 2.661, "step": 364 }, { "epoch": 0.04, "learning_rate": 7.3e-06, "loss": 2.5621, "step": 365 }, { "epoch": 0.04, "learning_rate": 7.32e-06, "loss": 2.5976, "step": 366 }, { "epoch": 0.04, "learning_rate": 7.340000000000001e-06, "loss": 2.6586, "step": 367 }, { "epoch": 0.04, "learning_rate": 7.360000000000001e-06, "loss": 2.7344, "step": 368 }, { "epoch": 0.04, "learning_rate": 7.3800000000000005e-06, "loss": 2.6487, "step": 369 }, { "epoch": 0.04, "learning_rate": 7.4e-06, "loss": 2.6789, "step": 370 }, { "epoch": 0.04, "learning_rate": 7.420000000000001e-06, "loss": 2.6848, "step": 371 }, { "epoch": 0.04, "learning_rate": 7.440000000000001e-06, "loss": 2.6134, "step": 372 }, { "epoch": 0.04, "learning_rate": 7.4600000000000006e-06, "loss": 2.7112, "step": 373 }, { "epoch": 0.04, "learning_rate": 7.48e-06, "loss": 2.7807, "step": 374 }, { "epoch": 0.05, "learning_rate": 7.500000000000001e-06, "loss": 2.7532, "step": 375 }, { "epoch": 0.05, "learning_rate": 7.520000000000001e-06, "loss": 2.7242, "step": 376 }, { "epoch": 0.05, "learning_rate": 7.540000000000001e-06, "loss": 2.6479, "step": 377 }, { "epoch": 0.05, "learning_rate": 7.5600000000000005e-06, "loss": 2.7481, "step": 378 }, { "epoch": 0.05, "learning_rate": 7.58e-06, "loss": 2.8313, "step": 379 }, { "epoch": 0.05, "learning_rate": 7.600000000000001e-06, "loss": 2.607, "step": 380 }, { "epoch": 0.05, "learning_rate": 7.620000000000001e-06, "loss": 2.6389, "step": 381 }, { "epoch": 0.05, "learning_rate": 7.640000000000001e-06, "loss": 2.5013, "step": 382 }, { "epoch": 0.05, "learning_rate": 7.660000000000001e-06, "loss": 2.6571, "step": 383 }, { "epoch": 0.05, "learning_rate": 7.680000000000001e-06, "loss": 2.494, "step": 384 }, { "epoch": 0.05, "learning_rate": 7.7e-06, "loss": 2.5826, "step": 385 }, { "epoch": 0.05, "learning_rate": 7.72e-06, "loss": 2.9526, "step": 386 }, { "epoch": 0.05, "learning_rate": 7.74e-06, "loss": 2.756, "step": 387 }, { "epoch": 0.05, "learning_rate": 7.76e-06, "loss": 2.5758, "step": 388 }, { "epoch": 0.05, "learning_rate": 7.78e-06, "loss": 2.7195, "step": 389 }, { "epoch": 0.05, "learning_rate": 7.800000000000002e-06, "loss": 2.6548, "step": 390 }, { "epoch": 0.05, "learning_rate": 7.820000000000001e-06, "loss": 2.701, "step": 391 }, { "epoch": 0.05, "learning_rate": 7.840000000000001e-06, "loss": 2.7511, "step": 392 }, { "epoch": 0.05, "learning_rate": 7.860000000000001e-06, "loss": 2.6924, "step": 393 }, { "epoch": 0.05, "learning_rate": 7.88e-06, "loss": 2.7395, "step": 394 }, { "epoch": 0.05, "learning_rate": 7.9e-06, "loss": 2.6731, "step": 395 }, { "epoch": 0.05, "learning_rate": 7.92e-06, "loss": 2.6414, "step": 396 }, { "epoch": 0.05, "learning_rate": 7.94e-06, "loss": 2.8004, "step": 397 }, { "epoch": 0.05, "learning_rate": 7.960000000000002e-06, "loss": 2.521, "step": 398 }, { "epoch": 0.05, "learning_rate": 7.980000000000002e-06, "loss": 2.7233, "step": 399 }, { "epoch": 0.05, "learning_rate": 8.000000000000001e-06, "loss": 2.7275, "step": 400 }, { "epoch": 0.05, "learning_rate": 8.020000000000001e-06, "loss": 2.6185, "step": 401 }, { "epoch": 0.05, "learning_rate": 8.040000000000001e-06, "loss": 2.57, "step": 402 }, { "epoch": 0.05, "learning_rate": 8.06e-06, "loss": 2.6627, "step": 403 }, { "epoch": 0.05, "learning_rate": 8.08e-06, "loss": 2.7651, "step": 404 }, { "epoch": 0.05, "learning_rate": 8.1e-06, "loss": 2.6516, "step": 405 }, { "epoch": 0.05, "learning_rate": 8.120000000000002e-06, "loss": 2.8147, "step": 406 }, { "epoch": 0.05, "learning_rate": 8.14e-06, "loss": 2.8192, "step": 407 }, { "epoch": 0.05, "learning_rate": 8.16e-06, "loss": 2.671, "step": 408 }, { "epoch": 0.05, "learning_rate": 8.18e-06, "loss": 2.7703, "step": 409 }, { "epoch": 0.05, "learning_rate": 8.2e-06, "loss": 2.629, "step": 410 }, { "epoch": 0.05, "learning_rate": 8.220000000000001e-06, "loss": 2.634, "step": 411 }, { "epoch": 0.05, "learning_rate": 8.24e-06, "loss": 2.8503, "step": 412 }, { "epoch": 0.05, "learning_rate": 8.26e-06, "loss": 2.6991, "step": 413 }, { "epoch": 0.05, "learning_rate": 8.28e-06, "loss": 2.714, "step": 414 }, { "epoch": 0.05, "learning_rate": 8.3e-06, "loss": 2.8076, "step": 415 }, { "epoch": 0.05, "learning_rate": 8.32e-06, "loss": 2.6083, "step": 416 }, { "epoch": 0.05, "learning_rate": 8.34e-06, "loss": 2.7288, "step": 417 }, { "epoch": 0.05, "learning_rate": 8.36e-06, "loss": 2.8534, "step": 418 }, { "epoch": 0.05, "learning_rate": 8.380000000000001e-06, "loss": 2.6112, "step": 419 }, { "epoch": 0.05, "learning_rate": 8.400000000000001e-06, "loss": 2.6004, "step": 420 }, { "epoch": 0.05, "learning_rate": 8.42e-06, "loss": 2.7698, "step": 421 }, { "epoch": 0.05, "learning_rate": 8.44e-06, "loss": 2.8104, "step": 422 }, { "epoch": 0.05, "learning_rate": 8.46e-06, "loss": 2.8756, "step": 423 }, { "epoch": 0.05, "learning_rate": 8.48e-06, "loss": 2.9634, "step": 424 }, { "epoch": 0.05, "learning_rate": 8.5e-06, "loss": 2.7704, "step": 425 }, { "epoch": 0.05, "learning_rate": 8.52e-06, "loss": 2.7487, "step": 426 }, { "epoch": 0.05, "learning_rate": 8.540000000000001e-06, "loss": 2.8121, "step": 427 }, { "epoch": 0.05, "learning_rate": 8.560000000000001e-06, "loss": 2.6654, "step": 428 }, { "epoch": 0.05, "learning_rate": 8.580000000000001e-06, "loss": 2.6113, "step": 429 }, { "epoch": 0.05, "learning_rate": 8.6e-06, "loss": 2.5954, "step": 430 }, { "epoch": 0.05, "learning_rate": 8.62e-06, "loss": 2.7727, "step": 431 }, { "epoch": 0.05, "learning_rate": 8.64e-06, "loss": 2.6134, "step": 432 }, { "epoch": 0.05, "learning_rate": 8.66e-06, "loss": 2.7212, "step": 433 }, { "epoch": 0.05, "learning_rate": 8.68e-06, "loss": 2.7521, "step": 434 }, { "epoch": 0.05, "learning_rate": 8.700000000000001e-06, "loss": 2.7893, "step": 435 }, { "epoch": 0.05, "learning_rate": 8.720000000000001e-06, "loss": 2.6715, "step": 436 }, { "epoch": 0.05, "learning_rate": 8.740000000000001e-06, "loss": 2.8775, "step": 437 }, { "epoch": 0.05, "learning_rate": 8.76e-06, "loss": 2.7883, "step": 438 }, { "epoch": 0.05, "learning_rate": 8.78e-06, "loss": 2.7315, "step": 439 }, { "epoch": 0.05, "learning_rate": 8.8e-06, "loss": 2.7721, "step": 440 }, { "epoch": 0.05, "learning_rate": 8.82e-06, "loss": 2.6575, "step": 441 }, { "epoch": 0.05, "learning_rate": 8.84e-06, "loss": 2.7204, "step": 442 }, { "epoch": 0.05, "learning_rate": 8.860000000000002e-06, "loss": 2.6011, "step": 443 }, { "epoch": 0.05, "learning_rate": 8.880000000000001e-06, "loss": 2.7836, "step": 444 }, { "epoch": 0.05, "learning_rate": 8.900000000000001e-06, "loss": 2.6523, "step": 445 }, { "epoch": 0.05, "learning_rate": 8.920000000000001e-06, "loss": 2.694, "step": 446 }, { "epoch": 0.05, "learning_rate": 8.94e-06, "loss": 2.7417, "step": 447 }, { "epoch": 0.05, "learning_rate": 8.96e-06, "loss": 2.7703, "step": 448 }, { "epoch": 0.05, "learning_rate": 8.98e-06, "loss": 2.865, "step": 449 }, { "epoch": 0.05, "learning_rate": 9e-06, "loss": 2.7502, "step": 450 }, { "epoch": 0.05, "learning_rate": 9.020000000000002e-06, "loss": 2.7532, "step": 451 }, { "epoch": 0.05, "learning_rate": 9.040000000000002e-06, "loss": 2.6585, "step": 452 }, { "epoch": 0.05, "learning_rate": 9.060000000000001e-06, "loss": 2.9593, "step": 453 }, { "epoch": 0.05, "learning_rate": 9.080000000000001e-06, "loss": 2.6351, "step": 454 }, { "epoch": 0.05, "learning_rate": 9.100000000000001e-06, "loss": 2.7307, "step": 455 }, { "epoch": 0.05, "learning_rate": 9.12e-06, "loss": 2.797, "step": 456 }, { "epoch": 0.05, "learning_rate": 9.14e-06, "loss": 2.7763, "step": 457 }, { "epoch": 0.06, "learning_rate": 9.16e-06, "loss": 2.7832, "step": 458 }, { "epoch": 0.06, "learning_rate": 9.180000000000002e-06, "loss": 2.5781, "step": 459 }, { "epoch": 0.06, "learning_rate": 9.200000000000002e-06, "loss": 2.7653, "step": 460 }, { "epoch": 0.06, "learning_rate": 9.220000000000002e-06, "loss": 2.6696, "step": 461 }, { "epoch": 0.06, "learning_rate": 9.240000000000001e-06, "loss": 2.6251, "step": 462 }, { "epoch": 0.06, "learning_rate": 9.260000000000001e-06, "loss": 2.6316, "step": 463 }, { "epoch": 0.06, "learning_rate": 9.280000000000001e-06, "loss": 2.7429, "step": 464 }, { "epoch": 0.06, "learning_rate": 9.3e-06, "loss": 2.6906, "step": 465 }, { "epoch": 0.06, "learning_rate": 9.32e-06, "loss": 2.6813, "step": 466 }, { "epoch": 0.06, "learning_rate": 9.340000000000002e-06, "loss": 2.8493, "step": 467 }, { "epoch": 0.06, "learning_rate": 9.360000000000002e-06, "loss": 2.715, "step": 468 }, { "epoch": 0.06, "learning_rate": 9.38e-06, "loss": 2.5253, "step": 469 }, { "epoch": 0.06, "learning_rate": 9.4e-06, "loss": 2.7604, "step": 470 }, { "epoch": 0.06, "learning_rate": 9.42e-06, "loss": 2.4687, "step": 471 }, { "epoch": 0.06, "learning_rate": 9.440000000000001e-06, "loss": 2.7829, "step": 472 }, { "epoch": 0.06, "learning_rate": 9.460000000000001e-06, "loss": 2.6582, "step": 473 }, { "epoch": 0.06, "learning_rate": 9.48e-06, "loss": 2.6355, "step": 474 }, { "epoch": 0.06, "learning_rate": 9.5e-06, "loss": 2.8583, "step": 475 }, { "epoch": 0.06, "learning_rate": 9.52e-06, "loss": 2.7574, "step": 476 }, { "epoch": 0.06, "learning_rate": 9.54e-06, "loss": 2.7816, "step": 477 }, { "epoch": 0.06, "learning_rate": 9.56e-06, "loss": 2.6692, "step": 478 }, { "epoch": 0.06, "learning_rate": 9.58e-06, "loss": 2.6472, "step": 479 }, { "epoch": 0.06, "learning_rate": 9.600000000000001e-06, "loss": 2.6968, "step": 480 }, { "epoch": 0.06, "learning_rate": 9.620000000000001e-06, "loss": 2.8404, "step": 481 }, { "epoch": 0.06, "learning_rate": 9.640000000000001e-06, "loss": 2.6729, "step": 482 }, { "epoch": 0.06, "learning_rate": 9.66e-06, "loss": 2.9113, "step": 483 }, { "epoch": 0.06, "learning_rate": 9.68e-06, "loss": 2.6295, "step": 484 }, { "epoch": 0.06, "learning_rate": 9.7e-06, "loss": 2.7364, "step": 485 }, { "epoch": 0.06, "learning_rate": 9.72e-06, "loss": 2.7664, "step": 486 }, { "epoch": 0.06, "learning_rate": 9.74e-06, "loss": 2.7076, "step": 487 }, { "epoch": 0.06, "learning_rate": 9.760000000000001e-06, "loss": 2.6171, "step": 488 }, { "epoch": 0.06, "learning_rate": 9.780000000000001e-06, "loss": 2.7698, "step": 489 }, { "epoch": 0.06, "learning_rate": 9.800000000000001e-06, "loss": 3.0325, "step": 490 }, { "epoch": 0.06, "learning_rate": 9.820000000000001e-06, "loss": 2.7837, "step": 491 }, { "epoch": 0.06, "learning_rate": 9.84e-06, "loss": 2.5562, "step": 492 }, { "epoch": 0.06, "learning_rate": 9.86e-06, "loss": 2.765, "step": 493 }, { "epoch": 0.06, "learning_rate": 9.88e-06, "loss": 2.6804, "step": 494 }, { "epoch": 0.06, "learning_rate": 9.9e-06, "loss": 2.7081, "step": 495 }, { "epoch": 0.06, "learning_rate": 9.920000000000002e-06, "loss": 2.8065, "step": 496 }, { "epoch": 0.06, "learning_rate": 9.940000000000001e-06, "loss": 2.7093, "step": 497 }, { "epoch": 0.06, "learning_rate": 9.960000000000001e-06, "loss": 2.8892, "step": 498 }, { "epoch": 0.06, "learning_rate": 9.980000000000001e-06, "loss": 2.7807, "step": 499 }, { "epoch": 0.06, "learning_rate": 1e-05, "loss": 2.7471, "step": 500 }, { "epoch": 0.06, "learning_rate": 9.999999596928526e-06, "loss": 2.8152, "step": 501 }, { "epoch": 0.06, "learning_rate": 9.999998387714165e-06, "loss": 2.7673, "step": 502 }, { "epoch": 0.06, "learning_rate": 9.999996372357115e-06, "loss": 2.7032, "step": 503 }, { "epoch": 0.06, "learning_rate": 9.999993550857701e-06, "loss": 2.8087, "step": 504 }, { "epoch": 0.06, "learning_rate": 9.999989923216374e-06, "loss": 2.8449, "step": 505 }, { "epoch": 0.06, "learning_rate": 9.999985489433723e-06, "loss": 2.6203, "step": 506 }, { "epoch": 0.06, "learning_rate": 9.99998024951046e-06, "loss": 2.4976, "step": 507 }, { "epoch": 0.06, "learning_rate": 9.999974203447434e-06, "loss": 2.9274, "step": 508 }, { "epoch": 0.06, "learning_rate": 9.999967351245614e-06, "loss": 2.5602, "step": 509 }, { "epoch": 0.06, "learning_rate": 9.99995969290611e-06, "loss": 2.703, "step": 510 }, { "epoch": 0.06, "learning_rate": 9.999951228430154e-06, "loss": 2.7599, "step": 511 }, { "epoch": 0.06, "learning_rate": 9.999941957819112e-06, "loss": 2.6951, "step": 512 }, { "epoch": 0.06, "learning_rate": 9.999931881074477e-06, "loss": 2.557, "step": 513 }, { "epoch": 0.06, "learning_rate": 9.999920998197874e-06, "loss": 2.8728, "step": 514 }, { "epoch": 0.06, "learning_rate": 9.99990930919106e-06, "loss": 2.7927, "step": 515 }, { "epoch": 0.06, "learning_rate": 9.999896814055916e-06, "loss": 2.7068, "step": 516 }, { "epoch": 0.06, "learning_rate": 9.999883512794459e-06, "loss": 2.6488, "step": 517 }, { "epoch": 0.06, "learning_rate": 9.999869405408833e-06, "loss": 2.636, "step": 518 }, { "epoch": 0.06, "learning_rate": 9.999854491901312e-06, "loss": 2.8244, "step": 519 }, { "epoch": 0.06, "learning_rate": 9.999838772274303e-06, "loss": 2.6701, "step": 520 }, { "epoch": 0.06, "learning_rate": 9.999822246530337e-06, "loss": 2.8465, "step": 521 }, { "epoch": 0.06, "learning_rate": 9.99980491467208e-06, "loss": 2.6571, "step": 522 }, { "epoch": 0.06, "learning_rate": 9.999786776702327e-06, "loss": 2.5901, "step": 523 }, { "epoch": 0.06, "learning_rate": 9.999767832624e-06, "loss": 2.5644, "step": 524 }, { "epoch": 0.06, "learning_rate": 9.999748082440156e-06, "loss": 2.7344, "step": 525 }, { "epoch": 0.06, "learning_rate": 9.999727526153979e-06, "loss": 2.618, "step": 526 }, { "epoch": 0.06, "learning_rate": 9.99970616376878e-06, "loss": 2.5785, "step": 527 }, { "epoch": 0.06, "learning_rate": 9.999683995288008e-06, "loss": 2.6965, "step": 528 }, { "epoch": 0.06, "learning_rate": 9.999661020715234e-06, "loss": 2.5738, "step": 529 }, { "epoch": 0.06, "learning_rate": 9.999637240054163e-06, "loss": 2.8149, "step": 530 }, { "epoch": 0.06, "learning_rate": 9.999612653308631e-06, "loss": 2.7302, "step": 531 }, { "epoch": 0.06, "learning_rate": 9.999587260482597e-06, "loss": 2.8494, "step": 532 }, { "epoch": 0.06, "learning_rate": 9.999561061580161e-06, "loss": 2.722, "step": 533 }, { "epoch": 0.06, "learning_rate": 9.999534056605543e-06, "loss": 2.5865, "step": 534 }, { "epoch": 0.06, "learning_rate": 9.999506245563098e-06, "loss": 2.6119, "step": 535 }, { "epoch": 0.06, "learning_rate": 9.99947762845731e-06, "loss": 2.7701, "step": 536 }, { "epoch": 0.06, "learning_rate": 9.999448205292794e-06, "loss": 2.5768, "step": 537 }, { "epoch": 0.06, "learning_rate": 9.999417976074294e-06, "loss": 2.5837, "step": 538 }, { "epoch": 0.06, "learning_rate": 9.999386940806682e-06, "loss": 2.5491, "step": 539 }, { "epoch": 0.06, "learning_rate": 9.999355099494961e-06, "loss": 2.7923, "step": 540 }, { "epoch": 0.06, "learning_rate": 9.999322452144269e-06, "loss": 2.7359, "step": 541 }, { "epoch": 0.07, "learning_rate": 9.999288998759865e-06, "loss": 2.5339, "step": 542 }, { "epoch": 0.07, "learning_rate": 9.999254739347145e-06, "loss": 2.6716, "step": 543 }, { "epoch": 0.07, "learning_rate": 9.999219673911633e-06, "loss": 2.6797, "step": 544 }, { "epoch": 0.07, "learning_rate": 9.999183802458981e-06, "loss": 2.596, "step": 545 }, { "epoch": 0.07, "learning_rate": 9.999147124994974e-06, "loss": 2.6482, "step": 546 }, { "epoch": 0.07, "learning_rate": 9.999109641525524e-06, "loss": 2.732, "step": 547 }, { "epoch": 0.07, "learning_rate": 9.999071352056676e-06, "loss": 2.7887, "step": 548 }, { "epoch": 0.07, "learning_rate": 9.9990322565946e-06, "loss": 2.7436, "step": 549 }, { "epoch": 0.07, "learning_rate": 9.998992355145604e-06, "loss": 2.5541, "step": 550 }, { "epoch": 0.07, "learning_rate": 9.99895164771612e-06, "loss": 2.7401, "step": 551 }, { "epoch": 0.07, "learning_rate": 9.998910134312709e-06, "loss": 2.6659, "step": 552 }, { "epoch": 0.07, "learning_rate": 9.998867814942065e-06, "loss": 2.5018, "step": 553 }, { "epoch": 0.07, "learning_rate": 9.998824689611012e-06, "loss": 2.5397, "step": 554 }, { "epoch": 0.07, "learning_rate": 9.998780758326502e-06, "loss": 2.6798, "step": 555 }, { "epoch": 0.07, "learning_rate": 9.998736021095621e-06, "loss": 2.7053, "step": 556 }, { "epoch": 0.07, "learning_rate": 9.998690477925576e-06, "loss": 2.628, "step": 557 }, { "epoch": 0.07, "learning_rate": 9.998644128823716e-06, "loss": 2.7674, "step": 558 }, { "epoch": 0.07, "learning_rate": 9.99859697379751e-06, "loss": 2.642, "step": 559 }, { "epoch": 0.07, "learning_rate": 9.998549012854562e-06, "loss": 2.6768, "step": 560 }, { "epoch": 0.07, "learning_rate": 9.998500246002604e-06, "loss": 2.8044, "step": 561 }, { "epoch": 0.07, "learning_rate": 9.998450673249499e-06, "loss": 2.7895, "step": 562 }, { "epoch": 0.07, "learning_rate": 9.99840029460324e-06, "loss": 2.8164, "step": 563 }, { "epoch": 0.07, "learning_rate": 9.99834911007195e-06, "loss": 2.7666, "step": 564 }, { "epoch": 0.07, "learning_rate": 9.99829711966388e-06, "loss": 2.8012, "step": 565 }, { "epoch": 0.07, "learning_rate": 9.998244323387412e-06, "loss": 2.6359, "step": 566 }, { "epoch": 0.07, "learning_rate": 9.99819072125106e-06, "loss": 2.4737, "step": 567 }, { "epoch": 0.07, "learning_rate": 9.998136313263465e-06, "loss": 2.6361, "step": 568 }, { "epoch": 0.07, "learning_rate": 9.9980810994334e-06, "loss": 2.6834, "step": 569 }, { "epoch": 0.07, "learning_rate": 9.998025079769766e-06, "loss": 2.688, "step": 570 }, { "epoch": 0.07, "learning_rate": 9.997968254281595e-06, "loss": 2.6501, "step": 571 }, { "epoch": 0.07, "learning_rate": 9.99791062297805e-06, "loss": 2.7121, "step": 572 }, { "epoch": 0.07, "learning_rate": 9.997852185868424e-06, "loss": 2.5346, "step": 573 }, { "epoch": 0.07, "learning_rate": 9.997792942962135e-06, "loss": 2.6804, "step": 574 }, { "epoch": 0.07, "learning_rate": 9.997732894268737e-06, "loss": 2.8493, "step": 575 }, { "epoch": 0.07, "learning_rate": 9.997672039797912e-06, "loss": 2.6814, "step": 576 }, { "epoch": 0.07, "learning_rate": 9.99761037955947e-06, "loss": 2.793, "step": 577 }, { "epoch": 0.07, "learning_rate": 9.997547913563352e-06, "loss": 2.7212, "step": 578 }, { "epoch": 0.07, "learning_rate": 9.997484641819632e-06, "loss": 2.7028, "step": 579 }, { "epoch": 0.07, "learning_rate": 9.99742056433851e-06, "loss": 2.565, "step": 580 }, { "epoch": 0.07, "learning_rate": 9.997355681130313e-06, "loss": 2.6943, "step": 581 }, { "epoch": 0.07, "learning_rate": 9.99728999220551e-06, "loss": 2.829, "step": 582 }, { "epoch": 0.07, "learning_rate": 9.997223497574685e-06, "loss": 2.6748, "step": 583 }, { "epoch": 0.07, "learning_rate": 9.997156197248564e-06, "loss": 2.7285, "step": 584 }, { "epoch": 0.07, "learning_rate": 9.997088091237991e-06, "loss": 2.5982, "step": 585 }, { "epoch": 0.07, "learning_rate": 9.997019179553956e-06, "loss": 2.6312, "step": 586 }, { "epoch": 0.07, "learning_rate": 9.99694946220756e-06, "loss": 2.6924, "step": 587 }, { "epoch": 0.07, "learning_rate": 9.99687893921005e-06, "loss": 2.775, "step": 588 }, { "epoch": 0.07, "learning_rate": 9.996807610572793e-06, "loss": 2.555, "step": 589 }, { "epoch": 0.07, "learning_rate": 9.996735476307292e-06, "loss": 2.8272, "step": 590 }, { "epoch": 0.07, "learning_rate": 9.996662536425174e-06, "loss": 2.8104, "step": 591 }, { "epoch": 0.07, "learning_rate": 9.996588790938201e-06, "loss": 2.836, "step": 592 }, { "epoch": 0.07, "learning_rate": 9.996514239858263e-06, "loss": 2.5552, "step": 593 }, { "epoch": 0.07, "learning_rate": 9.996438883197378e-06, "loss": 2.5789, "step": 594 }, { "epoch": 0.07, "learning_rate": 9.996362720967698e-06, "loss": 2.8688, "step": 595 }, { "epoch": 0.07, "learning_rate": 9.996285753181499e-06, "loss": 2.6303, "step": 596 }, { "epoch": 0.07, "learning_rate": 9.996207979851195e-06, "loss": 2.5387, "step": 597 }, { "epoch": 0.07, "learning_rate": 9.996129400989322e-06, "loss": 2.6391, "step": 598 }, { "epoch": 0.07, "learning_rate": 9.99605001660855e-06, "loss": 2.6031, "step": 599 }, { "epoch": 0.07, "learning_rate": 9.995969826721679e-06, "loss": 2.7024, "step": 600 }, { "epoch": 0.07, "learning_rate": 9.995888831341636e-06, "loss": 2.5714, "step": 601 }, { "epoch": 0.07, "learning_rate": 9.995807030481481e-06, "loss": 2.6771, "step": 602 }, { "epoch": 0.07, "learning_rate": 9.995724424154403e-06, "loss": 2.6377, "step": 603 }, { "epoch": 0.07, "learning_rate": 9.99564101237372e-06, "loss": 2.7481, "step": 604 }, { "epoch": 0.07, "learning_rate": 9.99555679515288e-06, "loss": 2.7416, "step": 605 }, { "epoch": 0.07, "learning_rate": 9.995471772505461e-06, "loss": 2.7858, "step": 606 }, { "epoch": 0.07, "learning_rate": 9.995385944445173e-06, "loss": 2.5898, "step": 607 }, { "epoch": 0.07, "learning_rate": 9.99529931098585e-06, "loss": 2.6378, "step": 608 }, { "epoch": 0.07, "learning_rate": 9.995211872141466e-06, "loss": 2.7951, "step": 609 }, { "epoch": 0.07, "learning_rate": 9.995123627926113e-06, "loss": 2.6203, "step": 610 }, { "epoch": 0.07, "learning_rate": 9.995034578354022e-06, "loss": 2.7581, "step": 611 }, { "epoch": 0.07, "learning_rate": 9.994944723439546e-06, "loss": 2.7019, "step": 612 }, { "epoch": 0.07, "learning_rate": 9.994854063197176e-06, "loss": 2.5173, "step": 613 }, { "epoch": 0.07, "learning_rate": 9.99476259764153e-06, "loss": 2.7236, "step": 614 }, { "epoch": 0.07, "learning_rate": 9.994670326787351e-06, "loss": 2.7883, "step": 615 }, { "epoch": 0.07, "learning_rate": 9.994577250649519e-06, "loss": 2.6469, "step": 616 }, { "epoch": 0.07, "learning_rate": 9.994483369243038e-06, "loss": 2.759, "step": 617 }, { "epoch": 0.07, "learning_rate": 9.994388682583045e-06, "loss": 2.5253, "step": 618 }, { "epoch": 0.07, "learning_rate": 9.994293190684809e-06, "loss": 2.6467, "step": 619 }, { "epoch": 0.07, "learning_rate": 9.994196893563722e-06, "loss": 2.6278, "step": 620 }, { "epoch": 0.07, "learning_rate": 9.994099791235311e-06, "loss": 2.7281, "step": 621 }, { "epoch": 0.07, "learning_rate": 9.994001883715234e-06, "loss": 2.7038, "step": 622 }, { "epoch": 0.07, "learning_rate": 9.993903171019272e-06, "loss": 2.7874, "step": 623 }, { "epoch": 0.07, "learning_rate": 9.993803653163346e-06, "loss": 2.7049, "step": 624 }, { "epoch": 0.08, "learning_rate": 9.993703330163497e-06, "loss": 2.5307, "step": 625 }, { "epoch": 0.08, "learning_rate": 9.993602202035902e-06, "loss": 2.7684, "step": 626 }, { "epoch": 0.08, "learning_rate": 9.993500268796863e-06, "loss": 2.6364, "step": 627 }, { "epoch": 0.08, "learning_rate": 9.993397530462818e-06, "loss": 2.6076, "step": 628 }, { "epoch": 0.08, "learning_rate": 9.993293987050328e-06, "loss": 2.7699, "step": 629 }, { "epoch": 0.08, "learning_rate": 9.99318963857609e-06, "loss": 2.7259, "step": 630 }, { "epoch": 0.08, "learning_rate": 9.993084485056928e-06, "loss": 2.5497, "step": 631 }, { "epoch": 0.08, "learning_rate": 9.992978526509794e-06, "loss": 2.6458, "step": 632 }, { "epoch": 0.08, "learning_rate": 9.99287176295177e-06, "loss": 2.6104, "step": 633 }, { "epoch": 0.08, "learning_rate": 9.992764194400075e-06, "loss": 2.7969, "step": 634 }, { "epoch": 0.08, "learning_rate": 9.992655820872045e-06, "loss": 2.5573, "step": 635 }, { "epoch": 0.08, "learning_rate": 9.99254664238516e-06, "loss": 2.7115, "step": 636 }, { "epoch": 0.08, "learning_rate": 9.992436658957018e-06, "loss": 2.7499, "step": 637 }, { "epoch": 0.08, "learning_rate": 9.992325870605353e-06, "loss": 2.7235, "step": 638 }, { "epoch": 0.08, "learning_rate": 9.992214277348025e-06, "loss": 2.7157, "step": 639 }, { "epoch": 0.08, "learning_rate": 9.99210187920303e-06, "loss": 2.7748, "step": 640 }, { "epoch": 0.08, "learning_rate": 9.991988676188486e-06, "loss": 2.6614, "step": 641 }, { "epoch": 0.08, "learning_rate": 9.991874668322648e-06, "loss": 2.6307, "step": 642 }, { "epoch": 0.08, "learning_rate": 9.991759855623895e-06, "loss": 2.6769, "step": 643 }, { "epoch": 0.08, "learning_rate": 9.991644238110741e-06, "loss": 2.6164, "step": 644 }, { "epoch": 0.08, "learning_rate": 9.991527815801822e-06, "loss": 2.6349, "step": 645 }, { "epoch": 0.08, "learning_rate": 9.991410588715911e-06, "loss": 2.6492, "step": 646 }, { "epoch": 0.08, "learning_rate": 9.99129255687191e-06, "loss": 2.7794, "step": 647 }, { "epoch": 0.08, "learning_rate": 9.991173720288847e-06, "loss": 2.6926, "step": 648 }, { "epoch": 0.08, "learning_rate": 9.991054078985882e-06, "loss": 2.6104, "step": 649 }, { "epoch": 0.08, "learning_rate": 9.990933632982307e-06, "loss": 2.6673, "step": 650 }, { "epoch": 0.08, "learning_rate": 9.990812382297538e-06, "loss": 2.8701, "step": 651 }, { "epoch": 0.08, "learning_rate": 9.990690326951126e-06, "loss": 2.7313, "step": 652 }, { "epoch": 0.08, "learning_rate": 9.990567466962749e-06, "loss": 2.7137, "step": 653 }, { "epoch": 0.08, "learning_rate": 9.990443802352216e-06, "loss": 2.7408, "step": 654 }, { "epoch": 0.08, "learning_rate": 9.990319333139466e-06, "loss": 2.758, "step": 655 }, { "epoch": 0.08, "learning_rate": 9.990194059344565e-06, "loss": 2.7648, "step": 656 }, { "epoch": 0.08, "learning_rate": 9.990067980987712e-06, "loss": 2.6133, "step": 657 }, { "epoch": 0.08, "learning_rate": 9.989941098089235e-06, "loss": 2.634, "step": 658 }, { "epoch": 0.08, "learning_rate": 9.98981341066959e-06, "loss": 2.7225, "step": 659 }, { "epoch": 0.08, "learning_rate": 9.989684918749365e-06, "loss": 2.624, "step": 660 }, { "epoch": 0.08, "learning_rate": 9.989555622349276e-06, "loss": 2.6906, "step": 661 }, { "epoch": 0.08, "learning_rate": 9.989425521490169e-06, "loss": 2.581, "step": 662 }, { "epoch": 0.08, "learning_rate": 9.989294616193018e-06, "loss": 2.6416, "step": 663 }, { "epoch": 0.08, "learning_rate": 9.989162906478933e-06, "loss": 2.4916, "step": 664 }, { "epoch": 0.08, "learning_rate": 9.989030392369147e-06, "loss": 2.7408, "step": 665 }, { "epoch": 0.08, "learning_rate": 9.988897073885024e-06, "loss": 2.671, "step": 666 }, { "epoch": 0.08, "learning_rate": 9.988762951048062e-06, "loss": 2.6259, "step": 667 }, { "epoch": 0.08, "learning_rate": 9.988628023879883e-06, "loss": 2.561, "step": 668 }, { "epoch": 0.08, "learning_rate": 9.98849229240224e-06, "loss": 2.5333, "step": 669 }, { "epoch": 0.08, "learning_rate": 9.98835575663702e-06, "loss": 2.6159, "step": 670 }, { "epoch": 0.08, "learning_rate": 9.988218416606234e-06, "loss": 2.7005, "step": 671 }, { "epoch": 0.08, "learning_rate": 9.988080272332028e-06, "loss": 2.6932, "step": 672 }, { "epoch": 0.08, "learning_rate": 9.987941323836671e-06, "loss": 2.7513, "step": 673 }, { "epoch": 0.08, "learning_rate": 9.987801571142569e-06, "loss": 2.7071, "step": 674 }, { "epoch": 0.08, "learning_rate": 9.98766101427225e-06, "loss": 2.6824, "step": 675 }, { "epoch": 0.08, "learning_rate": 9.98751965324838e-06, "loss": 2.6819, "step": 676 }, { "epoch": 0.08, "learning_rate": 9.987377488093746e-06, "loss": 2.6191, "step": 677 }, { "epoch": 0.08, "learning_rate": 9.987234518831273e-06, "loss": 2.6233, "step": 678 }, { "epoch": 0.08, "learning_rate": 9.987090745484011e-06, "loss": 2.5139, "step": 679 }, { "epoch": 0.08, "learning_rate": 9.98694616807514e-06, "loss": 2.6586, "step": 680 }, { "epoch": 0.08, "learning_rate": 9.986800786627969e-06, "loss": 2.6545, "step": 681 }, { "epoch": 0.08, "learning_rate": 9.98665460116594e-06, "loss": 2.6103, "step": 682 }, { "epoch": 0.08, "learning_rate": 9.98650761171262e-06, "loss": 2.6391, "step": 683 }, { "epoch": 0.08, "learning_rate": 9.986359818291706e-06, "loss": 2.7295, "step": 684 }, { "epoch": 0.08, "learning_rate": 9.986211220927032e-06, "loss": 2.6726, "step": 685 }, { "epoch": 0.08, "learning_rate": 9.986061819642554e-06, "loss": 2.7735, "step": 686 }, { "epoch": 0.08, "learning_rate": 9.985911614462358e-06, "loss": 2.6624, "step": 687 }, { "epoch": 0.08, "learning_rate": 9.985760605410662e-06, "loss": 2.6959, "step": 688 }, { "epoch": 0.08, "learning_rate": 9.985608792511813e-06, "loss": 2.742, "step": 689 }, { "epoch": 0.08, "learning_rate": 9.98545617579029e-06, "loss": 2.5758, "step": 690 }, { "epoch": 0.08, "learning_rate": 9.985302755270695e-06, "loss": 2.544, "step": 691 }, { "epoch": 0.08, "learning_rate": 9.985148530977767e-06, "loss": 2.6583, "step": 692 }, { "epoch": 0.08, "learning_rate": 9.984993502936369e-06, "loss": 2.5515, "step": 693 }, { "epoch": 0.08, "learning_rate": 9.984837671171498e-06, "loss": 2.6473, "step": 694 }, { "epoch": 0.08, "learning_rate": 9.984681035708279e-06, "loss": 2.6459, "step": 695 }, { "epoch": 0.08, "learning_rate": 9.984523596571964e-06, "loss": 2.5454, "step": 696 }, { "epoch": 0.08, "learning_rate": 9.984365353787938e-06, "loss": 2.5949, "step": 697 }, { "epoch": 0.08, "learning_rate": 9.984206307381714e-06, "loss": 2.6478, "step": 698 }, { "epoch": 0.08, "learning_rate": 9.984046457378935e-06, "loss": 2.6056, "step": 699 }, { "epoch": 0.08, "learning_rate": 9.983885803805373e-06, "loss": 2.6816, "step": 700 }, { "epoch": 0.08, "learning_rate": 9.983724346686929e-06, "loss": 2.5684, "step": 701 }, { "epoch": 0.08, "learning_rate": 9.983562086049636e-06, "loss": 2.8159, "step": 702 }, { "epoch": 0.08, "learning_rate": 9.983399021919655e-06, "loss": 2.6108, "step": 703 }, { "epoch": 0.08, "learning_rate": 9.983235154323276e-06, "loss": 2.6073, "step": 704 }, { "epoch": 0.08, "learning_rate": 9.983070483286919e-06, "loss": 2.7053, "step": 705 }, { "epoch": 0.08, "learning_rate": 9.982905008837133e-06, "loss": 2.7898, "step": 706 }, { "epoch": 0.08, "learning_rate": 9.982738731000602e-06, "loss": 2.6836, "step": 707 }, { "epoch": 0.09, "learning_rate": 9.982571649804126e-06, "loss": 2.7115, "step": 708 }, { "epoch": 0.09, "learning_rate": 9.982403765274652e-06, "loss": 2.7248, "step": 709 }, { "epoch": 0.09, "learning_rate": 9.982235077439242e-06, "loss": 2.6297, "step": 710 }, { "epoch": 0.09, "learning_rate": 9.982065586325096e-06, "loss": 2.7146, "step": 711 }, { "epoch": 0.09, "learning_rate": 9.981895291959541e-06, "loss": 2.8611, "step": 712 }, { "epoch": 0.09, "learning_rate": 9.98172419437003e-06, "loss": 2.656, "step": 713 }, { "epoch": 0.09, "learning_rate": 9.981552293584154e-06, "loss": 2.6716, "step": 714 }, { "epoch": 0.09, "learning_rate": 9.981379589629624e-06, "loss": 2.5776, "step": 715 }, { "epoch": 0.09, "learning_rate": 9.981206082534287e-06, "loss": 2.5523, "step": 716 }, { "epoch": 0.09, "learning_rate": 9.981031772326118e-06, "loss": 2.7048, "step": 717 }, { "epoch": 0.09, "learning_rate": 9.980856659033216e-06, "loss": 2.7631, "step": 718 }, { "epoch": 0.09, "learning_rate": 9.980680742683822e-06, "loss": 2.6329, "step": 719 }, { "epoch": 0.09, "learning_rate": 9.98050402330629e-06, "loss": 2.6379, "step": 720 }, { "epoch": 0.09, "learning_rate": 9.980326500929121e-06, "loss": 2.7127, "step": 721 }, { "epoch": 0.09, "learning_rate": 9.98014817558093e-06, "loss": 2.6222, "step": 722 }, { "epoch": 0.09, "learning_rate": 9.979969047290472e-06, "loss": 2.6534, "step": 723 }, { "epoch": 0.09, "learning_rate": 9.979789116086625e-06, "loss": 2.6033, "step": 724 }, { "epoch": 0.09, "learning_rate": 9.9796083819984e-06, "loss": 2.9023, "step": 725 }, { "epoch": 0.09, "learning_rate": 9.979426845054938e-06, "loss": 2.6704, "step": 726 }, { "epoch": 0.09, "learning_rate": 9.979244505285505e-06, "loss": 2.5729, "step": 727 }, { "epoch": 0.09, "learning_rate": 9.979061362719502e-06, "loss": 2.7437, "step": 728 }, { "epoch": 0.09, "learning_rate": 9.978877417386456e-06, "loss": 2.6636, "step": 729 }, { "epoch": 0.09, "learning_rate": 9.978692669316024e-06, "loss": 2.8921, "step": 730 }, { "epoch": 0.09, "learning_rate": 9.978507118537994e-06, "loss": 2.8422, "step": 731 }, { "epoch": 0.09, "learning_rate": 9.97832076508228e-06, "loss": 2.8175, "step": 732 }, { "epoch": 0.09, "learning_rate": 9.978133608978927e-06, "loss": 2.6225, "step": 733 }, { "epoch": 0.09, "learning_rate": 9.977945650258111e-06, "loss": 2.6151, "step": 734 }, { "epoch": 0.09, "learning_rate": 9.977756888950139e-06, "loss": 2.4018, "step": 735 }, { "epoch": 0.09, "learning_rate": 9.977567325085442e-06, "loss": 2.6013, "step": 736 }, { "epoch": 0.09, "learning_rate": 9.977376958694583e-06, "loss": 2.5516, "step": 737 }, { "epoch": 0.09, "learning_rate": 9.977185789808254e-06, "loss": 2.6465, "step": 738 }, { "epoch": 0.09, "learning_rate": 9.97699381845728e-06, "loss": 2.7325, "step": 739 }, { "epoch": 0.09, "learning_rate": 9.976801044672608e-06, "loss": 2.7577, "step": 740 }, { "epoch": 0.09, "learning_rate": 9.97660746848532e-06, "loss": 2.632, "step": 741 }, { "epoch": 0.09, "learning_rate": 9.976413089926629e-06, "loss": 2.8808, "step": 742 }, { "epoch": 0.09, "learning_rate": 9.976217909027872e-06, "loss": 2.8911, "step": 743 }, { "epoch": 0.09, "learning_rate": 9.976021925820516e-06, "loss": 2.6939, "step": 744 }, { "epoch": 0.09, "learning_rate": 9.975825140336163e-06, "loss": 2.6575, "step": 745 }, { "epoch": 0.09, "learning_rate": 9.975627552606538e-06, "loss": 2.7469, "step": 746 }, { "epoch": 0.09, "learning_rate": 9.975429162663498e-06, "loss": 2.623, "step": 747 }, { "epoch": 0.09, "learning_rate": 9.97522997053903e-06, "loss": 2.6184, "step": 748 }, { "epoch": 0.09, "learning_rate": 9.975029976265248e-06, "loss": 2.632, "step": 749 }, { "epoch": 0.09, "learning_rate": 9.974829179874398e-06, "loss": 2.674, "step": 750 }, { "epoch": 0.09, "learning_rate": 9.974627581398853e-06, "loss": 2.6871, "step": 751 }, { "epoch": 0.09, "learning_rate": 9.974425180871118e-06, "loss": 2.678, "step": 752 }, { "epoch": 0.09, "learning_rate": 9.974221978323824e-06, "loss": 2.7658, "step": 753 }, { "epoch": 0.09, "learning_rate": 9.974017973789735e-06, "loss": 2.6934, "step": 754 }, { "epoch": 0.09, "learning_rate": 9.973813167301743e-06, "loss": 2.6184, "step": 755 }, { "epoch": 0.09, "learning_rate": 9.973607558892864e-06, "loss": 2.8569, "step": 756 }, { "epoch": 0.09, "learning_rate": 9.973401148596251e-06, "loss": 2.6307, "step": 757 }, { "epoch": 0.09, "learning_rate": 9.973193936445185e-06, "loss": 2.4401, "step": 758 }, { "epoch": 0.09, "learning_rate": 9.972985922473073e-06, "loss": 2.744, "step": 759 }, { "epoch": 0.09, "learning_rate": 9.972777106713452e-06, "loss": 2.8363, "step": 760 }, { "epoch": 0.09, "learning_rate": 9.972567489199987e-06, "loss": 2.5208, "step": 761 }, { "epoch": 0.09, "learning_rate": 9.97235706996648e-06, "loss": 2.572, "step": 762 }, { "epoch": 0.09, "learning_rate": 9.972145849046853e-06, "loss": 2.7874, "step": 763 }, { "epoch": 0.09, "learning_rate": 9.971933826475162e-06, "loss": 2.5977, "step": 764 }, { "epoch": 0.09, "learning_rate": 9.971721002285589e-06, "loss": 2.4596, "step": 765 }, { "epoch": 0.09, "learning_rate": 9.971507376512449e-06, "loss": 2.6819, "step": 766 }, { "epoch": 0.09, "learning_rate": 9.971292949190185e-06, "loss": 2.7796, "step": 767 }, { "epoch": 0.09, "learning_rate": 9.971077720353368e-06, "loss": 2.7317, "step": 768 }, { "epoch": 0.09, "learning_rate": 9.9708616900367e-06, "loss": 2.6484, "step": 769 }, { "epoch": 0.09, "learning_rate": 9.970644858275008e-06, "loss": 2.5201, "step": 770 }, { "epoch": 0.09, "learning_rate": 9.970427225103257e-06, "loss": 2.6916, "step": 771 }, { "epoch": 0.09, "learning_rate": 9.970208790556531e-06, "loss": 2.7888, "step": 772 }, { "epoch": 0.09, "learning_rate": 9.96998955467005e-06, "loss": 2.7053, "step": 773 }, { "epoch": 0.09, "learning_rate": 9.969769517479162e-06, "loss": 2.8093, "step": 774 }, { "epoch": 0.09, "learning_rate": 9.96954867901934e-06, "loss": 2.7505, "step": 775 }, { "epoch": 0.09, "learning_rate": 9.969327039326193e-06, "loss": 2.5734, "step": 776 }, { "epoch": 0.09, "learning_rate": 9.969104598435454e-06, "loss": 2.5812, "step": 777 }, { "epoch": 0.09, "learning_rate": 9.968881356382985e-06, "loss": 2.5958, "step": 778 }, { "epoch": 0.09, "learning_rate": 9.968657313204783e-06, "loss": 2.6269, "step": 779 }, { "epoch": 0.09, "learning_rate": 9.968432468936967e-06, "loss": 2.492, "step": 780 }, { "epoch": 0.09, "learning_rate": 9.96820682361579e-06, "loss": 2.6069, "step": 781 }, { "epoch": 0.09, "learning_rate": 9.967980377277632e-06, "loss": 2.704, "step": 782 }, { "epoch": 0.09, "learning_rate": 9.967753129959e-06, "loss": 2.6147, "step": 783 }, { "epoch": 0.09, "learning_rate": 9.96752508169654e-06, "loss": 2.8338, "step": 784 }, { "epoch": 0.09, "learning_rate": 9.967296232527013e-06, "loss": 2.9013, "step": 785 }, { "epoch": 0.09, "learning_rate": 9.967066582487317e-06, "loss": 2.5386, "step": 786 }, { "epoch": 0.09, "learning_rate": 9.96683613161448e-06, "loss": 2.8145, "step": 787 }, { "epoch": 0.09, "learning_rate": 9.966604879945659e-06, "loss": 2.4897, "step": 788 }, { "epoch": 0.09, "learning_rate": 9.966372827518133e-06, "loss": 2.5608, "step": 789 }, { "epoch": 0.09, "learning_rate": 9.96613997436932e-06, "loss": 2.6553, "step": 790 }, { "epoch": 0.1, "learning_rate": 9.96590632053676e-06, "loss": 2.5605, "step": 791 }, { "epoch": 0.1, "learning_rate": 9.965671866058126e-06, "loss": 2.6024, "step": 792 }, { "epoch": 0.1, "learning_rate": 9.965436610971219e-06, "loss": 2.6897, "step": 793 }, { "epoch": 0.1, "learning_rate": 9.96520055531397e-06, "loss": 2.634, "step": 794 }, { "epoch": 0.1, "learning_rate": 9.964963699124434e-06, "loss": 2.6553, "step": 795 }, { "epoch": 0.1, "learning_rate": 9.964726042440802e-06, "loss": 2.6558, "step": 796 }, { "epoch": 0.1, "learning_rate": 9.96448758530139e-06, "loss": 2.681, "step": 797 }, { "epoch": 0.1, "learning_rate": 9.964248327744645e-06, "loss": 2.6811, "step": 798 }, { "epoch": 0.1, "learning_rate": 9.964008269809142e-06, "loss": 2.7352, "step": 799 }, { "epoch": 0.1, "learning_rate": 9.963767411533584e-06, "loss": 2.5464, "step": 800 }, { "epoch": 0.1, "learning_rate": 9.963525752956805e-06, "loss": 2.6996, "step": 801 }, { "epoch": 0.1, "learning_rate": 9.963283294117768e-06, "loss": 2.6565, "step": 802 }, { "epoch": 0.1, "learning_rate": 9.963040035055562e-06, "loss": 2.6059, "step": 803 }, { "epoch": 0.1, "learning_rate": 9.962795975809411e-06, "loss": 2.773, "step": 804 }, { "epoch": 0.1, "learning_rate": 9.962551116418662e-06, "loss": 2.792, "step": 805 }, { "epoch": 0.1, "learning_rate": 9.962305456922792e-06, "loss": 2.6749, "step": 806 }, { "epoch": 0.1, "learning_rate": 9.962058997361413e-06, "loss": 2.7405, "step": 807 }, { "epoch": 0.1, "learning_rate": 9.961811737774256e-06, "loss": 2.6446, "step": 808 }, { "epoch": 0.1, "learning_rate": 9.961563678201187e-06, "loss": 2.5141, "step": 809 }, { "epoch": 0.1, "learning_rate": 9.961314818682205e-06, "loss": 2.7463, "step": 810 }, { "epoch": 0.1, "learning_rate": 9.961065159257428e-06, "loss": 2.6984, "step": 811 }, { "epoch": 0.1, "learning_rate": 9.960814699967112e-06, "loss": 2.6402, "step": 812 }, { "epoch": 0.1, "learning_rate": 9.960563440851636e-06, "loss": 2.7279, "step": 813 }, { "epoch": 0.1, "learning_rate": 9.96031138195151e-06, "loss": 2.7699, "step": 814 }, { "epoch": 0.1, "learning_rate": 9.960058523307375e-06, "loss": 2.6444, "step": 815 }, { "epoch": 0.1, "learning_rate": 9.959804864959996e-06, "loss": 2.5227, "step": 816 }, { "epoch": 0.1, "learning_rate": 9.959550406950273e-06, "loss": 2.7408, "step": 817 }, { "epoch": 0.1, "learning_rate": 9.959295149319233e-06, "loss": 2.7429, "step": 818 }, { "epoch": 0.1, "learning_rate": 9.959039092108025e-06, "loss": 2.7074, "step": 819 }, { "epoch": 0.1, "learning_rate": 9.958782235357938e-06, "loss": 2.6348, "step": 820 }, { "epoch": 0.1, "learning_rate": 9.958524579110384e-06, "loss": 2.7218, "step": 821 }, { "epoch": 0.1, "learning_rate": 9.958266123406901e-06, "loss": 2.7546, "step": 822 }, { "epoch": 0.1, "learning_rate": 9.958006868289164e-06, "loss": 2.7894, "step": 823 }, { "epoch": 0.1, "learning_rate": 9.95774681379897e-06, "loss": 2.6929, "step": 824 }, { "epoch": 0.1, "learning_rate": 9.957485959978246e-06, "loss": 2.8333, "step": 825 }, { "epoch": 0.1, "learning_rate": 9.957224306869053e-06, "loss": 2.7111, "step": 826 }, { "epoch": 0.1, "learning_rate": 9.956961854513574e-06, "loss": 2.7532, "step": 827 }, { "epoch": 0.1, "learning_rate": 9.956698602954124e-06, "loss": 2.6462, "step": 828 }, { "epoch": 0.1, "learning_rate": 9.956434552233147e-06, "loss": 2.4514, "step": 829 }, { "epoch": 0.1, "learning_rate": 9.956169702393215e-06, "loss": 2.6819, "step": 830 }, { "epoch": 0.1, "learning_rate": 9.95590405347703e-06, "loss": 2.8479, "step": 831 }, { "epoch": 0.1, "learning_rate": 9.955637605527425e-06, "loss": 2.5551, "step": 832 }, { "epoch": 0.1, "learning_rate": 9.955370358587354e-06, "loss": 2.7663, "step": 833 }, { "epoch": 0.1, "learning_rate": 9.955102312699905e-06, "loss": 2.7017, "step": 834 }, { "epoch": 0.1, "learning_rate": 9.9548334679083e-06, "loss": 2.6073, "step": 835 }, { "epoch": 0.1, "learning_rate": 9.954563824255879e-06, "loss": 2.85, "step": 836 }, { "epoch": 0.1, "learning_rate": 9.95429338178612e-06, "loss": 2.6695, "step": 837 }, { "epoch": 0.1, "learning_rate": 9.954022140542622e-06, "loss": 2.4893, "step": 838 }, { "epoch": 0.1, "learning_rate": 9.953750100569122e-06, "loss": 2.7494, "step": 839 }, { "epoch": 0.1, "learning_rate": 9.953477261909478e-06, "loss": 2.5879, "step": 840 }, { "epoch": 0.1, "learning_rate": 9.953203624607679e-06, "loss": 2.8848, "step": 841 }, { "epoch": 0.1, "learning_rate": 9.952929188707843e-06, "loss": 2.5864, "step": 842 }, { "epoch": 0.1, "learning_rate": 9.952653954254218e-06, "loss": 2.6576, "step": 843 }, { "epoch": 0.1, "learning_rate": 9.952377921291179e-06, "loss": 2.6337, "step": 844 }, { "epoch": 0.1, "learning_rate": 9.952101089863232e-06, "loss": 2.7645, "step": 845 }, { "epoch": 0.1, "learning_rate": 9.951823460015004e-06, "loss": 2.6757, "step": 846 }, { "epoch": 0.1, "learning_rate": 9.951545031791265e-06, "loss": 2.7233, "step": 847 }, { "epoch": 0.1, "learning_rate": 9.951265805236903e-06, "loss": 2.7793, "step": 848 }, { "epoch": 0.1, "learning_rate": 9.950985780396934e-06, "loss": 2.754, "step": 849 }, { "epoch": 0.1, "learning_rate": 9.95070495731651e-06, "loss": 2.7755, "step": 850 }, { "epoch": 0.1, "learning_rate": 9.950423336040904e-06, "loss": 2.678, "step": 851 }, { "epoch": 0.1, "learning_rate": 9.950140916615526e-06, "loss": 2.5232, "step": 852 }, { "epoch": 0.1, "learning_rate": 9.949857699085907e-06, "loss": 2.5793, "step": 853 }, { "epoch": 0.1, "learning_rate": 9.94957368349771e-06, "loss": 2.595, "step": 854 }, { "epoch": 0.1, "learning_rate": 9.949288869896727e-06, "loss": 2.8473, "step": 855 }, { "epoch": 0.1, "learning_rate": 9.949003258328878e-06, "loss": 2.5512, "step": 856 }, { "epoch": 0.1, "learning_rate": 9.948716848840211e-06, "loss": 2.6794, "step": 857 }, { "epoch": 0.1, "learning_rate": 9.948429641476905e-06, "loss": 2.6545, "step": 858 }, { "epoch": 0.1, "learning_rate": 9.948141636285264e-06, "loss": 2.4357, "step": 859 }, { "epoch": 0.1, "learning_rate": 9.947852833311725e-06, "loss": 2.6344, "step": 860 }, { "epoch": 0.1, "learning_rate": 9.94756323260285e-06, "loss": 2.5807, "step": 861 }, { "epoch": 0.1, "learning_rate": 9.94727283420533e-06, "loss": 2.575, "step": 862 }, { "epoch": 0.1, "learning_rate": 9.946981638165987e-06, "loss": 2.7577, "step": 863 }, { "epoch": 0.1, "learning_rate": 9.94668964453177e-06, "loss": 2.7748, "step": 864 }, { "epoch": 0.1, "learning_rate": 9.946396853349756e-06, "loss": 2.7502, "step": 865 }, { "epoch": 0.1, "learning_rate": 9.946103264667151e-06, "loss": 2.6322, "step": 866 }, { "epoch": 0.1, "learning_rate": 9.945808878531291e-06, "loss": 2.5729, "step": 867 }, { "epoch": 0.1, "learning_rate": 9.94551369498964e-06, "loss": 2.6847, "step": 868 }, { "epoch": 0.1, "learning_rate": 9.945217714089787e-06, "loss": 2.7741, "step": 869 }, { "epoch": 0.1, "learning_rate": 9.944920935879456e-06, "loss": 2.6681, "step": 870 }, { "epoch": 0.1, "learning_rate": 9.944623360406496e-06, "loss": 2.773, "step": 871 }, { "epoch": 0.1, "learning_rate": 9.94432498771888e-06, "loss": 2.8415, "step": 872 }, { "epoch": 0.1, "learning_rate": 9.944025817864722e-06, "loss": 2.7011, "step": 873 }, { "epoch": 0.1, "learning_rate": 9.943725850892249e-06, "loss": 2.7413, "step": 874 }, { "epoch": 0.11, "learning_rate": 9.943425086849829e-06, "loss": 2.6027, "step": 875 }, { "epoch": 0.11, "learning_rate": 9.943123525785952e-06, "loss": 2.5397, "step": 876 }, { "epoch": 0.11, "learning_rate": 9.942821167749239e-06, "loss": 2.8096, "step": 877 }, { "epoch": 0.11, "learning_rate": 9.942518012788438e-06, "loss": 2.5149, "step": 878 }, { "epoch": 0.11, "learning_rate": 9.942214060952426e-06, "loss": 2.5931, "step": 879 }, { "epoch": 0.11, "learning_rate": 9.94190931229021e-06, "loss": 2.747, "step": 880 }, { "epoch": 0.11, "learning_rate": 9.941603766850924e-06, "loss": 2.4034, "step": 881 }, { "epoch": 0.11, "learning_rate": 9.941297424683832e-06, "loss": 2.5628, "step": 882 }, { "epoch": 0.11, "learning_rate": 9.94099028583832e-06, "loss": 2.6205, "step": 883 }, { "epoch": 0.11, "learning_rate": 9.940682350363913e-06, "loss": 2.6363, "step": 884 }, { "epoch": 0.11, "learning_rate": 9.940373618310255e-06, "loss": 2.5571, "step": 885 }, { "epoch": 0.11, "learning_rate": 9.940064089727127e-06, "loss": 2.6705, "step": 886 }, { "epoch": 0.11, "learning_rate": 9.939753764664428e-06, "loss": 2.4719, "step": 887 }, { "epoch": 0.11, "learning_rate": 9.939442643172197e-06, "loss": 2.6, "step": 888 }, { "epoch": 0.11, "learning_rate": 9.939130725300592e-06, "loss": 2.5352, "step": 889 }, { "epoch": 0.11, "learning_rate": 9.938818011099906e-06, "loss": 2.5904, "step": 890 }, { "epoch": 0.11, "learning_rate": 9.938504500620554e-06, "loss": 2.4875, "step": 891 }, { "epoch": 0.11, "learning_rate": 9.938190193913084e-06, "loss": 2.7945, "step": 892 }, { "epoch": 0.11, "learning_rate": 9.937875091028173e-06, "loss": 2.6087, "step": 893 }, { "epoch": 0.11, "learning_rate": 9.937559192016624e-06, "loss": 2.7428, "step": 894 }, { "epoch": 0.11, "learning_rate": 9.937242496929367e-06, "loss": 2.5869, "step": 895 }, { "epoch": 0.11, "learning_rate": 9.936925005817464e-06, "loss": 2.5228, "step": 896 }, { "epoch": 0.11, "learning_rate": 9.936606718732103e-06, "loss": 2.569, "step": 897 }, { "epoch": 0.11, "learning_rate": 9.936287635724601e-06, "loss": 2.5986, "step": 898 }, { "epoch": 0.11, "learning_rate": 9.935967756846406e-06, "loss": 2.7891, "step": 899 }, { "epoch": 0.11, "learning_rate": 9.935647082149088e-06, "loss": 2.7049, "step": 900 }, { "epoch": 0.11, "learning_rate": 9.935325611684348e-06, "loss": 2.668, "step": 901 }, { "epoch": 0.11, "learning_rate": 9.93500334550402e-06, "loss": 2.5601, "step": 902 }, { "epoch": 0.11, "learning_rate": 9.93468028366006e-06, "loss": 2.5658, "step": 903 }, { "epoch": 0.11, "learning_rate": 9.934356426204557e-06, "loss": 2.7243, "step": 904 }, { "epoch": 0.11, "learning_rate": 9.934031773189724e-06, "loss": 2.7012, "step": 905 }, { "epoch": 0.11, "learning_rate": 9.933706324667906e-06, "loss": 2.6517, "step": 906 }, { "epoch": 0.11, "learning_rate": 9.933380080691573e-06, "loss": 2.7875, "step": 907 }, { "epoch": 0.11, "learning_rate": 9.933053041313325e-06, "loss": 2.7827, "step": 908 }, { "epoch": 0.11, "learning_rate": 9.932725206585892e-06, "loss": 2.6219, "step": 909 }, { "epoch": 0.11, "learning_rate": 9.932396576562128e-06, "loss": 2.8049, "step": 910 }, { "epoch": 0.11, "learning_rate": 9.932067151295018e-06, "loss": 2.7362, "step": 911 }, { "epoch": 0.11, "learning_rate": 9.931736930837676e-06, "loss": 2.5993, "step": 912 }, { "epoch": 0.11, "learning_rate": 9.931405915243343e-06, "loss": 2.7668, "step": 913 }, { "epoch": 0.11, "learning_rate": 9.931074104565387e-06, "loss": 2.6353, "step": 914 }, { "epoch": 0.11, "learning_rate": 9.930741498857307e-06, "loss": 2.4801, "step": 915 }, { "epoch": 0.11, "learning_rate": 9.930408098172725e-06, "loss": 2.5892, "step": 916 }, { "epoch": 0.11, "learning_rate": 9.930073902565397e-06, "loss": 2.7477, "step": 917 }, { "epoch": 0.11, "learning_rate": 9.929738912089207e-06, "loss": 2.4668, "step": 918 }, { "epoch": 0.11, "learning_rate": 9.929403126798162e-06, "loss": 2.6532, "step": 919 }, { "epoch": 0.11, "learning_rate": 9.929066546746403e-06, "loss": 2.6674, "step": 920 }, { "epoch": 0.11, "learning_rate": 9.928729171988191e-06, "loss": 2.5192, "step": 921 }, { "epoch": 0.11, "learning_rate": 9.928391002577926e-06, "loss": 2.6031, "step": 922 }, { "epoch": 0.11, "learning_rate": 9.928052038570129e-06, "loss": 2.7143, "step": 923 }, { "epoch": 0.11, "learning_rate": 9.92771228001945e-06, "loss": 2.806, "step": 924 }, { "epoch": 0.11, "learning_rate": 9.927371726980669e-06, "loss": 2.7175, "step": 925 }, { "epoch": 0.11, "learning_rate": 9.927030379508691e-06, "loss": 2.5713, "step": 926 }, { "epoch": 0.11, "learning_rate": 9.926688237658551e-06, "loss": 2.7587, "step": 927 }, { "epoch": 0.11, "learning_rate": 9.926345301485414e-06, "loss": 2.6487, "step": 928 }, { "epoch": 0.11, "learning_rate": 9.92600157104457e-06, "loss": 2.563, "step": 929 }, { "epoch": 0.11, "learning_rate": 9.925657046391438e-06, "loss": 2.701, "step": 930 }, { "epoch": 0.11, "learning_rate": 9.925311727581567e-06, "loss": 2.5976, "step": 931 }, { "epoch": 0.11, "learning_rate": 9.924965614670629e-06, "loss": 2.661, "step": 932 }, { "epoch": 0.11, "learning_rate": 9.924618707714429e-06, "loss": 2.605, "step": 933 }, { "epoch": 0.11, "learning_rate": 9.9242710067689e-06, "loss": 2.5763, "step": 934 }, { "epoch": 0.11, "learning_rate": 9.923922511890098e-06, "loss": 2.7099, "step": 935 }, { "epoch": 0.11, "learning_rate": 9.923573223134213e-06, "loss": 2.5051, "step": 936 }, { "epoch": 0.11, "learning_rate": 9.923223140557558e-06, "loss": 2.5177, "step": 937 }, { "epoch": 0.11, "learning_rate": 9.922872264216581e-06, "loss": 2.6984, "step": 938 }, { "epoch": 0.11, "learning_rate": 9.922520594167847e-06, "loss": 2.8218, "step": 939 }, { "epoch": 0.11, "learning_rate": 9.92216813046806e-06, "loss": 2.5356, "step": 940 }, { "epoch": 0.11, "learning_rate": 9.921814873174045e-06, "loss": 2.8193, "step": 941 }, { "epoch": 0.11, "learning_rate": 9.921460822342757e-06, "loss": 2.7087, "step": 942 }, { "epoch": 0.11, "learning_rate": 9.92110597803128e-06, "loss": 2.5888, "step": 943 }, { "epoch": 0.11, "learning_rate": 9.920750340296823e-06, "loss": 2.5517, "step": 944 }, { "epoch": 0.11, "learning_rate": 9.920393909196729e-06, "loss": 2.6957, "step": 945 }, { "epoch": 0.11, "learning_rate": 9.920036684788464e-06, "loss": 2.6603, "step": 946 }, { "epoch": 0.11, "learning_rate": 9.919678667129618e-06, "loss": 2.6993, "step": 947 }, { "epoch": 0.11, "learning_rate": 9.919319856277921e-06, "loss": 2.6966, "step": 948 }, { "epoch": 0.11, "learning_rate": 9.918960252291216e-06, "loss": 2.5685, "step": 949 }, { "epoch": 0.11, "learning_rate": 9.918599855227487e-06, "loss": 2.7165, "step": 950 }, { "epoch": 0.11, "learning_rate": 9.91823866514484e-06, "loss": 2.523, "step": 951 }, { "epoch": 0.11, "learning_rate": 9.917876682101504e-06, "loss": 2.5824, "step": 952 }, { "epoch": 0.11, "learning_rate": 9.917513906155847e-06, "loss": 2.5774, "step": 953 }, { "epoch": 0.11, "learning_rate": 9.917150337366357e-06, "loss": 2.587, "step": 954 }, { "epoch": 0.11, "learning_rate": 9.916785975791649e-06, "loss": 2.7042, "step": 955 }, { "epoch": 0.11, "learning_rate": 9.916420821490474e-06, "loss": 2.6069, "step": 956 }, { "epoch": 0.11, "learning_rate": 9.9160548745217e-06, "loss": 2.6973, "step": 957 }, { "epoch": 0.12, "learning_rate": 9.915688134944328e-06, "loss": 2.9187, "step": 958 }, { "epoch": 0.12, "learning_rate": 9.915320602817493e-06, "loss": 2.6963, "step": 959 }, { "epoch": 0.12, "learning_rate": 9.914952278200444e-06, "loss": 2.6668, "step": 960 }, { "epoch": 0.12, "learning_rate": 9.914583161152574e-06, "loss": 2.5568, "step": 961 }, { "epoch": 0.12, "learning_rate": 9.914213251733387e-06, "loss": 2.7312, "step": 962 }, { "epoch": 0.12, "learning_rate": 9.913842550002526e-06, "loss": 2.7678, "step": 963 }, { "epoch": 0.12, "learning_rate": 9.91347105601976e-06, "loss": 2.806, "step": 964 }, { "epoch": 0.12, "learning_rate": 9.913098769844984e-06, "loss": 2.7121, "step": 965 }, { "epoch": 0.12, "learning_rate": 9.91272569153822e-06, "loss": 2.5571, "step": 966 }, { "epoch": 0.12, "learning_rate": 9.91235182115962e-06, "loss": 2.652, "step": 967 }, { "epoch": 0.12, "learning_rate": 9.911977158769461e-06, "loss": 2.6688, "step": 968 }, { "epoch": 0.12, "learning_rate": 9.911601704428153e-06, "loss": 2.7113, "step": 969 }, { "epoch": 0.12, "learning_rate": 9.911225458196226e-06, "loss": 2.741, "step": 970 }, { "epoch": 0.12, "learning_rate": 9.910848420134342e-06, "loss": 2.4043, "step": 971 }, { "epoch": 0.12, "learning_rate": 9.910470590303294e-06, "loss": 2.5095, "step": 972 }, { "epoch": 0.12, "learning_rate": 9.910091968763995e-06, "loss": 2.5416, "step": 973 }, { "epoch": 0.12, "learning_rate": 9.909712555577491e-06, "loss": 2.7067, "step": 974 }, { "epoch": 0.12, "learning_rate": 9.909332350804954e-06, "loss": 2.7044, "step": 975 }, { "epoch": 0.12, "learning_rate": 9.908951354507683e-06, "loss": 2.6406, "step": 976 }, { "epoch": 0.12, "learning_rate": 9.908569566747108e-06, "loss": 2.7271, "step": 977 }, { "epoch": 0.12, "learning_rate": 9.908186987584783e-06, "loss": 2.8177, "step": 978 }, { "epoch": 0.12, "learning_rate": 9.907803617082391e-06, "loss": 2.6757, "step": 979 }, { "epoch": 0.12, "learning_rate": 9.90741945530174e-06, "loss": 2.6966, "step": 980 }, { "epoch": 0.12, "learning_rate": 9.907034502304771e-06, "loss": 2.6855, "step": 981 }, { "epoch": 0.12, "learning_rate": 9.906648758153547e-06, "loss": 2.6183, "step": 982 }, { "epoch": 0.12, "learning_rate": 9.906262222910264e-06, "loss": 2.6375, "step": 983 }, { "epoch": 0.12, "learning_rate": 9.905874896637238e-06, "loss": 2.6201, "step": 984 }, { "epoch": 0.12, "learning_rate": 9.905486779396921e-06, "loss": 2.8266, "step": 985 }, { "epoch": 0.12, "learning_rate": 9.905097871251887e-06, "loss": 2.723, "step": 986 }, { "epoch": 0.12, "learning_rate": 9.90470817226484e-06, "loss": 2.5363, "step": 987 }, { "epoch": 0.12, "learning_rate": 9.904317682498609e-06, "loss": 2.6324, "step": 988 }, { "epoch": 0.12, "learning_rate": 9.903926402016153e-06, "loss": 2.5363, "step": 989 }, { "epoch": 0.12, "learning_rate": 9.903534330880557e-06, "loss": 2.7391, "step": 990 }, { "epoch": 0.12, "learning_rate": 9.903141469155036e-06, "loss": 2.5352, "step": 991 }, { "epoch": 0.12, "learning_rate": 9.90274781690293e-06, "loss": 2.6342, "step": 992 }, { "epoch": 0.12, "learning_rate": 9.902353374187706e-06, "loss": 2.7823, "step": 993 }, { "epoch": 0.12, "learning_rate": 9.901958141072957e-06, "loss": 2.5623, "step": 994 }, { "epoch": 0.12, "learning_rate": 9.901562117622412e-06, "loss": 2.7264, "step": 995 }, { "epoch": 0.12, "learning_rate": 9.901165303899916e-06, "loss": 2.6299, "step": 996 }, { "epoch": 0.12, "learning_rate": 9.900767699969449e-06, "loss": 2.6094, "step": 997 }, { "epoch": 0.12, "learning_rate": 9.900369305895115e-06, "loss": 2.6387, "step": 998 }, { "epoch": 0.12, "learning_rate": 9.899970121741147e-06, "loss": 2.6321, "step": 999 }, { "epoch": 0.12, "learning_rate": 9.899570147571907e-06, "loss": 2.3323, "step": 1000 }, { "epoch": 0.12, "learning_rate": 9.899169383451878e-06, "loss": 2.5735, "step": 1001 }, { "epoch": 0.12, "learning_rate": 9.89876782944568e-06, "loss": 2.6439, "step": 1002 }, { "epoch": 0.12, "learning_rate": 9.89836548561805e-06, "loss": 2.7669, "step": 1003 }, { "epoch": 0.12, "learning_rate": 9.89796235203386e-06, "loss": 2.8535, "step": 1004 }, { "epoch": 0.12, "learning_rate": 9.897558428758107e-06, "loss": 2.7649, "step": 1005 }, { "epoch": 0.12, "learning_rate": 9.897153715855911e-06, "loss": 2.6537, "step": 1006 }, { "epoch": 0.12, "learning_rate": 9.896748213392529e-06, "loss": 2.5848, "step": 1007 }, { "epoch": 0.12, "learning_rate": 9.896341921433337e-06, "loss": 2.6654, "step": 1008 }, { "epoch": 0.12, "learning_rate": 9.895934840043839e-06, "loss": 2.7781, "step": 1009 }, { "epoch": 0.12, "learning_rate": 9.895526969289671e-06, "loss": 2.7418, "step": 1010 }, { "epoch": 0.12, "learning_rate": 9.895118309236591e-06, "loss": 2.5787, "step": 1011 }, { "epoch": 0.12, "learning_rate": 9.89470885995049e-06, "loss": 2.5821, "step": 1012 }, { "epoch": 0.12, "learning_rate": 9.89429862149738e-06, "loss": 2.6385, "step": 1013 }, { "epoch": 0.12, "learning_rate": 9.893887593943405e-06, "loss": 2.7581, "step": 1014 }, { "epoch": 0.12, "learning_rate": 9.893475777354832e-06, "loss": 2.4466, "step": 1015 }, { "epoch": 0.12, "learning_rate": 9.89306317179806e-06, "loss": 2.7203, "step": 1016 }, { "epoch": 0.12, "learning_rate": 9.892649777339611e-06, "loss": 2.6585, "step": 1017 }, { "epoch": 0.12, "learning_rate": 9.89223559404614e-06, "loss": 2.6484, "step": 1018 }, { "epoch": 0.12, "learning_rate": 9.891820621984418e-06, "loss": 2.5929, "step": 1019 }, { "epoch": 0.12, "learning_rate": 9.891404861221356e-06, "loss": 2.5658, "step": 1020 }, { "epoch": 0.12, "learning_rate": 9.890988311823986e-06, "loss": 2.6685, "step": 1021 }, { "epoch": 0.12, "learning_rate": 9.890570973859468e-06, "loss": 2.4192, "step": 1022 }, { "epoch": 0.12, "learning_rate": 9.890152847395085e-06, "loss": 2.6418, "step": 1023 }, { "epoch": 0.12, "learning_rate": 9.889733932498253e-06, "loss": 2.8217, "step": 1024 }, { "epoch": 0.12, "learning_rate": 9.889314229236515e-06, "loss": 2.7264, "step": 1025 }, { "epoch": 0.12, "learning_rate": 9.888893737677537e-06, "loss": 2.8306, "step": 1026 }, { "epoch": 0.12, "learning_rate": 9.888472457889115e-06, "loss": 2.585, "step": 1027 }, { "epoch": 0.12, "learning_rate": 9.888050389939172e-06, "loss": 2.6385, "step": 1028 }, { "epoch": 0.12, "learning_rate": 9.887627533895757e-06, "loss": 2.6988, "step": 1029 }, { "epoch": 0.12, "learning_rate": 9.887203889827045e-06, "loss": 2.7786, "step": 1030 }, { "epoch": 0.12, "learning_rate": 9.88677945780134e-06, "loss": 2.5515, "step": 1031 }, { "epoch": 0.12, "learning_rate": 9.886354237887075e-06, "loss": 2.6657, "step": 1032 }, { "epoch": 0.12, "learning_rate": 9.885928230152804e-06, "loss": 2.7088, "step": 1033 }, { "epoch": 0.12, "learning_rate": 9.885501434667215e-06, "loss": 2.599, "step": 1034 }, { "epoch": 0.12, "learning_rate": 9.885073851499119e-06, "loss": 2.692, "step": 1035 }, { "epoch": 0.12, "learning_rate": 9.884645480717452e-06, "loss": 2.8362, "step": 1036 }, { "epoch": 0.12, "learning_rate": 9.884216322391282e-06, "loss": 2.6754, "step": 1037 }, { "epoch": 0.12, "learning_rate": 9.883786376589802e-06, "loss": 2.7087, "step": 1038 }, { "epoch": 0.12, "learning_rate": 9.883355643382328e-06, "loss": 2.6454, "step": 1039 }, { "epoch": 0.12, "learning_rate": 9.882924122838311e-06, "loss": 2.7205, "step": 1040 }, { "epoch": 0.13, "learning_rate": 9.882491815027322e-06, "loss": 2.5998, "step": 1041 }, { "epoch": 0.13, "learning_rate": 9.882058720019062e-06, "loss": 2.6998, "step": 1042 }, { "epoch": 0.13, "learning_rate": 9.881624837883358e-06, "loss": 2.5463, "step": 1043 }, { "epoch": 0.13, "learning_rate": 9.881190168690164e-06, "loss": 2.7631, "step": 1044 }, { "epoch": 0.13, "learning_rate": 9.880754712509563e-06, "loss": 2.8184, "step": 1045 }, { "epoch": 0.13, "learning_rate": 9.88031846941176e-06, "loss": 2.4644, "step": 1046 }, { "epoch": 0.13, "learning_rate": 9.879881439467091e-06, "loss": 2.7637, "step": 1047 }, { "epoch": 0.13, "learning_rate": 9.87944362274602e-06, "loss": 2.6318, "step": 1048 }, { "epoch": 0.13, "learning_rate": 9.879005019319133e-06, "loss": 2.7644, "step": 1049 }, { "epoch": 0.13, "learning_rate": 9.878565629257146e-06, "loss": 2.7064, "step": 1050 }, { "epoch": 0.13, "learning_rate": 9.8781254526309e-06, "loss": 2.4167, "step": 1051 }, { "epoch": 0.13, "learning_rate": 9.877684489511367e-06, "loss": 2.6741, "step": 1052 }, { "epoch": 0.13, "learning_rate": 9.87724273996964e-06, "loss": 2.6613, "step": 1053 }, { "epoch": 0.13, "learning_rate": 9.876800204076944e-06, "loss": 2.5728, "step": 1054 }, { "epoch": 0.13, "learning_rate": 9.876356881904627e-06, "loss": 2.6559, "step": 1055 }, { "epoch": 0.13, "learning_rate": 9.875912773524165e-06, "loss": 2.6052, "step": 1056 }, { "epoch": 0.13, "learning_rate": 9.87546787900716e-06, "loss": 2.6146, "step": 1057 }, { "epoch": 0.13, "learning_rate": 9.875022198425347e-06, "loss": 2.7509, "step": 1058 }, { "epoch": 0.13, "learning_rate": 9.874575731850575e-06, "loss": 2.5809, "step": 1059 }, { "epoch": 0.13, "learning_rate": 9.874128479354833e-06, "loss": 2.614, "step": 1060 }, { "epoch": 0.13, "learning_rate": 9.873680441010227e-06, "loss": 2.6881, "step": 1061 }, { "epoch": 0.13, "learning_rate": 9.873231616888997e-06, "loss": 2.7237, "step": 1062 }, { "epoch": 0.13, "learning_rate": 9.872782007063503e-06, "loss": 2.7201, "step": 1063 }, { "epoch": 0.13, "learning_rate": 9.872331611606238e-06, "loss": 2.521, "step": 1064 }, { "epoch": 0.13, "learning_rate": 9.871880430589817e-06, "loss": 2.6008, "step": 1065 }, { "epoch": 0.13, "learning_rate": 9.871428464086983e-06, "loss": 2.4882, "step": 1066 }, { "epoch": 0.13, "learning_rate": 9.870975712170605e-06, "loss": 2.4552, "step": 1067 }, { "epoch": 0.13, "learning_rate": 9.870522174913683e-06, "loss": 2.683, "step": 1068 }, { "epoch": 0.13, "learning_rate": 9.870067852389338e-06, "loss": 2.7308, "step": 1069 }, { "epoch": 0.13, "learning_rate": 9.869612744670817e-06, "loss": 2.6873, "step": 1070 }, { "epoch": 0.13, "learning_rate": 9.869156851831502e-06, "loss": 2.8014, "step": 1071 }, { "epoch": 0.13, "learning_rate": 9.868700173944895e-06, "loss": 2.4885, "step": 1072 }, { "epoch": 0.13, "learning_rate": 9.86824271108462e-06, "loss": 2.6166, "step": 1073 }, { "epoch": 0.13, "learning_rate": 9.867784463324437e-06, "loss": 2.552, "step": 1074 }, { "epoch": 0.13, "learning_rate": 9.86732543073823e-06, "loss": 2.6872, "step": 1075 }, { "epoch": 0.13, "learning_rate": 9.866865613400008e-06, "loss": 2.6828, "step": 1076 }, { "epoch": 0.13, "learning_rate": 9.866405011383902e-06, "loss": 2.536, "step": 1077 }, { "epoch": 0.13, "learning_rate": 9.86594362476418e-06, "loss": 2.6703, "step": 1078 }, { "epoch": 0.13, "learning_rate": 9.865481453615227e-06, "loss": 2.3919, "step": 1079 }, { "epoch": 0.13, "learning_rate": 9.86501849801156e-06, "loss": 2.7571, "step": 1080 }, { "epoch": 0.13, "learning_rate": 9.86455475802782e-06, "loss": 2.5048, "step": 1081 }, { "epoch": 0.13, "learning_rate": 9.864090233738776e-06, "loss": 2.5079, "step": 1082 }, { "epoch": 0.13, "learning_rate": 9.86362492521932e-06, "loss": 2.6762, "step": 1083 }, { "epoch": 0.13, "learning_rate": 9.863158832544477e-06, "loss": 2.5886, "step": 1084 }, { "epoch": 0.13, "learning_rate": 9.862691955789393e-06, "loss": 2.6237, "step": 1085 }, { "epoch": 0.13, "learning_rate": 9.862224295029339e-06, "loss": 2.5936, "step": 1086 }, { "epoch": 0.13, "learning_rate": 9.861755850339718e-06, "loss": 2.7221, "step": 1087 }, { "epoch": 0.13, "learning_rate": 9.861286621796056e-06, "loss": 2.6428, "step": 1088 }, { "epoch": 0.13, "learning_rate": 9.860816609474008e-06, "loss": 2.509, "step": 1089 }, { "epoch": 0.13, "learning_rate": 9.86034581344935e-06, "loss": 2.6801, "step": 1090 }, { "epoch": 0.13, "learning_rate": 9.859874233797991e-06, "loss": 2.6718, "step": 1091 }, { "epoch": 0.13, "learning_rate": 9.859401870595959e-06, "loss": 2.6979, "step": 1092 }, { "epoch": 0.13, "learning_rate": 9.858928723919419e-06, "loss": 2.6733, "step": 1093 }, { "epoch": 0.13, "learning_rate": 9.858454793844648e-06, "loss": 2.5676, "step": 1094 }, { "epoch": 0.13, "learning_rate": 9.857980080448064e-06, "loss": 2.7128, "step": 1095 }, { "epoch": 0.13, "learning_rate": 9.8575045838062e-06, "loss": 2.7672, "step": 1096 }, { "epoch": 0.13, "learning_rate": 9.857028303995719e-06, "loss": 2.8331, "step": 1097 }, { "epoch": 0.13, "learning_rate": 9.856551241093414e-06, "loss": 2.8234, "step": 1098 }, { "epoch": 0.13, "learning_rate": 9.856073395176203e-06, "loss": 2.7091, "step": 1099 }, { "epoch": 0.13, "learning_rate": 9.855594766321122e-06, "loss": 2.578, "step": 1100 }, { "epoch": 0.13, "learning_rate": 9.855115354605345e-06, "loss": 2.7099, "step": 1101 }, { "epoch": 0.13, "learning_rate": 9.854635160106166e-06, "loss": 2.6883, "step": 1102 }, { "epoch": 0.13, "learning_rate": 9.854154182901e-06, "loss": 2.584, "step": 1103 }, { "epoch": 0.13, "learning_rate": 9.853672423067404e-06, "loss": 2.4562, "step": 1104 }, { "epoch": 0.13, "learning_rate": 9.853189880683046e-06, "loss": 2.6069, "step": 1105 }, { "epoch": 0.13, "learning_rate": 9.852706555825727e-06, "loss": 2.7305, "step": 1106 }, { "epoch": 0.13, "learning_rate": 9.85222244857337e-06, "loss": 2.7552, "step": 1107 }, { "epoch": 0.13, "learning_rate": 9.85173755900403e-06, "loss": 2.7975, "step": 1108 }, { "epoch": 0.13, "learning_rate": 9.851251887195886e-06, "loss": 2.5809, "step": 1109 }, { "epoch": 0.13, "learning_rate": 9.850765433227239e-06, "loss": 2.6274, "step": 1110 }, { "epoch": 0.13, "learning_rate": 9.850278197176522e-06, "loss": 2.6602, "step": 1111 }, { "epoch": 0.13, "learning_rate": 9.849790179122287e-06, "loss": 2.6088, "step": 1112 }, { "epoch": 0.13, "learning_rate": 9.849301379143223e-06, "loss": 2.5476, "step": 1113 }, { "epoch": 0.13, "learning_rate": 9.848811797318132e-06, "loss": 2.5605, "step": 1114 }, { "epoch": 0.13, "learning_rate": 9.848321433725954e-06, "loss": 2.6549, "step": 1115 }, { "epoch": 0.13, "learning_rate": 9.847830288445745e-06, "loss": 2.8376, "step": 1116 }, { "epoch": 0.13, "learning_rate": 9.847338361556697e-06, "loss": 2.5053, "step": 1117 }, { "epoch": 0.13, "learning_rate": 9.846845653138117e-06, "loss": 2.4495, "step": 1118 }, { "epoch": 0.13, "learning_rate": 9.846352163269448e-06, "loss": 2.66, "step": 1119 }, { "epoch": 0.13, "learning_rate": 9.845857892030252e-06, "loss": 2.7009, "step": 1120 }, { "epoch": 0.13, "learning_rate": 9.84536283950022e-06, "loss": 2.6353, "step": 1121 }, { "epoch": 0.13, "learning_rate": 9.844867005759171e-06, "loss": 2.6904, "step": 1122 }, { "epoch": 0.13, "learning_rate": 9.844370390887046e-06, "loss": 2.568, "step": 1123 }, { "epoch": 0.14, "learning_rate": 9.843872994963912e-06, "loss": 2.6672, "step": 1124 }, { "epoch": 0.14, "learning_rate": 9.843374818069964e-06, "loss": 2.5252, "step": 1125 }, { "epoch": 0.14, "learning_rate": 9.842875860285525e-06, "loss": 2.5919, "step": 1126 }, { "epoch": 0.14, "learning_rate": 9.842376121691038e-06, "loss": 2.5046, "step": 1127 }, { "epoch": 0.14, "learning_rate": 9.841875602367079e-06, "loss": 2.5479, "step": 1128 }, { "epoch": 0.14, "learning_rate": 9.841374302394341e-06, "loss": 2.7249, "step": 1129 }, { "epoch": 0.14, "learning_rate": 9.84087222185365e-06, "loss": 2.7983, "step": 1130 }, { "epoch": 0.14, "learning_rate": 9.84036936082596e-06, "loss": 2.6776, "step": 1131 }, { "epoch": 0.14, "learning_rate": 9.83986571939234e-06, "loss": 2.7237, "step": 1132 }, { "epoch": 0.14, "learning_rate": 9.839361297633994e-06, "loss": 2.7218, "step": 1133 }, { "epoch": 0.14, "learning_rate": 9.83885609563225e-06, "loss": 2.3394, "step": 1134 }, { "epoch": 0.14, "learning_rate": 9.83835011346856e-06, "loss": 2.5308, "step": 1135 }, { "epoch": 0.14, "learning_rate": 9.837843351224504e-06, "loss": 2.6986, "step": 1136 }, { "epoch": 0.14, "learning_rate": 9.837335808981785e-06, "loss": 2.5363, "step": 1137 }, { "epoch": 0.14, "learning_rate": 9.836827486822233e-06, "loss": 2.6301, "step": 1138 }, { "epoch": 0.14, "learning_rate": 9.836318384827807e-06, "loss": 2.6516, "step": 1139 }, { "epoch": 0.14, "learning_rate": 9.835808503080586e-06, "loss": 2.7416, "step": 1140 }, { "epoch": 0.14, "learning_rate": 9.83529784166278e-06, "loss": 2.6613, "step": 1141 }, { "epoch": 0.14, "learning_rate": 9.834786400656719e-06, "loss": 2.6756, "step": 1142 }, { "epoch": 0.14, "learning_rate": 9.834274180144865e-06, "loss": 2.6653, "step": 1143 }, { "epoch": 0.14, "learning_rate": 9.833761180209799e-06, "loss": 2.6257, "step": 1144 }, { "epoch": 0.14, "learning_rate": 9.833247400934236e-06, "loss": 2.5206, "step": 1145 }, { "epoch": 0.14, "learning_rate": 9.832732842401008e-06, "loss": 2.7033, "step": 1146 }, { "epoch": 0.14, "learning_rate": 9.832217504693078e-06, "loss": 2.5908, "step": 1147 }, { "epoch": 0.14, "learning_rate": 9.831701387893533e-06, "loss": 2.4812, "step": 1148 }, { "epoch": 0.14, "learning_rate": 9.831184492085584e-06, "loss": 2.522, "step": 1149 }, { "epoch": 0.14, "learning_rate": 9.830666817352575e-06, "loss": 2.6933, "step": 1150 }, { "epoch": 0.14, "learning_rate": 9.830148363777963e-06, "loss": 2.5252, "step": 1151 }, { "epoch": 0.14, "learning_rate": 9.829629131445342e-06, "loss": 2.7246, "step": 1152 }, { "epoch": 0.14, "learning_rate": 9.829109120438426e-06, "loss": 2.6901, "step": 1153 }, { "epoch": 0.14, "learning_rate": 9.828588330841055e-06, "loss": 2.6394, "step": 1154 }, { "epoch": 0.14, "learning_rate": 9.828066762737196e-06, "loss": 2.6392, "step": 1155 }, { "epoch": 0.14, "learning_rate": 9.82754441621094e-06, "loss": 2.5612, "step": 1156 }, { "epoch": 0.14, "learning_rate": 9.827021291346506e-06, "loss": 2.6585, "step": 1157 }, { "epoch": 0.14, "learning_rate": 9.826497388228234e-06, "loss": 2.6451, "step": 1158 }, { "epoch": 0.14, "learning_rate": 9.825972706940591e-06, "loss": 2.6866, "step": 1159 }, { "epoch": 0.14, "learning_rate": 9.825447247568177e-06, "loss": 2.7848, "step": 1160 }, { "epoch": 0.14, "learning_rate": 9.824921010195706e-06, "loss": 2.6162, "step": 1161 }, { "epoch": 0.14, "learning_rate": 9.824393994908021e-06, "loss": 2.7045, "step": 1162 }, { "epoch": 0.14, "learning_rate": 9.823866201790097e-06, "loss": 2.832, "step": 1163 }, { "epoch": 0.14, "learning_rate": 9.823337630927027e-06, "loss": 2.7403, "step": 1164 }, { "epoch": 0.14, "learning_rate": 9.822808282404031e-06, "loss": 2.5951, "step": 1165 }, { "epoch": 0.14, "learning_rate": 9.822278156306455e-06, "loss": 2.6795, "step": 1166 }, { "epoch": 0.14, "learning_rate": 9.821747252719772e-06, "loss": 2.5628, "step": 1167 }, { "epoch": 0.14, "learning_rate": 9.821215571729578e-06, "loss": 2.7008, "step": 1168 }, { "epoch": 0.14, "learning_rate": 9.820683113421595e-06, "loss": 2.5576, "step": 1169 }, { "epoch": 0.14, "learning_rate": 9.82014987788167e-06, "loss": 2.5441, "step": 1170 }, { "epoch": 0.14, "learning_rate": 9.819615865195778e-06, "loss": 2.5093, "step": 1171 }, { "epoch": 0.14, "learning_rate": 9.819081075450014e-06, "loss": 2.6538, "step": 1172 }, { "epoch": 0.14, "learning_rate": 9.818545508730604e-06, "loss": 2.4913, "step": 1173 }, { "epoch": 0.14, "learning_rate": 9.818009165123895e-06, "loss": 2.6728, "step": 1174 }, { "epoch": 0.14, "learning_rate": 9.817472044716362e-06, "loss": 2.5991, "step": 1175 }, { "epoch": 0.14, "learning_rate": 9.816934147594606e-06, "loss": 2.6714, "step": 1176 }, { "epoch": 0.14, "learning_rate": 9.816395473845346e-06, "loss": 2.5955, "step": 1177 }, { "epoch": 0.14, "learning_rate": 9.815856023555437e-06, "loss": 2.8624, "step": 1178 }, { "epoch": 0.14, "learning_rate": 9.815315796811849e-06, "loss": 2.3883, "step": 1179 }, { "epoch": 0.14, "learning_rate": 9.814774793701686e-06, "loss": 2.5678, "step": 1180 }, { "epoch": 0.14, "learning_rate": 9.814233014312174e-06, "loss": 2.6132, "step": 1181 }, { "epoch": 0.14, "learning_rate": 9.813690458730659e-06, "loss": 2.6245, "step": 1182 }, { "epoch": 0.14, "learning_rate": 9.813147127044618e-06, "loss": 2.5358, "step": 1183 }, { "epoch": 0.14, "learning_rate": 9.812603019341652e-06, "loss": 2.7457, "step": 1184 }, { "epoch": 0.14, "learning_rate": 9.812058135709488e-06, "loss": 2.6248, "step": 1185 }, { "epoch": 0.14, "learning_rate": 9.811512476235974e-06, "loss": 2.3929, "step": 1186 }, { "epoch": 0.14, "learning_rate": 9.810966041009088e-06, "loss": 2.6402, "step": 1187 }, { "epoch": 0.14, "learning_rate": 9.810418830116933e-06, "loss": 2.5529, "step": 1188 }, { "epoch": 0.14, "learning_rate": 9.809870843647731e-06, "loss": 2.645, "step": 1189 }, { "epoch": 0.14, "learning_rate": 9.809322081689834e-06, "loss": 2.8, "step": 1190 }, { "epoch": 0.14, "learning_rate": 9.808772544331719e-06, "loss": 2.72, "step": 1191 }, { "epoch": 0.14, "learning_rate": 9.808222231661989e-06, "loss": 2.632, "step": 1192 }, { "epoch": 0.14, "learning_rate": 9.807671143769367e-06, "loss": 2.6817, "step": 1193 }, { "epoch": 0.14, "learning_rate": 9.807119280742702e-06, "loss": 2.7025, "step": 1194 }, { "epoch": 0.14, "learning_rate": 9.806566642670979e-06, "loss": 2.6578, "step": 1195 }, { "epoch": 0.14, "learning_rate": 9.80601322964329e-06, "loss": 2.7352, "step": 1196 }, { "epoch": 0.14, "learning_rate": 9.805459041748864e-06, "loss": 2.4547, "step": 1197 }, { "epoch": 0.14, "learning_rate": 9.804904079077054e-06, "loss": 2.5056, "step": 1198 }, { "epoch": 0.14, "learning_rate": 9.804348341717333e-06, "loss": 2.7427, "step": 1199 }, { "epoch": 0.14, "learning_rate": 9.803791829759302e-06, "loss": 2.5503, "step": 1200 }, { "epoch": 0.14, "learning_rate": 9.80323454329269e-06, "loss": 2.7746, "step": 1201 }, { "epoch": 0.14, "learning_rate": 9.802676482407343e-06, "loss": 2.6463, "step": 1202 }, { "epoch": 0.14, "learning_rate": 9.80211764719324e-06, "loss": 2.5803, "step": 1203 }, { "epoch": 0.14, "learning_rate": 9.80155803774048e-06, "loss": 2.6343, "step": 1204 }, { "epoch": 0.14, "learning_rate": 9.800997654139286e-06, "loss": 2.5275, "step": 1205 }, { "epoch": 0.14, "learning_rate": 9.800436496480009e-06, "loss": 2.572, "step": 1206 }, { "epoch": 0.15, "learning_rate": 9.799874564853126e-06, "loss": 2.7689, "step": 1207 }, { "epoch": 0.15, "learning_rate": 9.799311859349235e-06, "loss": 2.5281, "step": 1208 }, { "epoch": 0.15, "learning_rate": 9.798748380059058e-06, "loss": 2.5983, "step": 1209 }, { "epoch": 0.15, "learning_rate": 9.798184127073446e-06, "loss": 2.6778, "step": 1210 }, { "epoch": 0.15, "learning_rate": 9.797619100483374e-06, "loss": 2.5932, "step": 1211 }, { "epoch": 0.15, "learning_rate": 9.797053300379938e-06, "loss": 2.5835, "step": 1212 }, { "epoch": 0.15, "learning_rate": 9.796486726854361e-06, "loss": 2.6636, "step": 1213 }, { "epoch": 0.15, "learning_rate": 9.795919379997993e-06, "loss": 2.5734, "step": 1214 }, { "epoch": 0.15, "learning_rate": 9.795351259902308e-06, "loss": 2.749, "step": 1215 }, { "epoch": 0.15, "learning_rate": 9.794782366658896e-06, "loss": 2.5195, "step": 1216 }, { "epoch": 0.15, "learning_rate": 9.794212700359488e-06, "loss": 2.7522, "step": 1217 }, { "epoch": 0.15, "learning_rate": 9.793642261095924e-06, "loss": 2.5126, "step": 1218 }, { "epoch": 0.15, "learning_rate": 9.793071048960177e-06, "loss": 2.6713, "step": 1219 }, { "epoch": 0.15, "learning_rate": 9.792499064044343e-06, "loss": 2.4674, "step": 1220 }, { "epoch": 0.15, "learning_rate": 9.791926306440643e-06, "loss": 2.7383, "step": 1221 }, { "epoch": 0.15, "learning_rate": 9.791352776241421e-06, "loss": 2.6019, "step": 1222 }, { "epoch": 0.15, "learning_rate": 9.790778473539147e-06, "loss": 2.5178, "step": 1223 }, { "epoch": 0.15, "learning_rate": 9.790203398426414e-06, "loss": 2.689, "step": 1224 }, { "epoch": 0.15, "learning_rate": 9.789627550995941e-06, "loss": 2.6425, "step": 1225 }, { "epoch": 0.15, "learning_rate": 9.789050931340572e-06, "loss": 2.6346, "step": 1226 }, { "epoch": 0.15, "learning_rate": 9.788473539553271e-06, "loss": 2.7565, "step": 1227 }, { "epoch": 0.15, "learning_rate": 9.787895375727137e-06, "loss": 2.6264, "step": 1228 }, { "epoch": 0.15, "learning_rate": 9.787316439955378e-06, "loss": 2.5931, "step": 1229 }, { "epoch": 0.15, "learning_rate": 9.786736732331343e-06, "loss": 2.586, "step": 1230 }, { "epoch": 0.15, "learning_rate": 9.786156252948493e-06, "loss": 2.7511, "step": 1231 }, { "epoch": 0.15, "learning_rate": 9.785575001900418e-06, "loss": 2.6356, "step": 1232 }, { "epoch": 0.15, "learning_rate": 9.784992979280833e-06, "loss": 2.6094, "step": 1233 }, { "epoch": 0.15, "learning_rate": 9.784410185183579e-06, "loss": 2.7318, "step": 1234 }, { "epoch": 0.15, "learning_rate": 9.783826619702615e-06, "loss": 2.6301, "step": 1235 }, { "epoch": 0.15, "learning_rate": 9.783242282932028e-06, "loss": 2.6861, "step": 1236 }, { "epoch": 0.15, "learning_rate": 9.782657174966035e-06, "loss": 2.5651, "step": 1237 }, { "epoch": 0.15, "learning_rate": 9.78207129589897e-06, "loss": 2.6839, "step": 1238 }, { "epoch": 0.15, "learning_rate": 9.781484645825289e-06, "loss": 2.5388, "step": 1239 }, { "epoch": 0.15, "learning_rate": 9.780897224839583e-06, "loss": 2.7062, "step": 1240 }, { "epoch": 0.15, "learning_rate": 9.780309033036556e-06, "loss": 2.5085, "step": 1241 }, { "epoch": 0.15, "learning_rate": 9.779720070511048e-06, "loss": 2.7103, "step": 1242 }, { "epoch": 0.15, "learning_rate": 9.77913033735801e-06, "loss": 2.6695, "step": 1243 }, { "epoch": 0.15, "learning_rate": 9.778539833672525e-06, "loss": 2.5719, "step": 1244 }, { "epoch": 0.15, "learning_rate": 9.777948559549802e-06, "loss": 2.6052, "step": 1245 }, { "epoch": 0.15, "learning_rate": 9.777356515085167e-06, "loss": 2.7043, "step": 1246 }, { "epoch": 0.15, "learning_rate": 9.77676370037408e-06, "loss": 2.6633, "step": 1247 }, { "epoch": 0.15, "learning_rate": 9.776170115512115e-06, "loss": 2.5843, "step": 1248 }, { "epoch": 0.15, "learning_rate": 9.775575760594978e-06, "loss": 2.5889, "step": 1249 }, { "epoch": 0.15, "learning_rate": 9.774980635718494e-06, "loss": 2.5847, "step": 1250 }, { "epoch": 0.15, "learning_rate": 9.774384740978614e-06, "loss": 2.5711, "step": 1251 }, { "epoch": 0.15, "learning_rate": 9.773788076471415e-06, "loss": 2.7146, "step": 1252 }, { "epoch": 0.15, "learning_rate": 9.773190642293094e-06, "loss": 2.5059, "step": 1253 }, { "epoch": 0.15, "learning_rate": 9.772592438539977e-06, "loss": 2.8255, "step": 1254 }, { "epoch": 0.15, "learning_rate": 9.77199346530851e-06, "loss": 2.6024, "step": 1255 }, { "epoch": 0.15, "learning_rate": 9.771393722695267e-06, "loss": 2.5862, "step": 1256 }, { "epoch": 0.15, "learning_rate": 9.770793210796938e-06, "loss": 2.6022, "step": 1257 }, { "epoch": 0.15, "learning_rate": 9.770191929710348e-06, "loss": 2.7668, "step": 1258 }, { "epoch": 0.15, "learning_rate": 9.76958987953244e-06, "loss": 2.8871, "step": 1259 }, { "epoch": 0.15, "learning_rate": 9.76898706036028e-06, "loss": 2.6784, "step": 1260 }, { "epoch": 0.15, "learning_rate": 9.768383472291061e-06, "loss": 2.7255, "step": 1261 }, { "epoch": 0.15, "learning_rate": 9.767779115422097e-06, "loss": 2.5715, "step": 1262 }, { "epoch": 0.15, "learning_rate": 9.767173989850828e-06, "loss": 2.5899, "step": 1263 }, { "epoch": 0.15, "learning_rate": 9.766568095674819e-06, "loss": 2.4836, "step": 1264 }, { "epoch": 0.15, "learning_rate": 9.765961432991758e-06, "loss": 2.5232, "step": 1265 }, { "epoch": 0.15, "learning_rate": 9.765354001899455e-06, "loss": 2.7133, "step": 1266 }, { "epoch": 0.15, "learning_rate": 9.764745802495846e-06, "loss": 2.6456, "step": 1267 }, { "epoch": 0.15, "learning_rate": 9.764136834878987e-06, "loss": 2.6134, "step": 1268 }, { "epoch": 0.15, "learning_rate": 9.763527099147064e-06, "loss": 2.6227, "step": 1269 }, { "epoch": 0.15, "learning_rate": 9.762916595398384e-06, "loss": 2.7248, "step": 1270 }, { "epoch": 0.15, "learning_rate": 9.762305323731376e-06, "loss": 2.7307, "step": 1271 }, { "epoch": 0.15, "learning_rate": 9.761693284244598e-06, "loss": 2.6071, "step": 1272 }, { "epoch": 0.15, "learning_rate": 9.761080477036722e-06, "loss": 2.8569, "step": 1273 }, { "epoch": 0.15, "learning_rate": 9.760466902206557e-06, "loss": 2.5946, "step": 1274 }, { "epoch": 0.15, "learning_rate": 9.759852559853025e-06, "loss": 2.7093, "step": 1275 }, { "epoch": 0.15, "learning_rate": 9.759237450075174e-06, "loss": 2.6723, "step": 1276 }, { "epoch": 0.15, "learning_rate": 9.75862157297218e-06, "loss": 2.4425, "step": 1277 }, { "epoch": 0.15, "learning_rate": 9.758004928643342e-06, "loss": 2.6542, "step": 1278 }, { "epoch": 0.15, "learning_rate": 9.757387517188076e-06, "loss": 2.5784, "step": 1279 }, { "epoch": 0.15, "learning_rate": 9.756769338705927e-06, "loss": 2.5291, "step": 1280 }, { "epoch": 0.15, "learning_rate": 9.756150393296566e-06, "loss": 2.7432, "step": 1281 }, { "epoch": 0.15, "learning_rate": 9.755530681059784e-06, "loss": 2.5371, "step": 1282 }, { "epoch": 0.15, "learning_rate": 9.754910202095493e-06, "loss": 2.5031, "step": 1283 }, { "epoch": 0.15, "learning_rate": 9.754288956503737e-06, "loss": 2.6121, "step": 1284 }, { "epoch": 0.15, "learning_rate": 9.753666944384675e-06, "loss": 2.8312, "step": 1285 }, { "epoch": 0.15, "learning_rate": 9.753044165838594e-06, "loss": 2.7478, "step": 1286 }, { "epoch": 0.15, "learning_rate": 9.752420620965903e-06, "loss": 2.845, "step": 1287 }, { "epoch": 0.15, "learning_rate": 9.751796309867139e-06, "loss": 2.5277, "step": 1288 }, { "epoch": 0.15, "learning_rate": 9.751171232642954e-06, "loss": 2.7744, "step": 1289 }, { "epoch": 0.15, "learning_rate": 9.75054538939413e-06, "loss": 2.6891, "step": 1290 }, { "epoch": 0.16, "learning_rate": 9.74991878022157e-06, "loss": 2.6358, "step": 1291 }, { "epoch": 0.16, "learning_rate": 9.749291405226304e-06, "loss": 2.6578, "step": 1292 }, { "epoch": 0.16, "learning_rate": 9.748663264509481e-06, "loss": 2.5, "step": 1293 }, { "epoch": 0.16, "learning_rate": 9.748034358172376e-06, "loss": 2.6628, "step": 1294 }, { "epoch": 0.16, "learning_rate": 9.747404686316386e-06, "loss": 2.551, "step": 1295 }, { "epoch": 0.16, "learning_rate": 9.74677424904303e-06, "loss": 2.9117, "step": 1296 }, { "epoch": 0.16, "learning_rate": 9.746143046453956e-06, "loss": 2.6162, "step": 1297 }, { "epoch": 0.16, "learning_rate": 9.745511078650931e-06, "loss": 2.6874, "step": 1298 }, { "epoch": 0.16, "learning_rate": 9.744878345735846e-06, "loss": 2.54, "step": 1299 }, { "epoch": 0.16, "learning_rate": 9.744244847810716e-06, "loss": 2.6775, "step": 1300 }, { "epoch": 0.16, "learning_rate": 9.743610584977676e-06, "loss": 2.6283, "step": 1301 }, { "epoch": 0.16, "learning_rate": 9.742975557338992e-06, "loss": 2.6796, "step": 1302 }, { "epoch": 0.16, "learning_rate": 9.742339764997046e-06, "loss": 2.5238, "step": 1303 }, { "epoch": 0.16, "learning_rate": 9.741703208054347e-06, "loss": 2.6554, "step": 1304 }, { "epoch": 0.16, "learning_rate": 9.741065886613523e-06, "loss": 2.7491, "step": 1305 }, { "epoch": 0.16, "learning_rate": 9.740427800777333e-06, "loss": 2.822, "step": 1306 }, { "epoch": 0.16, "learning_rate": 9.739788950648651e-06, "loss": 2.5097, "step": 1307 }, { "epoch": 0.16, "learning_rate": 9.739149336330482e-06, "loss": 2.6376, "step": 1308 }, { "epoch": 0.16, "learning_rate": 9.738508957925947e-06, "loss": 2.6424, "step": 1309 }, { "epoch": 0.16, "learning_rate": 9.737867815538292e-06, "loss": 2.6645, "step": 1310 }, { "epoch": 0.16, "learning_rate": 9.737225909270891e-06, "loss": 2.8391, "step": 1311 }, { "epoch": 0.16, "learning_rate": 9.736583239227235e-06, "loss": 2.4144, "step": 1312 }, { "epoch": 0.16, "learning_rate": 9.735939805510943e-06, "loss": 2.5847, "step": 1313 }, { "epoch": 0.16, "learning_rate": 9.735295608225753e-06, "loss": 2.5234, "step": 1314 }, { "epoch": 0.16, "learning_rate": 9.73465064747553e-06, "loss": 2.7315, "step": 1315 }, { "epoch": 0.16, "learning_rate": 9.734004923364258e-06, "loss": 2.5849, "step": 1316 }, { "epoch": 0.16, "learning_rate": 9.733358435996045e-06, "loss": 2.6387, "step": 1317 }, { "epoch": 0.16, "learning_rate": 9.732711185475127e-06, "loss": 2.6055, "step": 1318 }, { "epoch": 0.16, "learning_rate": 9.732063171905858e-06, "loss": 2.6118, "step": 1319 }, { "epoch": 0.16, "learning_rate": 9.731414395392716e-06, "loss": 2.6367, "step": 1320 }, { "epoch": 0.16, "learning_rate": 9.730764856040302e-06, "loss": 2.6154, "step": 1321 }, { "epoch": 0.16, "learning_rate": 9.73011455395334e-06, "loss": 2.613, "step": 1322 }, { "epoch": 0.16, "learning_rate": 9.729463489236679e-06, "loss": 2.5388, "step": 1323 }, { "epoch": 0.16, "learning_rate": 9.728811661995287e-06, "loss": 2.5568, "step": 1324 }, { "epoch": 0.16, "learning_rate": 9.72815907233426e-06, "loss": 2.6106, "step": 1325 }, { "epoch": 0.16, "learning_rate": 9.72750572035881e-06, "loss": 2.6312, "step": 1326 }, { "epoch": 0.16, "learning_rate": 9.726851606174281e-06, "loss": 2.7771, "step": 1327 }, { "epoch": 0.16, "learning_rate": 9.72619672988613e-06, "loss": 2.6366, "step": 1328 }, { "epoch": 0.16, "learning_rate": 9.725541091599946e-06, "loss": 2.7585, "step": 1329 }, { "epoch": 0.16, "learning_rate": 9.724884691421433e-06, "loss": 2.5895, "step": 1330 }, { "epoch": 0.16, "learning_rate": 9.724227529456424e-06, "loss": 2.7193, "step": 1331 }, { "epoch": 0.16, "learning_rate": 9.72356960581087e-06, "loss": 2.6253, "step": 1332 }, { "epoch": 0.16, "learning_rate": 9.72291092059085e-06, "loss": 2.5116, "step": 1333 }, { "epoch": 0.16, "learning_rate": 9.722251473902562e-06, "loss": 2.6533, "step": 1334 }, { "epoch": 0.16, "learning_rate": 9.721591265852326e-06, "loss": 2.6217, "step": 1335 }, { "epoch": 0.16, "learning_rate": 9.72093029654659e-06, "loss": 2.7431, "step": 1336 }, { "epoch": 0.16, "learning_rate": 9.720268566091915e-06, "loss": 2.5942, "step": 1337 }, { "epoch": 0.16, "learning_rate": 9.719606074594999e-06, "loss": 2.5996, "step": 1338 }, { "epoch": 0.16, "learning_rate": 9.718942822162646e-06, "loss": 2.5461, "step": 1339 }, { "epoch": 0.16, "learning_rate": 9.718278808901797e-06, "loss": 2.6276, "step": 1340 }, { "epoch": 0.16, "learning_rate": 9.717614034919509e-06, "loss": 2.6358, "step": 1341 }, { "epoch": 0.16, "learning_rate": 9.71694850032296e-06, "loss": 2.5685, "step": 1342 }, { "epoch": 0.16, "learning_rate": 9.716282205219457e-06, "loss": 2.7049, "step": 1343 }, { "epoch": 0.16, "learning_rate": 9.715615149716424e-06, "loss": 2.7119, "step": 1344 }, { "epoch": 0.16, "learning_rate": 9.714947333921407e-06, "loss": 2.4839, "step": 1345 }, { "epoch": 0.16, "learning_rate": 9.714278757942082e-06, "loss": 2.4821, "step": 1346 }, { "epoch": 0.16, "learning_rate": 9.71360942188624e-06, "loss": 2.7496, "step": 1347 }, { "epoch": 0.16, "learning_rate": 9.712939325861794e-06, "loss": 2.7042, "step": 1348 }, { "epoch": 0.16, "learning_rate": 9.712268469976789e-06, "loss": 2.4932, "step": 1349 }, { "epoch": 0.16, "learning_rate": 9.71159685433938e-06, "loss": 2.8221, "step": 1350 }, { "epoch": 0.16, "learning_rate": 9.710924479057855e-06, "loss": 2.5959, "step": 1351 }, { "epoch": 0.16, "learning_rate": 9.710251344240619e-06, "loss": 2.5959, "step": 1352 }, { "epoch": 0.16, "learning_rate": 9.709577449996199e-06, "loss": 2.6307, "step": 1353 }, { "epoch": 0.16, "learning_rate": 9.708902796433249e-06, "loss": 2.4944, "step": 1354 }, { "epoch": 0.16, "learning_rate": 9.708227383660538e-06, "loss": 2.5639, "step": 1355 }, { "epoch": 0.16, "learning_rate": 9.707551211786966e-06, "loss": 2.489, "step": 1356 }, { "epoch": 0.16, "learning_rate": 9.706874280921549e-06, "loss": 2.5778, "step": 1357 }, { "epoch": 0.16, "learning_rate": 9.70619659117343e-06, "loss": 2.6372, "step": 1358 }, { "epoch": 0.16, "learning_rate": 9.705518142651868e-06, "loss": 2.6256, "step": 1359 }, { "epoch": 0.16, "learning_rate": 9.704838935466251e-06, "loss": 2.8043, "step": 1360 }, { "epoch": 0.16, "learning_rate": 9.704158969726086e-06, "loss": 2.592, "step": 1361 }, { "epoch": 0.16, "learning_rate": 9.703478245541005e-06, "loss": 2.6031, "step": 1362 }, { "epoch": 0.16, "learning_rate": 9.702796763020757e-06, "loss": 2.6353, "step": 1363 }, { "epoch": 0.16, "learning_rate": 9.702114522275216e-06, "loss": 2.6636, "step": 1364 }, { "epoch": 0.16, "learning_rate": 9.701431523414382e-06, "loss": 2.371, "step": 1365 }, { "epoch": 0.16, "learning_rate": 9.700747766548373e-06, "loss": 2.7056, "step": 1366 }, { "epoch": 0.16, "learning_rate": 9.700063251787431e-06, "loss": 2.5786, "step": 1367 }, { "epoch": 0.16, "learning_rate": 9.699377979241915e-06, "loss": 2.5416, "step": 1368 }, { "epoch": 0.16, "learning_rate": 9.698691949022314e-06, "loss": 2.5366, "step": 1369 }, { "epoch": 0.16, "learning_rate": 9.698005161239237e-06, "loss": 2.5828, "step": 1370 }, { "epoch": 0.16, "learning_rate": 9.697317616003409e-06, "loss": 2.6523, "step": 1371 }, { "epoch": 0.16, "learning_rate": 9.696629313425688e-06, "loss": 2.6129, "step": 1372 }, { "epoch": 0.16, "learning_rate": 9.695940253617044e-06, "loss": 2.4794, "step": 1373 }, { "epoch": 0.17, "learning_rate": 9.695250436688573e-06, "loss": 2.5515, "step": 1374 }, { "epoch": 0.17, "learning_rate": 9.694559862751495e-06, "loss": 2.6366, "step": 1375 }, { "epoch": 0.17, "learning_rate": 9.69386853191715e-06, "loss": 2.7393, "step": 1376 }, { "epoch": 0.17, "learning_rate": 9.693176444296999e-06, "loss": 2.5332, "step": 1377 }, { "epoch": 0.17, "learning_rate": 9.692483600002626e-06, "loss": 2.4741, "step": 1378 }, { "epoch": 0.17, "learning_rate": 9.69178999914574e-06, "loss": 2.5597, "step": 1379 }, { "epoch": 0.17, "learning_rate": 9.691095641838168e-06, "loss": 2.6521, "step": 1380 }, { "epoch": 0.17, "learning_rate": 9.690400528191861e-06, "loss": 2.5744, "step": 1381 }, { "epoch": 0.17, "learning_rate": 9.689704658318888e-06, "loss": 2.6384, "step": 1382 }, { "epoch": 0.17, "learning_rate": 9.689008032331446e-06, "loss": 2.5182, "step": 1383 }, { "epoch": 0.17, "learning_rate": 9.688310650341852e-06, "loss": 2.6784, "step": 1384 }, { "epoch": 0.17, "learning_rate": 9.68761251246254e-06, "loss": 2.6287, "step": 1385 }, { "epoch": 0.17, "learning_rate": 9.686913618806073e-06, "loss": 2.7042, "step": 1386 }, { "epoch": 0.17, "learning_rate": 9.686213969485132e-06, "loss": 2.6248, "step": 1387 }, { "epoch": 0.17, "learning_rate": 9.685513564612521e-06, "loss": 2.7073, "step": 1388 }, { "epoch": 0.17, "learning_rate": 9.684812404301162e-06, "loss": 2.4783, "step": 1389 }, { "epoch": 0.17, "learning_rate": 9.684110488664107e-06, "loss": 2.4616, "step": 1390 }, { "epoch": 0.17, "learning_rate": 9.68340781781452e-06, "loss": 2.6964, "step": 1391 }, { "epoch": 0.17, "learning_rate": 9.682704391865697e-06, "loss": 2.6094, "step": 1392 }, { "epoch": 0.17, "learning_rate": 9.682000210931046e-06, "loss": 2.684, "step": 1393 }, { "epoch": 0.17, "learning_rate": 9.681295275124104e-06, "loss": 2.6348, "step": 1394 }, { "epoch": 0.17, "learning_rate": 9.680589584558521e-06, "loss": 2.6252, "step": 1395 }, { "epoch": 0.17, "learning_rate": 9.679883139348082e-06, "loss": 2.7184, "step": 1396 }, { "epoch": 0.17, "learning_rate": 9.679175939606683e-06, "loss": 2.5765, "step": 1397 }, { "epoch": 0.17, "learning_rate": 9.678467985448345e-06, "loss": 2.3808, "step": 1398 }, { "epoch": 0.17, "learning_rate": 9.67775927698721e-06, "loss": 2.6887, "step": 1399 }, { "epoch": 0.17, "learning_rate": 9.67704981433754e-06, "loss": 2.6965, "step": 1400 }, { "epoch": 0.17, "learning_rate": 9.676339597613726e-06, "loss": 2.5613, "step": 1401 }, { "epoch": 0.17, "learning_rate": 9.675628626930271e-06, "loss": 2.5554, "step": 1402 }, { "epoch": 0.17, "learning_rate": 9.674916902401805e-06, "loss": 2.5328, "step": 1403 }, { "epoch": 0.17, "learning_rate": 9.674204424143079e-06, "loss": 2.746, "step": 1404 }, { "epoch": 0.17, "learning_rate": 9.673491192268964e-06, "loss": 2.6315, "step": 1405 }, { "epoch": 0.17, "learning_rate": 9.672777206894452e-06, "loss": 2.3984, "step": 1406 }, { "epoch": 0.17, "learning_rate": 9.672062468134662e-06, "loss": 2.6085, "step": 1407 }, { "epoch": 0.17, "learning_rate": 9.671346976104828e-06, "loss": 2.7326, "step": 1408 }, { "epoch": 0.17, "learning_rate": 9.670630730920304e-06, "loss": 2.5899, "step": 1409 }, { "epoch": 0.17, "learning_rate": 9.669913732696577e-06, "loss": 2.6177, "step": 1410 }, { "epoch": 0.17, "learning_rate": 9.66919598154924e-06, "loss": 2.6628, "step": 1411 }, { "epoch": 0.17, "learning_rate": 9.668477477594021e-06, "loss": 2.7427, "step": 1412 }, { "epoch": 0.17, "learning_rate": 9.66775822094676e-06, "loss": 2.6795, "step": 1413 }, { "epoch": 0.17, "learning_rate": 9.66703821172342e-06, "loss": 2.623, "step": 1414 }, { "epoch": 0.17, "learning_rate": 9.666317450040093e-06, "loss": 2.4876, "step": 1415 }, { "epoch": 0.17, "learning_rate": 9.665595936012982e-06, "loss": 2.6778, "step": 1416 }, { "epoch": 0.17, "learning_rate": 9.664873669758415e-06, "loss": 2.588, "step": 1417 }, { "epoch": 0.17, "learning_rate": 9.664150651392846e-06, "loss": 2.5699, "step": 1418 }, { "epoch": 0.17, "learning_rate": 9.66342688103284e-06, "loss": 2.7762, "step": 1419 }, { "epoch": 0.17, "learning_rate": 9.662702358795098e-06, "loss": 2.3558, "step": 1420 }, { "epoch": 0.17, "learning_rate": 9.661977084796426e-06, "loss": 2.5766, "step": 1421 }, { "epoch": 0.17, "learning_rate": 9.661251059153762e-06, "loss": 2.6752, "step": 1422 }, { "epoch": 0.17, "learning_rate": 9.660524281984164e-06, "loss": 2.5678, "step": 1423 }, { "epoch": 0.17, "learning_rate": 9.659796753404806e-06, "loss": 2.6222, "step": 1424 }, { "epoch": 0.17, "learning_rate": 9.659068473532988e-06, "loss": 2.686, "step": 1425 }, { "epoch": 0.17, "learning_rate": 9.65833944248613e-06, "loss": 2.759, "step": 1426 }, { "epoch": 0.17, "learning_rate": 9.65760966038177e-06, "loss": 2.4977, "step": 1427 }, { "epoch": 0.17, "learning_rate": 9.656879127337571e-06, "loss": 2.4989, "step": 1428 }, { "epoch": 0.17, "learning_rate": 9.656147843471319e-06, "loss": 2.5743, "step": 1429 }, { "epoch": 0.17, "learning_rate": 9.655415808900915e-06, "loss": 2.6892, "step": 1430 }, { "epoch": 0.17, "learning_rate": 9.654683023744383e-06, "loss": 2.7186, "step": 1431 }, { "epoch": 0.17, "learning_rate": 9.65394948811987e-06, "loss": 2.5371, "step": 1432 }, { "epoch": 0.17, "learning_rate": 9.653215202145643e-06, "loss": 2.7226, "step": 1433 }, { "epoch": 0.17, "learning_rate": 9.65248016594009e-06, "loss": 2.4539, "step": 1434 }, { "epoch": 0.17, "learning_rate": 9.651744379621722e-06, "loss": 2.5593, "step": 1435 }, { "epoch": 0.17, "learning_rate": 9.651007843309164e-06, "loss": 2.5544, "step": 1436 }, { "epoch": 0.17, "learning_rate": 9.650270557121168e-06, "loss": 2.6385, "step": 1437 }, { "epoch": 0.17, "learning_rate": 9.64953252117661e-06, "loss": 2.5453, "step": 1438 }, { "epoch": 0.17, "learning_rate": 9.648793735594478e-06, "loss": 2.5724, "step": 1439 }, { "epoch": 0.17, "learning_rate": 9.648054200493887e-06, "loss": 2.7389, "step": 1440 }, { "epoch": 0.17, "learning_rate": 9.64731391599407e-06, "loss": 2.6903, "step": 1441 }, { "epoch": 0.17, "learning_rate": 9.646572882214385e-06, "loss": 2.6983, "step": 1442 }, { "epoch": 0.17, "learning_rate": 9.645831099274304e-06, "loss": 2.6395, "step": 1443 }, { "epoch": 0.17, "learning_rate": 9.645088567293426e-06, "loss": 2.5018, "step": 1444 }, { "epoch": 0.17, "learning_rate": 9.644345286391468e-06, "loss": 2.7372, "step": 1445 }, { "epoch": 0.17, "learning_rate": 9.643601256688267e-06, "loss": 2.4862, "step": 1446 }, { "epoch": 0.17, "learning_rate": 9.642856478303784e-06, "loss": 2.5152, "step": 1447 }, { "epoch": 0.17, "learning_rate": 9.642110951358097e-06, "loss": 2.5342, "step": 1448 }, { "epoch": 0.17, "learning_rate": 9.641364675971407e-06, "loss": 2.6705, "step": 1449 }, { "epoch": 0.17, "learning_rate": 9.640617652264033e-06, "loss": 2.6344, "step": 1450 }, { "epoch": 0.17, "learning_rate": 9.63986988035642e-06, "loss": 2.7042, "step": 1451 }, { "epoch": 0.17, "learning_rate": 9.639121360369127e-06, "loss": 2.6463, "step": 1452 }, { "epoch": 0.17, "learning_rate": 9.638372092422839e-06, "loss": 2.6987, "step": 1453 }, { "epoch": 0.17, "learning_rate": 9.637622076638358e-06, "loss": 2.6854, "step": 1454 }, { "epoch": 0.17, "learning_rate": 9.636871313136608e-06, "loss": 2.5133, "step": 1455 }, { "epoch": 0.17, "learning_rate": 9.636119802038634e-06, "loss": 2.6984, "step": 1456 }, { "epoch": 0.18, "learning_rate": 9.635367543465603e-06, "loss": 2.616, "step": 1457 }, { "epoch": 0.18, "learning_rate": 9.634614537538797e-06, "loss": 2.4556, "step": 1458 }, { "epoch": 0.18, "learning_rate": 9.633860784379624e-06, "loss": 2.6933, "step": 1459 }, { "epoch": 0.18, "learning_rate": 9.633106284109612e-06, "loss": 2.6485, "step": 1460 }, { "epoch": 0.18, "learning_rate": 9.632351036850404e-06, "loss": 2.6258, "step": 1461 }, { "epoch": 0.18, "learning_rate": 9.631595042723772e-06, "loss": 2.6719, "step": 1462 }, { "epoch": 0.18, "learning_rate": 9.6308383018516e-06, "loss": 2.4835, "step": 1463 }, { "epoch": 0.18, "learning_rate": 9.6300808143559e-06, "loss": 2.5818, "step": 1464 }, { "epoch": 0.18, "learning_rate": 9.629322580358796e-06, "loss": 2.6605, "step": 1465 }, { "epoch": 0.18, "learning_rate": 9.62856359998254e-06, "loss": 2.5854, "step": 1466 }, { "epoch": 0.18, "learning_rate": 9.627803873349503e-06, "loss": 2.6581, "step": 1467 }, { "epoch": 0.18, "learning_rate": 9.627043400582173e-06, "loss": 2.7113, "step": 1468 }, { "epoch": 0.18, "learning_rate": 9.626282181803158e-06, "loss": 2.5465, "step": 1469 }, { "epoch": 0.18, "learning_rate": 9.62552021713519e-06, "loss": 2.5895, "step": 1470 }, { "epoch": 0.18, "learning_rate": 9.624757506701118e-06, "loss": 2.5225, "step": 1471 }, { "epoch": 0.18, "learning_rate": 9.623994050623917e-06, "loss": 2.6917, "step": 1472 }, { "epoch": 0.18, "learning_rate": 9.623229849026674e-06, "loss": 2.6314, "step": 1473 }, { "epoch": 0.18, "learning_rate": 9.622464902032599e-06, "loss": 2.6384, "step": 1474 }, { "epoch": 0.18, "learning_rate": 9.621699209765028e-06, "loss": 2.6022, "step": 1475 }, { "epoch": 0.18, "learning_rate": 9.620932772347408e-06, "loss": 2.5904, "step": 1476 }, { "epoch": 0.18, "learning_rate": 9.620165589903313e-06, "loss": 2.6037, "step": 1477 }, { "epoch": 0.18, "learning_rate": 9.619397662556434e-06, "loss": 2.5978, "step": 1478 }, { "epoch": 0.18, "learning_rate": 9.618628990430585e-06, "loss": 2.6549, "step": 1479 }, { "epoch": 0.18, "learning_rate": 9.617859573649695e-06, "loss": 2.6927, "step": 1480 }, { "epoch": 0.18, "learning_rate": 9.617089412337817e-06, "loss": 2.5409, "step": 1481 }, { "epoch": 0.18, "learning_rate": 9.616318506619122e-06, "loss": 2.6058, "step": 1482 }, { "epoch": 0.18, "learning_rate": 9.615546856617903e-06, "loss": 2.503, "step": 1483 }, { "epoch": 0.18, "learning_rate": 9.614774462458573e-06, "loss": 2.6709, "step": 1484 }, { "epoch": 0.18, "learning_rate": 9.614001324265665e-06, "loss": 2.7324, "step": 1485 }, { "epoch": 0.18, "learning_rate": 9.613227442163826e-06, "loss": 2.4723, "step": 1486 }, { "epoch": 0.18, "learning_rate": 9.612452816277833e-06, "loss": 2.5892, "step": 1487 }, { "epoch": 0.18, "learning_rate": 9.611677446732576e-06, "loss": 2.6584, "step": 1488 }, { "epoch": 0.18, "learning_rate": 9.610901333653065e-06, "loss": 2.5884, "step": 1489 }, { "epoch": 0.18, "learning_rate": 9.610124477164436e-06, "loss": 2.4421, "step": 1490 }, { "epoch": 0.18, "learning_rate": 9.609346877391935e-06, "loss": 2.6581, "step": 1491 }, { "epoch": 0.18, "learning_rate": 9.608568534460938e-06, "loss": 2.518, "step": 1492 }, { "epoch": 0.18, "learning_rate": 9.607789448496932e-06, "loss": 2.7892, "step": 1493 }, { "epoch": 0.18, "learning_rate": 9.607009619625532e-06, "loss": 2.5812, "step": 1494 }, { "epoch": 0.18, "learning_rate": 9.606229047972465e-06, "loss": 2.7331, "step": 1495 }, { "epoch": 0.18, "learning_rate": 9.605447733663586e-06, "loss": 2.5899, "step": 1496 }, { "epoch": 0.18, "learning_rate": 9.60466567682486e-06, "loss": 2.6392, "step": 1497 }, { "epoch": 0.18, "learning_rate": 9.603882877582382e-06, "loss": 2.5432, "step": 1498 }, { "epoch": 0.18, "learning_rate": 9.603099336062357e-06, "loss": 2.5804, "step": 1499 }, { "epoch": 0.18, "learning_rate": 9.602315052391116e-06, "loss": 2.5907, "step": 1500 }, { "epoch": 0.18, "learning_rate": 9.601530026695109e-06, "loss": 2.5421, "step": 1501 }, { "epoch": 0.18, "learning_rate": 9.600744259100905e-06, "loss": 2.643, "step": 1502 }, { "epoch": 0.18, "learning_rate": 9.59995774973519e-06, "loss": 2.6593, "step": 1503 }, { "epoch": 0.18, "learning_rate": 9.599170498724772e-06, "loss": 2.5082, "step": 1504 }, { "epoch": 0.18, "learning_rate": 9.598382506196581e-06, "loss": 2.4918, "step": 1505 }, { "epoch": 0.18, "learning_rate": 9.597593772277662e-06, "loss": 2.7278, "step": 1506 }, { "epoch": 0.18, "learning_rate": 9.59680429709518e-06, "loss": 2.522, "step": 1507 }, { "epoch": 0.18, "learning_rate": 9.596014080776424e-06, "loss": 2.6042, "step": 1508 }, { "epoch": 0.18, "learning_rate": 9.595223123448796e-06, "loss": 2.5533, "step": 1509 }, { "epoch": 0.18, "learning_rate": 9.594431425239825e-06, "loss": 2.5438, "step": 1510 }, { "epoch": 0.18, "learning_rate": 9.593638986277154e-06, "loss": 2.4683, "step": 1511 }, { "epoch": 0.18, "learning_rate": 9.592845806688545e-06, "loss": 2.657, "step": 1512 }, { "epoch": 0.18, "learning_rate": 9.592051886601883e-06, "loss": 2.5805, "step": 1513 }, { "epoch": 0.18, "learning_rate": 9.59125722614517e-06, "loss": 2.7307, "step": 1514 }, { "epoch": 0.18, "learning_rate": 9.590461825446527e-06, "loss": 2.6306, "step": 1515 }, { "epoch": 0.18, "learning_rate": 9.589665684634197e-06, "loss": 2.562, "step": 1516 }, { "epoch": 0.18, "learning_rate": 9.58886880383654e-06, "loss": 2.4641, "step": 1517 }, { "epoch": 0.18, "learning_rate": 9.588071183182035e-06, "loss": 2.4935, "step": 1518 }, { "epoch": 0.18, "learning_rate": 9.587272822799283e-06, "loss": 2.4716, "step": 1519 }, { "epoch": 0.18, "learning_rate": 9.586473722817002e-06, "loss": 2.6376, "step": 1520 }, { "epoch": 0.18, "learning_rate": 9.58567388336403e-06, "loss": 2.7806, "step": 1521 }, { "epoch": 0.18, "learning_rate": 9.584873304569322e-06, "loss": 2.4493, "step": 1522 }, { "epoch": 0.18, "learning_rate": 9.584071986561958e-06, "loss": 2.7338, "step": 1523 }, { "epoch": 0.18, "learning_rate": 9.583269929471129e-06, "loss": 2.7047, "step": 1524 }, { "epoch": 0.18, "learning_rate": 9.582467133426153e-06, "loss": 2.7635, "step": 1525 }, { "epoch": 0.18, "learning_rate": 9.581663598556461e-06, "loss": 2.5728, "step": 1526 }, { "epoch": 0.18, "learning_rate": 9.580859324991607e-06, "loss": 2.6713, "step": 1527 }, { "epoch": 0.18, "learning_rate": 9.580054312861264e-06, "loss": 2.5567, "step": 1528 }, { "epoch": 0.18, "learning_rate": 9.579248562295222e-06, "loss": 2.7706, "step": 1529 }, { "epoch": 0.18, "learning_rate": 9.57844207342339e-06, "loss": 2.6388, "step": 1530 }, { "epoch": 0.18, "learning_rate": 9.577634846375798e-06, "loss": 2.6246, "step": 1531 }, { "epoch": 0.18, "learning_rate": 9.576826881282595e-06, "loss": 2.7485, "step": 1532 }, { "epoch": 0.18, "learning_rate": 9.576018178274047e-06, "loss": 2.6885, "step": 1533 }, { "epoch": 0.18, "learning_rate": 9.57520873748054e-06, "loss": 2.585, "step": 1534 }, { "epoch": 0.18, "learning_rate": 9.574398559032579e-06, "loss": 2.5497, "step": 1535 }, { "epoch": 0.18, "learning_rate": 9.573587643060788e-06, "loss": 2.4683, "step": 1536 }, { "epoch": 0.18, "learning_rate": 9.57277598969591e-06, "loss": 2.623, "step": 1537 }, { "epoch": 0.18, "learning_rate": 9.571963599068807e-06, "loss": 2.6493, "step": 1538 }, { "epoch": 0.18, "learning_rate": 9.571150471310459e-06, "loss": 2.5531, "step": 1539 }, { "epoch": 0.19, "learning_rate": 9.570336606551966e-06, "loss": 2.5747, "step": 1540 }, { "epoch": 0.19, "learning_rate": 9.569522004924547e-06, "loss": 2.5166, "step": 1541 }, { "epoch": 0.19, "learning_rate": 9.568706666559537e-06, "loss": 2.5962, "step": 1542 }, { "epoch": 0.19, "learning_rate": 9.567890591588393e-06, "loss": 2.6826, "step": 1543 }, { "epoch": 0.19, "learning_rate": 9.56707378014269e-06, "loss": 2.5252, "step": 1544 }, { "epoch": 0.19, "learning_rate": 9.56625623235412e-06, "loss": 2.7067, "step": 1545 }, { "epoch": 0.19, "learning_rate": 9.565437948354498e-06, "loss": 2.7468, "step": 1546 }, { "epoch": 0.19, "learning_rate": 9.56461892827575e-06, "loss": 2.7205, "step": 1547 }, { "epoch": 0.19, "learning_rate": 9.56379917224993e-06, "loss": 2.5395, "step": 1548 }, { "epoch": 0.19, "learning_rate": 9.562978680409204e-06, "loss": 2.6991, "step": 1549 }, { "epoch": 0.19, "learning_rate": 9.56215745288586e-06, "loss": 2.7441, "step": 1550 }, { "epoch": 0.19, "learning_rate": 9.561335489812301e-06, "loss": 2.6663, "step": 1551 }, { "epoch": 0.19, "learning_rate": 9.560512791321053e-06, "loss": 2.6246, "step": 1552 }, { "epoch": 0.19, "learning_rate": 9.559689357544756e-06, "loss": 2.6095, "step": 1553 }, { "epoch": 0.19, "learning_rate": 9.558865188616177e-06, "loss": 2.5742, "step": 1554 }, { "epoch": 0.19, "learning_rate": 9.558040284668189e-06, "loss": 2.6222, "step": 1555 }, { "epoch": 0.19, "learning_rate": 9.557214645833792e-06, "loss": 2.6949, "step": 1556 }, { "epoch": 0.19, "learning_rate": 9.556388272246104e-06, "loss": 2.6171, "step": 1557 }, { "epoch": 0.19, "learning_rate": 9.555561164038361e-06, "loss": 2.7241, "step": 1558 }, { "epoch": 0.19, "learning_rate": 9.554733321343913e-06, "loss": 2.6961, "step": 1559 }, { "epoch": 0.19, "learning_rate": 9.553904744296232e-06, "loss": 2.5286, "step": 1560 }, { "epoch": 0.19, "learning_rate": 9.553075433028913e-06, "loss": 2.5792, "step": 1561 }, { "epoch": 0.19, "learning_rate": 9.55224538767566e-06, "loss": 2.6807, "step": 1562 }, { "epoch": 0.19, "learning_rate": 9.551414608370303e-06, "loss": 2.8158, "step": 1563 }, { "epoch": 0.19, "learning_rate": 9.550583095246786e-06, "loss": 2.6429, "step": 1564 }, { "epoch": 0.19, "learning_rate": 9.549750848439172e-06, "loss": 2.6286, "step": 1565 }, { "epoch": 0.19, "learning_rate": 9.548917868081644e-06, "loss": 2.4178, "step": 1566 }, { "epoch": 0.19, "learning_rate": 9.5480841543085e-06, "loss": 2.5774, "step": 1567 }, { "epoch": 0.19, "learning_rate": 9.547249707254166e-06, "loss": 2.7037, "step": 1568 }, { "epoch": 0.19, "learning_rate": 9.546414527053167e-06, "loss": 2.5711, "step": 1569 }, { "epoch": 0.19, "learning_rate": 9.545578613840168e-06, "loss": 2.6101, "step": 1570 }, { "epoch": 0.19, "learning_rate": 9.544741967749937e-06, "loss": 2.5438, "step": 1571 }, { "epoch": 0.19, "learning_rate": 9.543904588917366e-06, "loss": 2.5924, "step": 1572 }, { "epoch": 0.19, "learning_rate": 9.543066477477467e-06, "loss": 2.6435, "step": 1573 }, { "epoch": 0.19, "learning_rate": 9.542227633565364e-06, "loss": 2.607, "step": 1574 }, { "epoch": 0.19, "learning_rate": 9.541388057316302e-06, "loss": 2.6511, "step": 1575 }, { "epoch": 0.19, "learning_rate": 9.54054774886565e-06, "loss": 2.6576, "step": 1576 }, { "epoch": 0.19, "learning_rate": 9.539706708348886e-06, "loss": 2.5765, "step": 1577 }, { "epoch": 0.19, "learning_rate": 9.53886493590161e-06, "loss": 2.6457, "step": 1578 }, { "epoch": 0.19, "learning_rate": 9.538022431659541e-06, "loss": 2.7188, "step": 1579 }, { "epoch": 0.19, "learning_rate": 9.537179195758513e-06, "loss": 2.7571, "step": 1580 }, { "epoch": 0.19, "learning_rate": 9.53633522833448e-06, "loss": 2.5843, "step": 1581 }, { "epoch": 0.19, "learning_rate": 9.535490529523514e-06, "loss": 2.5458, "step": 1582 }, { "epoch": 0.19, "learning_rate": 9.534645099461805e-06, "loss": 2.5623, "step": 1583 }, { "epoch": 0.19, "learning_rate": 9.533798938285663e-06, "loss": 2.5564, "step": 1584 }, { "epoch": 0.19, "learning_rate": 9.532952046131507e-06, "loss": 2.6347, "step": 1585 }, { "epoch": 0.19, "learning_rate": 9.532104423135885e-06, "loss": 2.6198, "step": 1586 }, { "epoch": 0.19, "learning_rate": 9.531256069435459e-06, "loss": 2.5483, "step": 1587 }, { "epoch": 0.19, "learning_rate": 9.530406985167005e-06, "loss": 2.5712, "step": 1588 }, { "epoch": 0.19, "learning_rate": 9.52955717046742e-06, "loss": 2.6821, "step": 1589 }, { "epoch": 0.19, "learning_rate": 9.52870662547372e-06, "loss": 2.4305, "step": 1590 }, { "epoch": 0.19, "learning_rate": 9.527855350323035e-06, "loss": 2.56, "step": 1591 }, { "epoch": 0.19, "learning_rate": 9.527003345152616e-06, "loss": 2.3647, "step": 1592 }, { "epoch": 0.19, "learning_rate": 9.526150610099831e-06, "loss": 2.711, "step": 1593 }, { "epoch": 0.19, "learning_rate": 9.525297145302167e-06, "loss": 2.6373, "step": 1594 }, { "epoch": 0.19, "learning_rate": 9.524442950897221e-06, "loss": 2.463, "step": 1595 }, { "epoch": 0.19, "learning_rate": 9.523588027022721e-06, "loss": 2.5171, "step": 1596 }, { "epoch": 0.19, "learning_rate": 9.522732373816499e-06, "loss": 2.5808, "step": 1597 }, { "epoch": 0.19, "learning_rate": 9.521875991416514e-06, "loss": 2.6144, "step": 1598 }, { "epoch": 0.19, "learning_rate": 9.52101887996084e-06, "loss": 2.778, "step": 1599 }, { "epoch": 0.19, "learning_rate": 9.520161039587666e-06, "loss": 2.7144, "step": 1600 }, { "epoch": 0.19, "learning_rate": 9.519302470435298e-06, "loss": 2.7252, "step": 1601 }, { "epoch": 0.19, "learning_rate": 9.518443172642168e-06, "loss": 2.4493, "step": 1602 }, { "epoch": 0.19, "learning_rate": 9.517583146346816e-06, "loss": 2.7483, "step": 1603 }, { "epoch": 0.19, "learning_rate": 9.516722391687903e-06, "loss": 2.5071, "step": 1604 }, { "epoch": 0.19, "learning_rate": 9.515860908804206e-06, "loss": 2.7041, "step": 1605 }, { "epoch": 0.19, "learning_rate": 9.514998697834623e-06, "loss": 2.6237, "step": 1606 }, { "epoch": 0.19, "learning_rate": 9.514135758918166e-06, "loss": 2.5838, "step": 1607 }, { "epoch": 0.19, "learning_rate": 9.513272092193965e-06, "loss": 2.4795, "step": 1608 }, { "epoch": 0.19, "learning_rate": 9.512407697801268e-06, "loss": 2.6168, "step": 1609 }, { "epoch": 0.19, "learning_rate": 9.51154257587944e-06, "loss": 2.5734, "step": 1610 }, { "epoch": 0.19, "learning_rate": 9.510676726567965e-06, "loss": 2.8275, "step": 1611 }, { "epoch": 0.19, "learning_rate": 9.50981015000644e-06, "loss": 2.4319, "step": 1612 }, { "epoch": 0.19, "learning_rate": 9.508942846334585e-06, "loss": 2.5992, "step": 1613 }, { "epoch": 0.19, "learning_rate": 9.508074815692232e-06, "loss": 2.5862, "step": 1614 }, { "epoch": 0.19, "learning_rate": 9.507206058219332e-06, "loss": 2.4351, "step": 1615 }, { "epoch": 0.19, "learning_rate": 9.506336574055954e-06, "loss": 2.6975, "step": 1616 }, { "epoch": 0.19, "learning_rate": 9.505466363342283e-06, "loss": 2.4826, "step": 1617 }, { "epoch": 0.19, "learning_rate": 9.504595426218626e-06, "loss": 2.7028, "step": 1618 }, { "epoch": 0.19, "learning_rate": 9.503723762825397e-06, "loss": 2.6407, "step": 1619 }, { "epoch": 0.19, "learning_rate": 9.502851373303137e-06, "loss": 2.6229, "step": 1620 }, { "epoch": 0.19, "learning_rate": 9.5019782577925e-06, "loss": 2.5398, "step": 1621 }, { "epoch": 0.19, "learning_rate": 9.501104416434255e-06, "loss": 2.6138, "step": 1622 }, { "epoch": 0.19, "learning_rate": 9.500229849369291e-06, "loss": 2.5243, "step": 1623 }, { "epoch": 0.2, "learning_rate": 9.499354556738615e-06, "loss": 2.6005, "step": 1624 }, { "epoch": 0.2, "learning_rate": 9.498478538683346e-06, "loss": 2.4422, "step": 1625 }, { "epoch": 0.2, "learning_rate": 9.497601795344728e-06, "loss": 2.7324, "step": 1626 }, { "epoch": 0.2, "learning_rate": 9.496724326864111e-06, "loss": 2.6163, "step": 1627 }, { "epoch": 0.2, "learning_rate": 9.495846133382973e-06, "loss": 2.5485, "step": 1628 }, { "epoch": 0.2, "learning_rate": 9.494967215042901e-06, "loss": 2.6753, "step": 1629 }, { "epoch": 0.2, "learning_rate": 9.494087571985604e-06, "loss": 2.7141, "step": 1630 }, { "epoch": 0.2, "learning_rate": 9.493207204352902e-06, "loss": 2.6547, "step": 1631 }, { "epoch": 0.2, "learning_rate": 9.49232611228674e-06, "loss": 2.5318, "step": 1632 }, { "epoch": 0.2, "learning_rate": 9.49144429592917e-06, "loss": 2.6309, "step": 1633 }, { "epoch": 0.2, "learning_rate": 9.490561755422374e-06, "loss": 2.6446, "step": 1634 }, { "epoch": 0.2, "learning_rate": 9.489678490908634e-06, "loss": 2.7225, "step": 1635 }, { "epoch": 0.2, "learning_rate": 9.488794502530361e-06, "loss": 2.5662, "step": 1636 }, { "epoch": 0.2, "learning_rate": 9.487909790430081e-06, "loss": 2.4752, "step": 1637 }, { "epoch": 0.2, "learning_rate": 9.487024354750434e-06, "loss": 2.5272, "step": 1638 }, { "epoch": 0.2, "learning_rate": 9.486138195634176e-06, "loss": 2.5857, "step": 1639 }, { "epoch": 0.2, "learning_rate": 9.485251313224181e-06, "loss": 2.5848, "step": 1640 }, { "epoch": 0.2, "learning_rate": 9.484363707663443e-06, "loss": 2.4172, "step": 1641 }, { "epoch": 0.2, "learning_rate": 9.483475379095066e-06, "loss": 2.7155, "step": 1642 }, { "epoch": 0.2, "learning_rate": 9.482586327662276e-06, "loss": 2.5455, "step": 1643 }, { "epoch": 0.2, "learning_rate": 9.481696553508411e-06, "loss": 2.6111, "step": 1644 }, { "epoch": 0.2, "learning_rate": 9.48080605677693e-06, "loss": 2.4677, "step": 1645 }, { "epoch": 0.2, "learning_rate": 9.479914837611409e-06, "loss": 2.6357, "step": 1646 }, { "epoch": 0.2, "learning_rate": 9.479022896155532e-06, "loss": 2.5689, "step": 1647 }, { "epoch": 0.2, "learning_rate": 9.478130232553111e-06, "loss": 2.702, "step": 1648 }, { "epoch": 0.2, "learning_rate": 9.477236846948068e-06, "loss": 2.6484, "step": 1649 }, { "epoch": 0.2, "learning_rate": 9.476342739484438e-06, "loss": 2.4815, "step": 1650 }, { "epoch": 0.2, "learning_rate": 9.47544791030638e-06, "loss": 2.5919, "step": 1651 }, { "epoch": 0.2, "learning_rate": 9.474552359558167e-06, "loss": 2.6211, "step": 1652 }, { "epoch": 0.2, "learning_rate": 9.473656087384186e-06, "loss": 2.5475, "step": 1653 }, { "epoch": 0.2, "learning_rate": 9.472759093928942e-06, "loss": 2.4485, "step": 1654 }, { "epoch": 0.2, "learning_rate": 9.471861379337054e-06, "loss": 2.4919, "step": 1655 }, { "epoch": 0.2, "learning_rate": 9.470962943753263e-06, "loss": 2.6224, "step": 1656 }, { "epoch": 0.2, "learning_rate": 9.470063787322418e-06, "loss": 2.545, "step": 1657 }, { "epoch": 0.2, "learning_rate": 9.469163910189494e-06, "loss": 2.5292, "step": 1658 }, { "epoch": 0.2, "learning_rate": 9.468263312499574e-06, "loss": 2.6412, "step": 1659 }, { "epoch": 0.2, "learning_rate": 9.46736199439786e-06, "loss": 2.4453, "step": 1660 }, { "epoch": 0.2, "learning_rate": 9.46645995602967e-06, "loss": 2.554, "step": 1661 }, { "epoch": 0.2, "learning_rate": 9.465557197540438e-06, "loss": 2.7085, "step": 1662 }, { "epoch": 0.2, "learning_rate": 9.464653719075718e-06, "loss": 2.5804, "step": 1663 }, { "epoch": 0.2, "learning_rate": 9.463749520781172e-06, "loss": 2.5613, "step": 1664 }, { "epoch": 0.2, "learning_rate": 9.462844602802585e-06, "loss": 2.5723, "step": 1665 }, { "epoch": 0.2, "learning_rate": 9.461938965285856e-06, "loss": 2.662, "step": 1666 }, { "epoch": 0.2, "learning_rate": 9.461032608376997e-06, "loss": 2.7024, "step": 1667 }, { "epoch": 0.2, "learning_rate": 9.460125532222142e-06, "loss": 2.6135, "step": 1668 }, { "epoch": 0.2, "learning_rate": 9.459217736967535e-06, "loss": 2.579, "step": 1669 }, { "epoch": 0.2, "learning_rate": 9.458309222759542e-06, "loss": 2.5759, "step": 1670 }, { "epoch": 0.2, "learning_rate": 9.457399989744635e-06, "loss": 2.59, "step": 1671 }, { "epoch": 0.2, "learning_rate": 9.456490038069417e-06, "loss": 2.5522, "step": 1672 }, { "epoch": 0.2, "learning_rate": 9.45557936788059e-06, "loss": 2.5628, "step": 1673 }, { "epoch": 0.2, "learning_rate": 9.454667979324987e-06, "loss": 2.6187, "step": 1674 }, { "epoch": 0.2, "learning_rate": 9.453755872549545e-06, "loss": 2.4746, "step": 1675 }, { "epoch": 0.2, "learning_rate": 9.452843047701324e-06, "loss": 2.6569, "step": 1676 }, { "epoch": 0.2, "learning_rate": 9.451929504927496e-06, "loss": 2.7459, "step": 1677 }, { "epoch": 0.2, "learning_rate": 9.451015244375352e-06, "loss": 2.5345, "step": 1678 }, { "epoch": 0.2, "learning_rate": 9.450100266192295e-06, "loss": 2.5932, "step": 1679 }, { "epoch": 0.2, "learning_rate": 9.449184570525847e-06, "loss": 2.6893, "step": 1680 }, { "epoch": 0.2, "learning_rate": 9.448268157523645e-06, "loss": 2.7194, "step": 1681 }, { "epoch": 0.2, "learning_rate": 9.44735102733344e-06, "loss": 2.8082, "step": 1682 }, { "epoch": 0.2, "learning_rate": 9.446433180103098e-06, "loss": 2.4355, "step": 1683 }, { "epoch": 0.2, "learning_rate": 9.445514615980604e-06, "loss": 2.5808, "step": 1684 }, { "epoch": 0.2, "learning_rate": 9.444595335114058e-06, "loss": 2.5742, "step": 1685 }, { "epoch": 0.2, "learning_rate": 9.44367533765167e-06, "loss": 2.478, "step": 1686 }, { "epoch": 0.2, "learning_rate": 9.442754623741775e-06, "loss": 2.6777, "step": 1687 }, { "epoch": 0.2, "learning_rate": 9.441833193532817e-06, "loss": 2.7856, "step": 1688 }, { "epoch": 0.2, "learning_rate": 9.440911047173355e-06, "loss": 2.7012, "step": 1689 }, { "epoch": 0.2, "learning_rate": 9.439988184812065e-06, "loss": 2.5071, "step": 1690 }, { "epoch": 0.2, "learning_rate": 9.439064606597743e-06, "loss": 2.4894, "step": 1691 }, { "epoch": 0.2, "learning_rate": 9.438140312679292e-06, "loss": 2.561, "step": 1692 }, { "epoch": 0.2, "learning_rate": 9.437215303205736e-06, "loss": 2.85, "step": 1693 }, { "epoch": 0.2, "learning_rate": 9.436289578326215e-06, "loss": 2.5594, "step": 1694 }, { "epoch": 0.2, "learning_rate": 9.435363138189976e-06, "loss": 2.6036, "step": 1695 }, { "epoch": 0.2, "learning_rate": 9.434435982946397e-06, "loss": 2.5689, "step": 1696 }, { "epoch": 0.2, "learning_rate": 9.433508112744953e-06, "loss": 2.6231, "step": 1697 }, { "epoch": 0.2, "learning_rate": 9.432579527735251e-06, "loss": 2.4876, "step": 1698 }, { "epoch": 0.2, "learning_rate": 9.431650228066999e-06, "loss": 2.5626, "step": 1699 }, { "epoch": 0.2, "learning_rate": 9.43072021389003e-06, "loss": 2.6454, "step": 1700 }, { "epoch": 0.2, "learning_rate": 9.429789485354287e-06, "loss": 2.5638, "step": 1701 }, { "epoch": 0.2, "learning_rate": 9.428858042609832e-06, "loss": 2.7173, "step": 1702 }, { "epoch": 0.2, "learning_rate": 9.42792588580684e-06, "loss": 2.7663, "step": 1703 }, { "epoch": 0.2, "learning_rate": 9.4269930150956e-06, "loss": 2.6596, "step": 1704 }, { "epoch": 0.2, "learning_rate": 9.426059430626518e-06, "loss": 2.6069, "step": 1705 }, { "epoch": 0.2, "learning_rate": 9.425125132550115e-06, "loss": 2.4881, "step": 1706 }, { "epoch": 0.21, "learning_rate": 9.424190121017027e-06, "loss": 2.6046, "step": 1707 }, { "epoch": 0.21, "learning_rate": 9.423254396178003e-06, "loss": 2.5127, "step": 1708 }, { "epoch": 0.21, "learning_rate": 9.422317958183908e-06, "loss": 2.6742, "step": 1709 }, { "epoch": 0.21, "learning_rate": 9.421380807185727e-06, "loss": 2.5407, "step": 1710 }, { "epoch": 0.21, "learning_rate": 9.420442943334551e-06, "loss": 2.5994, "step": 1711 }, { "epoch": 0.21, "learning_rate": 9.419504366781591e-06, "loss": 2.6025, "step": 1712 }, { "epoch": 0.21, "learning_rate": 9.418565077678174e-06, "loss": 2.7089, "step": 1713 }, { "epoch": 0.21, "learning_rate": 9.417625076175741e-06, "loss": 2.5048, "step": 1714 }, { "epoch": 0.21, "learning_rate": 9.416684362425846e-06, "loss": 2.5556, "step": 1715 }, { "epoch": 0.21, "learning_rate": 9.415742936580156e-06, "loss": 2.5666, "step": 1716 }, { "epoch": 0.21, "learning_rate": 9.41480079879046e-06, "loss": 2.5515, "step": 1717 }, { "epoch": 0.21, "learning_rate": 9.413857949208655e-06, "loss": 2.7239, "step": 1718 }, { "epoch": 0.21, "learning_rate": 9.412914387986758e-06, "loss": 2.4883, "step": 1719 }, { "epoch": 0.21, "learning_rate": 9.411970115276897e-06, "loss": 2.6383, "step": 1720 }, { "epoch": 0.21, "learning_rate": 9.411025131231313e-06, "loss": 2.5343, "step": 1721 }, { "epoch": 0.21, "learning_rate": 9.410079436002367e-06, "loss": 2.6647, "step": 1722 }, { "epoch": 0.21, "learning_rate": 9.409133029742532e-06, "loss": 2.539, "step": 1723 }, { "epoch": 0.21, "learning_rate": 9.408185912604395e-06, "loss": 2.6446, "step": 1724 }, { "epoch": 0.21, "learning_rate": 9.407238084740658e-06, "loss": 2.4825, "step": 1725 }, { "epoch": 0.21, "learning_rate": 9.40628954630414e-06, "loss": 2.5409, "step": 1726 }, { "epoch": 0.21, "learning_rate": 9.405340297447772e-06, "loss": 2.647, "step": 1727 }, { "epoch": 0.21, "learning_rate": 9.404390338324599e-06, "loss": 2.5909, "step": 1728 }, { "epoch": 0.21, "learning_rate": 9.40343966908778e-06, "loss": 2.7705, "step": 1729 }, { "epoch": 0.21, "learning_rate": 9.402488289890593e-06, "loss": 2.544, "step": 1730 }, { "epoch": 0.21, "learning_rate": 9.401536200886426e-06, "loss": 2.6641, "step": 1731 }, { "epoch": 0.21, "learning_rate": 9.400583402228785e-06, "loss": 2.5942, "step": 1732 }, { "epoch": 0.21, "learning_rate": 9.399629894071285e-06, "loss": 2.8705, "step": 1733 }, { "epoch": 0.21, "learning_rate": 9.398675676567662e-06, "loss": 2.5475, "step": 1734 }, { "epoch": 0.21, "learning_rate": 9.39772074987176e-06, "loss": 2.6146, "step": 1735 }, { "epoch": 0.21, "learning_rate": 9.396765114137544e-06, "loss": 2.5474, "step": 1736 }, { "epoch": 0.21, "learning_rate": 9.395808769519086e-06, "loss": 2.6273, "step": 1737 }, { "epoch": 0.21, "learning_rate": 9.394851716170582e-06, "loss": 2.3296, "step": 1738 }, { "epoch": 0.21, "learning_rate": 9.393893954246328e-06, "loss": 2.5264, "step": 1739 }, { "epoch": 0.21, "learning_rate": 9.39293548390075e-06, "loss": 2.5208, "step": 1740 }, { "epoch": 0.21, "learning_rate": 9.391976305288376e-06, "loss": 2.5311, "step": 1741 }, { "epoch": 0.21, "learning_rate": 9.391016418563856e-06, "loss": 2.5949, "step": 1742 }, { "epoch": 0.21, "learning_rate": 9.39005582388195e-06, "loss": 2.664, "step": 1743 }, { "epoch": 0.21, "learning_rate": 9.389094521397532e-06, "loss": 2.6469, "step": 1744 }, { "epoch": 0.21, "learning_rate": 9.388132511265594e-06, "loss": 2.3803, "step": 1745 }, { "epoch": 0.21, "learning_rate": 9.38716979364124e-06, "loss": 2.815, "step": 1746 }, { "epoch": 0.21, "learning_rate": 9.386206368679684e-06, "loss": 2.6434, "step": 1747 }, { "epoch": 0.21, "learning_rate": 9.385242236536259e-06, "loss": 2.6816, "step": 1748 }, { "epoch": 0.21, "learning_rate": 9.384277397366413e-06, "loss": 2.6157, "step": 1749 }, { "epoch": 0.21, "learning_rate": 9.383311851325702e-06, "loss": 2.6216, "step": 1750 }, { "epoch": 0.21, "learning_rate": 9.382345598569805e-06, "loss": 2.6737, "step": 1751 }, { "epoch": 0.21, "learning_rate": 9.381378639254504e-06, "loss": 2.5271, "step": 1752 }, { "epoch": 0.21, "learning_rate": 9.380410973535702e-06, "loss": 2.7343, "step": 1753 }, { "epoch": 0.21, "learning_rate": 9.379442601569415e-06, "loss": 2.5608, "step": 1754 }, { "epoch": 0.21, "learning_rate": 9.378473523511774e-06, "loss": 2.623, "step": 1755 }, { "epoch": 0.21, "learning_rate": 9.377503739519019e-06, "loss": 2.709, "step": 1756 }, { "epoch": 0.21, "learning_rate": 9.37653324974751e-06, "loss": 2.7383, "step": 1757 }, { "epoch": 0.21, "learning_rate": 9.375562054353714e-06, "loss": 2.6502, "step": 1758 }, { "epoch": 0.21, "learning_rate": 9.37459015349422e-06, "loss": 2.6749, "step": 1759 }, { "epoch": 0.21, "learning_rate": 9.37361754732572e-06, "loss": 2.725, "step": 1760 }, { "epoch": 0.21, "learning_rate": 9.37264423600503e-06, "loss": 2.5349, "step": 1761 }, { "epoch": 0.21, "learning_rate": 9.371670219689077e-06, "loss": 2.5546, "step": 1762 }, { "epoch": 0.21, "learning_rate": 9.370695498534898e-06, "loss": 2.5613, "step": 1763 }, { "epoch": 0.21, "learning_rate": 9.369720072699648e-06, "loss": 2.5287, "step": 1764 }, { "epoch": 0.21, "learning_rate": 9.36874394234059e-06, "loss": 2.6847, "step": 1765 }, { "epoch": 0.21, "learning_rate": 9.367767107615106e-06, "loss": 2.6523, "step": 1766 }, { "epoch": 0.21, "learning_rate": 9.36678956868069e-06, "loss": 2.7404, "step": 1767 }, { "epoch": 0.21, "learning_rate": 9.365811325694949e-06, "loss": 2.6472, "step": 1768 }, { "epoch": 0.21, "learning_rate": 9.364832378815602e-06, "loss": 2.4614, "step": 1769 }, { "epoch": 0.21, "learning_rate": 9.363852728200488e-06, "loss": 2.5167, "step": 1770 }, { "epoch": 0.21, "learning_rate": 9.36287237400755e-06, "loss": 2.7275, "step": 1771 }, { "epoch": 0.21, "learning_rate": 9.36189131639485e-06, "loss": 2.6802, "step": 1772 }, { "epoch": 0.21, "learning_rate": 9.360909555520565e-06, "loss": 2.7541, "step": 1773 }, { "epoch": 0.21, "learning_rate": 9.35992709154298e-06, "loss": 2.5189, "step": 1774 }, { "epoch": 0.21, "learning_rate": 9.358943924620498e-06, "loss": 2.5649, "step": 1775 }, { "epoch": 0.21, "learning_rate": 9.357960054911633e-06, "loss": 2.5926, "step": 1776 }, { "epoch": 0.21, "learning_rate": 9.356975482575013e-06, "loss": 2.5905, "step": 1777 }, { "epoch": 0.21, "learning_rate": 9.355990207769378e-06, "loss": 2.7679, "step": 1778 }, { "epoch": 0.21, "learning_rate": 9.355004230653586e-06, "loss": 2.4523, "step": 1779 }, { "epoch": 0.21, "learning_rate": 9.354017551386599e-06, "loss": 2.6743, "step": 1780 }, { "epoch": 0.21, "learning_rate": 9.353030170127505e-06, "loss": 2.5748, "step": 1781 }, { "epoch": 0.21, "learning_rate": 9.352042087035491e-06, "loss": 2.5235, "step": 1782 }, { "epoch": 0.21, "learning_rate": 9.351053302269871e-06, "loss": 2.5453, "step": 1783 }, { "epoch": 0.21, "learning_rate": 9.35006381599006e-06, "loss": 2.8055, "step": 1784 }, { "epoch": 0.21, "learning_rate": 9.349073628355593e-06, "loss": 2.5441, "step": 1785 }, { "epoch": 0.21, "learning_rate": 9.348082739526116e-06, "loss": 2.569, "step": 1786 }, { "epoch": 0.21, "learning_rate": 9.347091149661392e-06, "loss": 2.5793, "step": 1787 }, { "epoch": 0.21, "learning_rate": 9.346098858921292e-06, "loss": 2.5131, "step": 1788 }, { "epoch": 0.21, "learning_rate": 9.345105867465798e-06, "loss": 2.6083, "step": 1789 }, { "epoch": 0.22, "learning_rate": 9.344112175455013e-06, "loss": 2.5978, "step": 1790 }, { "epoch": 0.22, "learning_rate": 9.343117783049148e-06, "loss": 2.5766, "step": 1791 }, { "epoch": 0.22, "learning_rate": 9.342122690408526e-06, "loss": 2.5388, "step": 1792 }, { "epoch": 0.22, "learning_rate": 9.341126897693583e-06, "loss": 2.6094, "step": 1793 }, { "epoch": 0.22, "learning_rate": 9.340130405064873e-06, "loss": 2.459, "step": 1794 }, { "epoch": 0.22, "learning_rate": 9.339133212683058e-06, "loss": 2.5272, "step": 1795 }, { "epoch": 0.22, "learning_rate": 9.338135320708912e-06, "loss": 2.4644, "step": 1796 }, { "epoch": 0.22, "learning_rate": 9.337136729303324e-06, "loss": 2.7315, "step": 1797 }, { "epoch": 0.22, "learning_rate": 9.336137438627299e-06, "loss": 2.7504, "step": 1798 }, { "epoch": 0.22, "learning_rate": 9.335137448841947e-06, "loss": 2.6567, "step": 1799 }, { "epoch": 0.22, "learning_rate": 9.334136760108496e-06, "loss": 2.6186, "step": 1800 }, { "epoch": 0.22, "learning_rate": 9.333135372588287e-06, "loss": 2.6296, "step": 1801 }, { "epoch": 0.22, "learning_rate": 9.332133286442772e-06, "loss": 2.8078, "step": 1802 }, { "epoch": 0.22, "learning_rate": 9.331130501833516e-06, "loss": 2.5569, "step": 1803 }, { "epoch": 0.22, "learning_rate": 9.330127018922195e-06, "loss": 2.5636, "step": 1804 }, { "epoch": 0.22, "learning_rate": 9.329122837870599e-06, "loss": 2.701, "step": 1805 }, { "epoch": 0.22, "learning_rate": 9.328117958840632e-06, "loss": 2.6382, "step": 1806 }, { "epoch": 0.22, "learning_rate": 9.327112381994312e-06, "loss": 2.7414, "step": 1807 }, { "epoch": 0.22, "learning_rate": 9.326106107493762e-06, "loss": 2.7015, "step": 1808 }, { "epoch": 0.22, "learning_rate": 9.325099135501223e-06, "loss": 2.4536, "step": 1809 }, { "epoch": 0.22, "learning_rate": 9.324091466179051e-06, "loss": 2.4581, "step": 1810 }, { "epoch": 0.22, "learning_rate": 9.323083099689705e-06, "loss": 2.5679, "step": 1811 }, { "epoch": 0.22, "learning_rate": 9.32207403619577e-06, "loss": 2.9358, "step": 1812 }, { "epoch": 0.22, "learning_rate": 9.32106427585993e-06, "loss": 2.6042, "step": 1813 }, { "epoch": 0.22, "learning_rate": 9.32005381884499e-06, "loss": 2.6182, "step": 1814 }, { "epoch": 0.22, "learning_rate": 9.319042665313865e-06, "loss": 2.6229, "step": 1815 }, { "epoch": 0.22, "learning_rate": 9.318030815429579e-06, "loss": 2.5722, "step": 1816 }, { "epoch": 0.22, "learning_rate": 9.317018269355276e-06, "loss": 2.7883, "step": 1817 }, { "epoch": 0.22, "learning_rate": 9.316005027254202e-06, "loss": 2.607, "step": 1818 }, { "epoch": 0.22, "learning_rate": 9.314991089289722e-06, "loss": 2.421, "step": 1819 }, { "epoch": 0.22, "learning_rate": 9.313976455625316e-06, "loss": 2.7702, "step": 1820 }, { "epoch": 0.22, "learning_rate": 9.312961126424565e-06, "loss": 2.6267, "step": 1821 }, { "epoch": 0.22, "learning_rate": 9.311945101851175e-06, "loss": 2.5482, "step": 1822 }, { "epoch": 0.22, "learning_rate": 9.310928382068955e-06, "loss": 2.623, "step": 1823 }, { "epoch": 0.22, "learning_rate": 9.309910967241831e-06, "loss": 2.6183, "step": 1824 }, { "epoch": 0.22, "learning_rate": 9.30889285753384e-06, "loss": 2.5061, "step": 1825 }, { "epoch": 0.22, "learning_rate": 9.307874053109127e-06, "loss": 2.4959, "step": 1826 }, { "epoch": 0.22, "learning_rate": 9.306854554131954e-06, "loss": 2.6524, "step": 1827 }, { "epoch": 0.22, "learning_rate": 9.305834360766695e-06, "loss": 2.6139, "step": 1828 }, { "epoch": 0.22, "learning_rate": 9.304813473177834e-06, "loss": 2.6624, "step": 1829 }, { "epoch": 0.22, "learning_rate": 9.303791891529966e-06, "loss": 2.5326, "step": 1830 }, { "epoch": 0.22, "learning_rate": 9.302769615987798e-06, "loss": 2.6291, "step": 1831 }, { "epoch": 0.22, "learning_rate": 9.301746646716152e-06, "loss": 2.4875, "step": 1832 }, { "epoch": 0.22, "learning_rate": 9.30072298387996e-06, "loss": 2.5696, "step": 1833 }, { "epoch": 0.22, "learning_rate": 9.299698627644266e-06, "loss": 2.4787, "step": 1834 }, { "epoch": 0.22, "learning_rate": 9.298673578174225e-06, "loss": 2.5011, "step": 1835 }, { "epoch": 0.22, "learning_rate": 9.297647835635102e-06, "loss": 2.5731, "step": 1836 }, { "epoch": 0.22, "learning_rate": 9.29662140019228e-06, "loss": 2.6629, "step": 1837 }, { "epoch": 0.22, "learning_rate": 9.295594272011246e-06, "loss": 2.5676, "step": 1838 }, { "epoch": 0.22, "learning_rate": 9.294566451257607e-06, "loss": 2.3752, "step": 1839 }, { "epoch": 0.22, "learning_rate": 9.293537938097073e-06, "loss": 2.6747, "step": 1840 }, { "epoch": 0.22, "learning_rate": 9.29250873269547e-06, "loss": 2.6185, "step": 1841 }, { "epoch": 0.22, "learning_rate": 9.291478835218737e-06, "loss": 2.6347, "step": 1842 }, { "epoch": 0.22, "learning_rate": 9.290448245832922e-06, "loss": 2.6457, "step": 1843 }, { "epoch": 0.22, "learning_rate": 9.289416964704186e-06, "loss": 2.5412, "step": 1844 }, { "epoch": 0.22, "learning_rate": 9.288384991998801e-06, "loss": 2.5117, "step": 1845 }, { "epoch": 0.22, "learning_rate": 9.28735232788315e-06, "loss": 2.5874, "step": 1846 }, { "epoch": 0.22, "learning_rate": 9.286318972523728e-06, "loss": 2.5137, "step": 1847 }, { "epoch": 0.22, "learning_rate": 9.285284926087144e-06, "loss": 2.5435, "step": 1848 }, { "epoch": 0.22, "learning_rate": 9.284250188740111e-06, "loss": 2.7115, "step": 1849 }, { "epoch": 0.22, "learning_rate": 9.283214760649462e-06, "loss": 2.5199, "step": 1850 }, { "epoch": 0.22, "learning_rate": 9.282178641982136e-06, "loss": 2.4881, "step": 1851 }, { "epoch": 0.22, "learning_rate": 9.281141832905185e-06, "loss": 2.6333, "step": 1852 }, { "epoch": 0.22, "learning_rate": 9.280104333585771e-06, "loss": 2.6317, "step": 1853 }, { "epoch": 0.22, "learning_rate": 9.279066144191173e-06, "loss": 2.6584, "step": 1854 }, { "epoch": 0.22, "learning_rate": 9.278027264888774e-06, "loss": 2.6966, "step": 1855 }, { "epoch": 0.22, "learning_rate": 9.27698769584607e-06, "loss": 2.523, "step": 1856 }, { "epoch": 0.22, "learning_rate": 9.27594743723067e-06, "loss": 2.5527, "step": 1857 }, { "epoch": 0.22, "learning_rate": 9.274906489210294e-06, "loss": 2.5175, "step": 1858 }, { "epoch": 0.22, "learning_rate": 9.273864851952771e-06, "loss": 2.4365, "step": 1859 }, { "epoch": 0.22, "learning_rate": 9.272822525626047e-06, "loss": 2.7369, "step": 1860 }, { "epoch": 0.22, "learning_rate": 9.271779510398168e-06, "loss": 2.4506, "step": 1861 }, { "epoch": 0.22, "learning_rate": 9.270735806437306e-06, "loss": 2.514, "step": 1862 }, { "epoch": 0.22, "learning_rate": 9.269691413911727e-06, "loss": 2.5532, "step": 1863 }, { "epoch": 0.22, "learning_rate": 9.268646332989826e-06, "loss": 2.7467, "step": 1864 }, { "epoch": 0.22, "learning_rate": 9.267600563840093e-06, "loss": 2.6881, "step": 1865 }, { "epoch": 0.22, "learning_rate": 9.266554106631137e-06, "loss": 2.6248, "step": 1866 }, { "epoch": 0.22, "learning_rate": 9.26550696153168e-06, "loss": 2.5816, "step": 1867 }, { "epoch": 0.22, "learning_rate": 9.26445912871055e-06, "loss": 2.6071, "step": 1868 }, { "epoch": 0.22, "learning_rate": 9.263410608336687e-06, "loss": 2.5906, "step": 1869 }, { "epoch": 0.22, "learning_rate": 9.262361400579145e-06, "loss": 2.8241, "step": 1870 }, { "epoch": 0.22, "learning_rate": 9.26131150560708e-06, "loss": 2.633, "step": 1871 }, { "epoch": 0.22, "learning_rate": 9.260260923589773e-06, "loss": 2.5108, "step": 1872 }, { "epoch": 0.23, "learning_rate": 9.259209654696602e-06, "loss": 2.5262, "step": 1873 }, { "epoch": 0.23, "learning_rate": 9.258157699097065e-06, "loss": 2.8399, "step": 1874 }, { "epoch": 0.23, "learning_rate": 9.257105056960767e-06, "loss": 2.447, "step": 1875 }, { "epoch": 0.23, "learning_rate": 9.25605172845742e-06, "loss": 2.5732, "step": 1876 }, { "epoch": 0.23, "learning_rate": 9.254997713756857e-06, "loss": 2.4732, "step": 1877 }, { "epoch": 0.23, "learning_rate": 9.25394301302901e-06, "loss": 2.4912, "step": 1878 }, { "epoch": 0.23, "learning_rate": 9.25288762644393e-06, "loss": 2.3482, "step": 1879 }, { "epoch": 0.23, "learning_rate": 9.251831554171773e-06, "loss": 2.7347, "step": 1880 }, { "epoch": 0.23, "learning_rate": 9.250774796382812e-06, "loss": 2.7068, "step": 1881 }, { "epoch": 0.23, "learning_rate": 9.249717353247422e-06, "loss": 2.7201, "step": 1882 }, { "epoch": 0.23, "learning_rate": 9.248659224936095e-06, "loss": 2.4898, "step": 1883 }, { "epoch": 0.23, "learning_rate": 9.247600411619434e-06, "loss": 2.6139, "step": 1884 }, { "epoch": 0.23, "learning_rate": 9.246540913468147e-06, "loss": 2.4889, "step": 1885 }, { "epoch": 0.23, "learning_rate": 9.245480730653055e-06, "loss": 2.6162, "step": 1886 }, { "epoch": 0.23, "learning_rate": 9.24441986334509e-06, "loss": 2.4791, "step": 1887 }, { "epoch": 0.23, "learning_rate": 9.243358311715298e-06, "loss": 2.5717, "step": 1888 }, { "epoch": 0.23, "learning_rate": 9.242296075934825e-06, "loss": 2.5317, "step": 1889 }, { "epoch": 0.23, "learning_rate": 9.24123315617494e-06, "loss": 2.5668, "step": 1890 }, { "epoch": 0.23, "learning_rate": 9.240169552607012e-06, "loss": 2.7414, "step": 1891 }, { "epoch": 0.23, "learning_rate": 9.239105265402525e-06, "loss": 2.5536, "step": 1892 }, { "epoch": 0.23, "learning_rate": 9.238040294733074e-06, "loss": 2.7504, "step": 1893 }, { "epoch": 0.23, "learning_rate": 9.236974640770362e-06, "loss": 2.6142, "step": 1894 }, { "epoch": 0.23, "learning_rate": 9.235908303686204e-06, "loss": 2.8001, "step": 1895 }, { "epoch": 0.23, "learning_rate": 9.23484128365252e-06, "loss": 2.5903, "step": 1896 }, { "epoch": 0.23, "learning_rate": 9.233773580841348e-06, "loss": 2.5884, "step": 1897 }, { "epoch": 0.23, "learning_rate": 9.232705195424832e-06, "loss": 2.4989, "step": 1898 }, { "epoch": 0.23, "learning_rate": 9.231636127575224e-06, "loss": 2.806, "step": 1899 }, { "epoch": 0.23, "learning_rate": 9.23056637746489e-06, "loss": 2.6711, "step": 1900 }, { "epoch": 0.23, "learning_rate": 9.229495945266304e-06, "loss": 2.6043, "step": 1901 }, { "epoch": 0.23, "learning_rate": 9.22842483115205e-06, "loss": 2.6686, "step": 1902 }, { "epoch": 0.23, "learning_rate": 9.227353035294823e-06, "loss": 2.5233, "step": 1903 }, { "epoch": 0.23, "learning_rate": 9.226280557867428e-06, "loss": 2.4793, "step": 1904 }, { "epoch": 0.23, "learning_rate": 9.225207399042775e-06, "loss": 2.4527, "step": 1905 }, { "epoch": 0.23, "learning_rate": 9.224133558993894e-06, "loss": 2.583, "step": 1906 }, { "epoch": 0.23, "learning_rate": 9.22305903789391e-06, "loss": 2.4216, "step": 1907 }, { "epoch": 0.23, "learning_rate": 9.221983835916074e-06, "loss": 2.3007, "step": 1908 }, { "epoch": 0.23, "learning_rate": 9.22090795323374e-06, "loss": 2.493, "step": 1909 }, { "epoch": 0.23, "learning_rate": 9.219831390020367e-06, "loss": 2.8029, "step": 1910 }, { "epoch": 0.23, "learning_rate": 9.218754146449526e-06, "loss": 2.9164, "step": 1911 }, { "epoch": 0.23, "learning_rate": 9.217676222694905e-06, "loss": 2.6063, "step": 1912 }, { "epoch": 0.23, "learning_rate": 9.216597618930292e-06, "loss": 2.5349, "step": 1913 }, { "epoch": 0.23, "learning_rate": 9.215518335329591e-06, "loss": 2.5932, "step": 1914 }, { "epoch": 0.23, "learning_rate": 9.214438372066812e-06, "loss": 2.5948, "step": 1915 }, { "epoch": 0.23, "learning_rate": 9.213357729316077e-06, "loss": 2.6243, "step": 1916 }, { "epoch": 0.23, "learning_rate": 9.212276407251616e-06, "loss": 2.6098, "step": 1917 }, { "epoch": 0.23, "learning_rate": 9.21119440604777e-06, "loss": 2.7271, "step": 1918 }, { "epoch": 0.23, "learning_rate": 9.210111725878986e-06, "loss": 2.4493, "step": 1919 }, { "epoch": 0.23, "learning_rate": 9.209028366919825e-06, "loss": 2.5795, "step": 1920 }, { "epoch": 0.23, "learning_rate": 9.207944329344956e-06, "loss": 2.5114, "step": 1921 }, { "epoch": 0.23, "learning_rate": 9.206859613329155e-06, "loss": 2.4511, "step": 1922 }, { "epoch": 0.23, "learning_rate": 9.205774219047309e-06, "loss": 2.6197, "step": 1923 }, { "epoch": 0.23, "learning_rate": 9.204688146674418e-06, "loss": 2.5737, "step": 1924 }, { "epoch": 0.23, "learning_rate": 9.203601396385584e-06, "loss": 2.5748, "step": 1925 }, { "epoch": 0.23, "learning_rate": 9.202513968356027e-06, "loss": 2.5756, "step": 1926 }, { "epoch": 0.23, "learning_rate": 9.201425862761065e-06, "loss": 2.6434, "step": 1927 }, { "epoch": 0.23, "learning_rate": 9.200337079776136e-06, "loss": 2.5419, "step": 1928 }, { "epoch": 0.23, "learning_rate": 9.199247619576783e-06, "loss": 2.6994, "step": 1929 }, { "epoch": 0.23, "learning_rate": 9.198157482338655e-06, "loss": 2.7211, "step": 1930 }, { "epoch": 0.23, "learning_rate": 9.197066668237518e-06, "loss": 2.4605, "step": 1931 }, { "epoch": 0.23, "learning_rate": 9.195975177449238e-06, "loss": 2.6158, "step": 1932 }, { "epoch": 0.23, "learning_rate": 9.194883010149797e-06, "loss": 2.4616, "step": 1933 }, { "epoch": 0.23, "learning_rate": 9.193790166515282e-06, "loss": 2.6718, "step": 1934 }, { "epoch": 0.23, "learning_rate": 9.192696646721893e-06, "loss": 2.6205, "step": 1935 }, { "epoch": 0.23, "learning_rate": 9.191602450945935e-06, "loss": 2.6955, "step": 1936 }, { "epoch": 0.23, "learning_rate": 9.190507579363823e-06, "loss": 2.399, "step": 1937 }, { "epoch": 0.23, "learning_rate": 9.189412032152083e-06, "loss": 2.5756, "step": 1938 }, { "epoch": 0.23, "learning_rate": 9.188315809487349e-06, "loss": 2.5637, "step": 1939 }, { "epoch": 0.23, "learning_rate": 9.187218911546363e-06, "loss": 2.7103, "step": 1940 }, { "epoch": 0.23, "learning_rate": 9.186121338505973e-06, "loss": 2.4783, "step": 1941 }, { "epoch": 0.23, "learning_rate": 9.185023090543144e-06, "loss": 2.715, "step": 1942 }, { "epoch": 0.23, "learning_rate": 9.183924167834943e-06, "loss": 2.6709, "step": 1943 }, { "epoch": 0.23, "learning_rate": 9.182824570558546e-06, "loss": 2.6041, "step": 1944 }, { "epoch": 0.23, "learning_rate": 9.181724298891243e-06, "loss": 2.5058, "step": 1945 }, { "epoch": 0.23, "learning_rate": 9.180623353010428e-06, "loss": 2.592, "step": 1946 }, { "epoch": 0.23, "learning_rate": 9.179521733093602e-06, "loss": 2.5656, "step": 1947 }, { "epoch": 0.23, "learning_rate": 9.178419439318382e-06, "loss": 2.512, "step": 1948 }, { "epoch": 0.23, "learning_rate": 9.177316471862485e-06, "loss": 2.5563, "step": 1949 }, { "epoch": 0.23, "learning_rate": 9.176212830903746e-06, "loss": 2.7808, "step": 1950 }, { "epoch": 0.23, "learning_rate": 9.175108516620099e-06, "loss": 2.7265, "step": 1951 }, { "epoch": 0.23, "learning_rate": 9.174003529189592e-06, "loss": 2.5679, "step": 1952 }, { "epoch": 0.23, "learning_rate": 9.172897868790383e-06, "loss": 2.3957, "step": 1953 }, { "epoch": 0.23, "learning_rate": 9.171791535600733e-06, "loss": 2.641, "step": 1954 }, { "epoch": 0.23, "learning_rate": 9.170684529799017e-06, "loss": 2.4124, "step": 1955 }, { "epoch": 0.23, "learning_rate": 9.169576851563715e-06, "loss": 2.7982, "step": 1956 }, { "epoch": 0.24, "learning_rate": 9.168468501073415e-06, "loss": 2.5457, "step": 1957 }, { "epoch": 0.24, "learning_rate": 9.167359478506816e-06, "loss": 2.6227, "step": 1958 }, { "epoch": 0.24, "learning_rate": 9.166249784042725e-06, "loss": 2.5325, "step": 1959 }, { "epoch": 0.24, "learning_rate": 9.165139417860057e-06, "loss": 2.4889, "step": 1960 }, { "epoch": 0.24, "learning_rate": 9.16402838013783e-06, "loss": 2.5367, "step": 1961 }, { "epoch": 0.24, "learning_rate": 9.162916671055182e-06, "loss": 2.4938, "step": 1962 }, { "epoch": 0.24, "learning_rate": 9.161804290791346e-06, "loss": 2.5626, "step": 1963 }, { "epoch": 0.24, "learning_rate": 9.160691239525675e-06, "loss": 2.7628, "step": 1964 }, { "epoch": 0.24, "learning_rate": 9.15957751743762e-06, "loss": 2.5254, "step": 1965 }, { "epoch": 0.24, "learning_rate": 9.158463124706746e-06, "loss": 2.3984, "step": 1966 }, { "epoch": 0.24, "learning_rate": 9.157348061512728e-06, "loss": 2.4631, "step": 1967 }, { "epoch": 0.24, "learning_rate": 9.156232328035342e-06, "loss": 2.7109, "step": 1968 }, { "epoch": 0.24, "learning_rate": 9.155115924454478e-06, "loss": 2.4724, "step": 1969 }, { "epoch": 0.24, "learning_rate": 9.153998850950133e-06, "loss": 2.538, "step": 1970 }, { "epoch": 0.24, "learning_rate": 9.15288110770241e-06, "loss": 2.6395, "step": 1971 }, { "epoch": 0.24, "learning_rate": 9.151762694891522e-06, "loss": 2.5424, "step": 1972 }, { "epoch": 0.24, "learning_rate": 9.150643612697789e-06, "loss": 2.4426, "step": 1973 }, { "epoch": 0.24, "learning_rate": 9.149523861301636e-06, "loss": 2.5139, "step": 1974 }, { "epoch": 0.24, "learning_rate": 9.148403440883604e-06, "loss": 2.5783, "step": 1975 }, { "epoch": 0.24, "learning_rate": 9.147282351624334e-06, "loss": 2.6957, "step": 1976 }, { "epoch": 0.24, "learning_rate": 9.146160593704578e-06, "loss": 2.5462, "step": 1977 }, { "epoch": 0.24, "learning_rate": 9.145038167305196e-06, "loss": 2.7778, "step": 1978 }, { "epoch": 0.24, "learning_rate": 9.143915072607154e-06, "loss": 2.6598, "step": 1979 }, { "epoch": 0.24, "learning_rate": 9.142791309791528e-06, "loss": 2.6909, "step": 1980 }, { "epoch": 0.24, "learning_rate": 9.1416668790395e-06, "loss": 2.5852, "step": 1981 }, { "epoch": 0.24, "learning_rate": 9.140541780532362e-06, "loss": 2.4709, "step": 1982 }, { "epoch": 0.24, "learning_rate": 9.139416014451508e-06, "loss": 2.5523, "step": 1983 }, { "epoch": 0.24, "learning_rate": 9.138289580978449e-06, "loss": 2.6897, "step": 1984 }, { "epoch": 0.24, "learning_rate": 9.137162480294795e-06, "loss": 2.515, "step": 1985 }, { "epoch": 0.24, "learning_rate": 9.136034712582267e-06, "loss": 2.608, "step": 1986 }, { "epoch": 0.24, "learning_rate": 9.134906278022694e-06, "loss": 2.5264, "step": 1987 }, { "epoch": 0.24, "learning_rate": 9.133777176798013e-06, "loss": 2.5854, "step": 1988 }, { "epoch": 0.24, "learning_rate": 9.132647409090267e-06, "loss": 2.626, "step": 1989 }, { "epoch": 0.24, "learning_rate": 9.131516975081604e-06, "loss": 2.6434, "step": 1990 }, { "epoch": 0.24, "learning_rate": 9.130385874954286e-06, "loss": 2.4179, "step": 1991 }, { "epoch": 0.24, "learning_rate": 9.129254108890678e-06, "loss": 2.5204, "step": 1992 }, { "epoch": 0.24, "learning_rate": 9.128121677073251e-06, "loss": 2.5353, "step": 1993 }, { "epoch": 0.24, "learning_rate": 9.126988579684587e-06, "loss": 2.7299, "step": 1994 }, { "epoch": 0.24, "learning_rate": 9.125854816907371e-06, "loss": 2.6015, "step": 1995 }, { "epoch": 0.24, "learning_rate": 9.124720388924403e-06, "loss": 2.4297, "step": 1996 }, { "epoch": 0.24, "learning_rate": 9.123585295918581e-06, "loss": 2.644, "step": 1997 }, { "epoch": 0.24, "learning_rate": 9.122449538072918e-06, "loss": 2.6259, "step": 1998 }, { "epoch": 0.24, "learning_rate": 9.121313115570525e-06, "loss": 2.674, "step": 1999 }, { "epoch": 0.24, "learning_rate": 9.120176028594632e-06, "loss": 2.5436, "step": 2000 }, { "epoch": 0.24, "learning_rate": 9.119038277328568e-06, "loss": 2.4888, "step": 2001 }, { "epoch": 0.24, "learning_rate": 9.117899861955767e-06, "loss": 2.7402, "step": 2002 }, { "epoch": 0.24, "learning_rate": 9.116760782659781e-06, "loss": 2.6142, "step": 2003 }, { "epoch": 0.24, "learning_rate": 9.115621039624256e-06, "loss": 2.7426, "step": 2004 }, { "epoch": 0.24, "learning_rate": 9.114480633032956e-06, "loss": 2.5397, "step": 2005 }, { "epoch": 0.24, "learning_rate": 9.113339563069742e-06, "loss": 2.5849, "step": 2006 }, { "epoch": 0.24, "learning_rate": 9.112197829918591e-06, "loss": 2.7125, "step": 2007 }, { "epoch": 0.24, "learning_rate": 9.111055433763582e-06, "loss": 2.6083, "step": 2008 }, { "epoch": 0.24, "learning_rate": 9.109912374788904e-06, "loss": 2.6097, "step": 2009 }, { "epoch": 0.24, "learning_rate": 9.108768653178848e-06, "loss": 2.733, "step": 2010 }, { "epoch": 0.24, "learning_rate": 9.107624269117813e-06, "loss": 2.3806, "step": 2011 }, { "epoch": 0.24, "learning_rate": 9.106479222790312e-06, "loss": 2.4341, "step": 2012 }, { "epoch": 0.24, "learning_rate": 9.105333514380953e-06, "loss": 2.4488, "step": 2013 }, { "epoch": 0.24, "learning_rate": 9.104187144074461e-06, "loss": 2.6244, "step": 2014 }, { "epoch": 0.24, "learning_rate": 9.103040112055663e-06, "loss": 2.6491, "step": 2015 }, { "epoch": 0.24, "learning_rate": 9.101892418509492e-06, "loss": 2.5754, "step": 2016 }, { "epoch": 0.24, "learning_rate": 9.100744063620991e-06, "loss": 2.562, "step": 2017 }, { "epoch": 0.24, "learning_rate": 9.099595047575308e-06, "loss": 2.4391, "step": 2018 }, { "epoch": 0.24, "learning_rate": 9.098445370557694e-06, "loss": 2.6503, "step": 2019 }, { "epoch": 0.24, "learning_rate": 9.09729503275351e-06, "loss": 2.5, "step": 2020 }, { "epoch": 0.24, "learning_rate": 9.096144034348227e-06, "loss": 2.4237, "step": 2021 }, { "epoch": 0.24, "learning_rate": 9.094992375527415e-06, "loss": 2.8561, "step": 2022 }, { "epoch": 0.24, "learning_rate": 9.093840056476759e-06, "loss": 2.5787, "step": 2023 }, { "epoch": 0.24, "learning_rate": 9.092687077382043e-06, "loss": 2.6063, "step": 2024 }, { "epoch": 0.24, "learning_rate": 9.091533438429159e-06, "loss": 2.5558, "step": 2025 }, { "epoch": 0.24, "learning_rate": 9.090379139804107e-06, "loss": 2.6062, "step": 2026 }, { "epoch": 0.24, "learning_rate": 9.089224181692992e-06, "loss": 2.5327, "step": 2027 }, { "epoch": 0.24, "learning_rate": 9.08806856428203e-06, "loss": 2.7563, "step": 2028 }, { "epoch": 0.24, "learning_rate": 9.086912287757538e-06, "loss": 2.555, "step": 2029 }, { "epoch": 0.24, "learning_rate": 9.08575535230594e-06, "loss": 2.6447, "step": 2030 }, { "epoch": 0.24, "learning_rate": 9.08459775811377e-06, "loss": 2.5739, "step": 2031 }, { "epoch": 0.24, "learning_rate": 9.083439505367658e-06, "loss": 2.7103, "step": 2032 }, { "epoch": 0.24, "learning_rate": 9.082280594254353e-06, "loss": 2.643, "step": 2033 }, { "epoch": 0.24, "learning_rate": 9.081121024960707e-06, "loss": 2.6475, "step": 2034 }, { "epoch": 0.24, "learning_rate": 9.079960797673671e-06, "loss": 2.4778, "step": 2035 }, { "epoch": 0.24, "learning_rate": 9.078799912580305e-06, "loss": 2.7608, "step": 2036 }, { "epoch": 0.24, "learning_rate": 9.077638369867783e-06, "loss": 2.6815, "step": 2037 }, { "epoch": 0.24, "learning_rate": 9.076476169723376e-06, "loss": 2.6208, "step": 2038 }, { "epoch": 0.24, "learning_rate": 9.075313312334465e-06, "loss": 2.6385, "step": 2039 }, { "epoch": 0.25, "learning_rate": 9.074149797888532e-06, "loss": 2.6229, "step": 2040 }, { "epoch": 0.25, "learning_rate": 9.072985626573171e-06, "loss": 2.5069, "step": 2041 }, { "epoch": 0.25, "learning_rate": 9.071820798576083e-06, "loss": 2.6007, "step": 2042 }, { "epoch": 0.25, "learning_rate": 9.070655314085068e-06, "loss": 2.3999, "step": 2043 }, { "epoch": 0.25, "learning_rate": 9.069489173288037e-06, "loss": 2.5186, "step": 2044 }, { "epoch": 0.25, "learning_rate": 9.068322376373004e-06, "loss": 2.5328, "step": 2045 }, { "epoch": 0.25, "learning_rate": 9.06715492352809e-06, "loss": 2.6631, "step": 2046 }, { "epoch": 0.25, "learning_rate": 9.065986814941523e-06, "loss": 2.5228, "step": 2047 }, { "epoch": 0.25, "learning_rate": 9.064818050801634e-06, "loss": 2.711, "step": 2048 }, { "epoch": 0.25, "learning_rate": 9.063648631296861e-06, "loss": 2.5728, "step": 2049 }, { "epoch": 0.25, "learning_rate": 9.062478556615751e-06, "loss": 2.3394, "step": 2050 }, { "epoch": 0.25, "learning_rate": 9.06130782694695e-06, "loss": 2.6653, "step": 2051 }, { "epoch": 0.25, "learning_rate": 9.060136442479215e-06, "loss": 2.6855, "step": 2052 }, { "epoch": 0.25, "learning_rate": 9.058964403401407e-06, "loss": 2.7237, "step": 2053 }, { "epoch": 0.25, "learning_rate": 9.057791709902491e-06, "loss": 2.5775, "step": 2054 }, { "epoch": 0.25, "learning_rate": 9.056618362171537e-06, "loss": 2.6503, "step": 2055 }, { "epoch": 0.25, "learning_rate": 9.055444360397727e-06, "loss": 2.722, "step": 2056 }, { "epoch": 0.25, "learning_rate": 9.05426970477034e-06, "loss": 2.5831, "step": 2057 }, { "epoch": 0.25, "learning_rate": 9.053094395478763e-06, "loss": 2.6116, "step": 2058 }, { "epoch": 0.25, "learning_rate": 9.051918432712492e-06, "loss": 2.8308, "step": 2059 }, { "epoch": 0.25, "learning_rate": 9.050741816661128e-06, "loss": 2.5763, "step": 2060 }, { "epoch": 0.25, "learning_rate": 9.04956454751437e-06, "loss": 2.5228, "step": 2061 }, { "epoch": 0.25, "learning_rate": 9.048386625462028e-06, "loss": 2.6537, "step": 2062 }, { "epoch": 0.25, "learning_rate": 9.047208050694021e-06, "loss": 2.7104, "step": 2063 }, { "epoch": 0.25, "learning_rate": 9.046028823400368e-06, "loss": 2.7202, "step": 2064 }, { "epoch": 0.25, "learning_rate": 9.04484894377119e-06, "loss": 2.7263, "step": 2065 }, { "epoch": 0.25, "learning_rate": 9.04366841199672e-06, "loss": 2.6479, "step": 2066 }, { "epoch": 0.25, "learning_rate": 9.042487228267297e-06, "loss": 2.8151, "step": 2067 }, { "epoch": 0.25, "learning_rate": 9.041305392773355e-06, "loss": 2.6305, "step": 2068 }, { "epoch": 0.25, "learning_rate": 9.040122905705443e-06, "loss": 2.5059, "step": 2069 }, { "epoch": 0.25, "learning_rate": 9.03893976725421e-06, "loss": 2.4531, "step": 2070 }, { "epoch": 0.25, "learning_rate": 9.037755977610413e-06, "loss": 2.7036, "step": 2071 }, { "epoch": 0.25, "learning_rate": 9.036571536964915e-06, "loss": 2.5204, "step": 2072 }, { "epoch": 0.25, "learning_rate": 9.035386445508681e-06, "loss": 2.6363, "step": 2073 }, { "epoch": 0.25, "learning_rate": 9.034200703432776e-06, "loss": 2.5696, "step": 2074 }, { "epoch": 0.25, "learning_rate": 9.033014310928383e-06, "loss": 2.7125, "step": 2075 }, { "epoch": 0.25, "learning_rate": 9.03182726818678e-06, "loss": 2.6088, "step": 2076 }, { "epoch": 0.25, "learning_rate": 9.030639575399347e-06, "loss": 2.621, "step": 2077 }, { "epoch": 0.25, "learning_rate": 9.029451232757581e-06, "loss": 2.5088, "step": 2078 }, { "epoch": 0.25, "learning_rate": 9.028262240453074e-06, "loss": 2.4172, "step": 2079 }, { "epoch": 0.25, "learning_rate": 9.027072598677526e-06, "loss": 2.7664, "step": 2080 }, { "epoch": 0.25, "learning_rate": 9.025882307622741e-06, "loss": 2.6369, "step": 2081 }, { "epoch": 0.25, "learning_rate": 9.024691367480627e-06, "loss": 2.5216, "step": 2082 }, { "epoch": 0.25, "learning_rate": 9.0234997784432e-06, "loss": 2.6354, "step": 2083 }, { "epoch": 0.25, "learning_rate": 9.022307540702576e-06, "loss": 2.6607, "step": 2084 }, { "epoch": 0.25, "learning_rate": 9.021114654450978e-06, "loss": 2.5529, "step": 2085 }, { "epoch": 0.25, "learning_rate": 9.019921119880735e-06, "loss": 2.457, "step": 2086 }, { "epoch": 0.25, "learning_rate": 9.018726937184278e-06, "loss": 2.4658, "step": 2087 }, { "epoch": 0.25, "learning_rate": 9.017532106554143e-06, "loss": 2.5262, "step": 2088 }, { "epoch": 0.25, "learning_rate": 9.01633662818297e-06, "loss": 2.6535, "step": 2089 }, { "epoch": 0.25, "learning_rate": 9.015140502263506e-06, "loss": 2.7527, "step": 2090 }, { "epoch": 0.25, "learning_rate": 9.0139437289886e-06, "loss": 2.7131, "step": 2091 }, { "epoch": 0.25, "learning_rate": 9.012746308551208e-06, "loss": 2.6539, "step": 2092 }, { "epoch": 0.25, "learning_rate": 9.011548241144386e-06, "loss": 2.6242, "step": 2093 }, { "epoch": 0.25, "learning_rate": 9.010349526961295e-06, "loss": 2.7233, "step": 2094 }, { "epoch": 0.25, "learning_rate": 9.009150166195206e-06, "loss": 2.5733, "step": 2095 }, { "epoch": 0.25, "learning_rate": 9.007950159039488e-06, "loss": 2.6706, "step": 2096 }, { "epoch": 0.25, "learning_rate": 9.006749505687618e-06, "loss": 2.7089, "step": 2097 }, { "epoch": 0.25, "learning_rate": 9.005548206333172e-06, "loss": 2.6481, "step": 2098 }, { "epoch": 0.25, "learning_rate": 9.004346261169838e-06, "loss": 2.5028, "step": 2099 }, { "epoch": 0.25, "learning_rate": 9.003143670391403e-06, "loss": 2.646, "step": 2100 }, { "epoch": 0.25, "learning_rate": 9.001940434191759e-06, "loss": 2.7566, "step": 2101 }, { "epoch": 0.25, "learning_rate": 9.0007365527649e-06, "loss": 2.7202, "step": 2102 }, { "epoch": 0.25, "learning_rate": 8.999532026304928e-06, "loss": 2.5645, "step": 2103 }, { "epoch": 0.25, "learning_rate": 8.998326855006047e-06, "loss": 2.5185, "step": 2104 }, { "epoch": 0.25, "learning_rate": 8.997121039062564e-06, "loss": 2.7027, "step": 2105 }, { "epoch": 0.25, "learning_rate": 8.995914578668892e-06, "loss": 2.5019, "step": 2106 }, { "epoch": 0.25, "learning_rate": 8.994707474019547e-06, "loss": 2.694, "step": 2107 }, { "epoch": 0.25, "learning_rate": 8.993499725309148e-06, "loss": 2.4672, "step": 2108 }, { "epoch": 0.25, "learning_rate": 8.99229133273242e-06, "loss": 2.7499, "step": 2109 }, { "epoch": 0.25, "learning_rate": 8.991082296484188e-06, "loss": 2.5739, "step": 2110 }, { "epoch": 0.25, "learning_rate": 8.989872616759387e-06, "loss": 2.5765, "step": 2111 }, { "epoch": 0.25, "learning_rate": 8.988662293753047e-06, "loss": 2.5603, "step": 2112 }, { "epoch": 0.25, "learning_rate": 8.98745132766031e-06, "loss": 2.4647, "step": 2113 }, { "epoch": 0.25, "learning_rate": 8.98623971867642e-06, "loss": 2.5239, "step": 2114 }, { "epoch": 0.25, "learning_rate": 8.985027466996718e-06, "loss": 2.5029, "step": 2115 }, { "epoch": 0.25, "learning_rate": 8.983814572816656e-06, "loss": 2.5892, "step": 2116 }, { "epoch": 0.25, "learning_rate": 8.982601036331788e-06, "loss": 2.5345, "step": 2117 }, { "epoch": 0.25, "learning_rate": 8.981386857737773e-06, "loss": 2.4747, "step": 2118 }, { "epoch": 0.25, "learning_rate": 8.980172037230365e-06, "loss": 2.6332, "step": 2119 }, { "epoch": 0.25, "learning_rate": 8.978956575005432e-06, "loss": 2.4839, "step": 2120 }, { "epoch": 0.25, "learning_rate": 8.977740471258943e-06, "loss": 2.5226, "step": 2121 }, { "epoch": 0.25, "learning_rate": 8.976523726186966e-06, "loss": 2.5374, "step": 2122 }, { "epoch": 0.26, "learning_rate": 8.975306339985674e-06, "loss": 2.5473, "step": 2123 }, { "epoch": 0.26, "learning_rate": 8.974088312851346e-06, "loss": 2.6036, "step": 2124 }, { "epoch": 0.26, "learning_rate": 8.972869644980363e-06, "loss": 2.641, "step": 2125 }, { "epoch": 0.26, "learning_rate": 8.971650336569208e-06, "loss": 2.4896, "step": 2126 }, { "epoch": 0.26, "learning_rate": 8.97043038781447e-06, "loss": 2.7799, "step": 2127 }, { "epoch": 0.26, "learning_rate": 8.96920979891284e-06, "loss": 2.481, "step": 2128 }, { "epoch": 0.26, "learning_rate": 8.96798857006111e-06, "loss": 2.5405, "step": 2129 }, { "epoch": 0.26, "learning_rate": 8.966766701456177e-06, "loss": 2.7012, "step": 2130 }, { "epoch": 0.26, "learning_rate": 8.96554419329504e-06, "loss": 2.6387, "step": 2131 }, { "epoch": 0.26, "learning_rate": 8.964321045774808e-06, "loss": 2.5018, "step": 2132 }, { "epoch": 0.26, "learning_rate": 8.963097259092682e-06, "loss": 2.6597, "step": 2133 }, { "epoch": 0.26, "learning_rate": 8.961872833445971e-06, "loss": 2.6073, "step": 2134 }, { "epoch": 0.26, "learning_rate": 8.960647769032091e-06, "loss": 2.7935, "step": 2135 }, { "epoch": 0.26, "learning_rate": 8.959422066048556e-06, "loss": 2.6213, "step": 2136 }, { "epoch": 0.26, "learning_rate": 8.958195724692982e-06, "loss": 2.5845, "step": 2137 }, { "epoch": 0.26, "learning_rate": 8.956968745163093e-06, "loss": 2.5792, "step": 2138 }, { "epoch": 0.26, "learning_rate": 8.955741127656713e-06, "loss": 2.515, "step": 2139 }, { "epoch": 0.26, "learning_rate": 8.954512872371768e-06, "loss": 2.4261, "step": 2140 }, { "epoch": 0.26, "learning_rate": 8.95328397950629e-06, "loss": 2.4368, "step": 2141 }, { "epoch": 0.26, "learning_rate": 8.952054449258409e-06, "loss": 2.7058, "step": 2142 }, { "epoch": 0.26, "learning_rate": 8.95082428182636e-06, "loss": 2.3984, "step": 2143 }, { "epoch": 0.26, "learning_rate": 8.949593477408485e-06, "loss": 2.5358, "step": 2144 }, { "epoch": 0.26, "learning_rate": 8.948362036203222e-06, "loss": 2.5752, "step": 2145 }, { "epoch": 0.26, "learning_rate": 8.947129958409113e-06, "loss": 2.5008, "step": 2146 }, { "epoch": 0.26, "learning_rate": 8.945897244224808e-06, "loss": 2.5538, "step": 2147 }, { "epoch": 0.26, "learning_rate": 8.944663893849053e-06, "loss": 2.5601, "step": 2148 }, { "epoch": 0.26, "learning_rate": 8.9434299074807e-06, "loss": 2.7238, "step": 2149 }, { "epoch": 0.26, "learning_rate": 8.942195285318705e-06, "loss": 2.5887, "step": 2150 }, { "epoch": 0.26, "learning_rate": 8.940960027562122e-06, "loss": 2.7081, "step": 2151 }, { "epoch": 0.26, "learning_rate": 8.939724134410111e-06, "loss": 2.5943, "step": 2152 }, { "epoch": 0.26, "learning_rate": 8.93848760606193e-06, "loss": 2.6945, "step": 2153 }, { "epoch": 0.26, "learning_rate": 8.937250442716947e-06, "loss": 2.5849, "step": 2154 }, { "epoch": 0.26, "learning_rate": 8.936012644574627e-06, "loss": 2.634, "step": 2155 }, { "epoch": 0.26, "learning_rate": 8.934774211834538e-06, "loss": 2.6516, "step": 2156 }, { "epoch": 0.26, "learning_rate": 8.933535144696352e-06, "loss": 2.5767, "step": 2157 }, { "epoch": 0.26, "learning_rate": 8.932295443359837e-06, "loss": 2.6149, "step": 2158 }, { "epoch": 0.26, "learning_rate": 8.931055108024875e-06, "loss": 2.4116, "step": 2159 }, { "epoch": 0.26, "learning_rate": 8.929814138891442e-06, "loss": 2.553, "step": 2160 }, { "epoch": 0.26, "learning_rate": 8.928572536159614e-06, "loss": 2.3409, "step": 2161 }, { "epoch": 0.26, "learning_rate": 8.927330300029575e-06, "loss": 2.6586, "step": 2162 }, { "epoch": 0.26, "learning_rate": 8.92608743070161e-06, "loss": 2.5511, "step": 2163 }, { "epoch": 0.26, "learning_rate": 8.924843928376105e-06, "loss": 2.475, "step": 2164 }, { "epoch": 0.26, "learning_rate": 8.923599793253547e-06, "loss": 2.6248, "step": 2165 }, { "epoch": 0.26, "learning_rate": 8.922355025534526e-06, "loss": 2.5138, "step": 2166 }, { "epoch": 0.26, "learning_rate": 8.921109625419734e-06, "loss": 2.7369, "step": 2167 }, { "epoch": 0.26, "learning_rate": 8.919863593109967e-06, "loss": 2.6541, "step": 2168 }, { "epoch": 0.26, "learning_rate": 8.91861692880612e-06, "loss": 2.8143, "step": 2169 }, { "epoch": 0.26, "learning_rate": 8.917369632709189e-06, "loss": 2.6361, "step": 2170 }, { "epoch": 0.26, "learning_rate": 8.916121705020277e-06, "loss": 2.5115, "step": 2171 }, { "epoch": 0.26, "learning_rate": 8.914873145940585e-06, "loss": 2.6785, "step": 2172 }, { "epoch": 0.26, "learning_rate": 8.913623955671413e-06, "loss": 2.4036, "step": 2173 }, { "epoch": 0.26, "learning_rate": 8.912374134414171e-06, "loss": 2.4772, "step": 2174 }, { "epoch": 0.26, "learning_rate": 8.911123682370364e-06, "loss": 2.7584, "step": 2175 }, { "epoch": 0.26, "learning_rate": 8.909872599741598e-06, "loss": 2.6212, "step": 2176 }, { "epoch": 0.26, "learning_rate": 8.908620886729586e-06, "loss": 2.6147, "step": 2177 }, { "epoch": 0.26, "learning_rate": 8.907368543536141e-06, "loss": 2.6618, "step": 2178 }, { "epoch": 0.26, "learning_rate": 8.906115570363174e-06, "loss": 2.7665, "step": 2179 }, { "epoch": 0.26, "learning_rate": 8.904861967412702e-06, "loss": 2.5554, "step": 2180 }, { "epoch": 0.26, "learning_rate": 8.903607734886842e-06, "loss": 2.4749, "step": 2181 }, { "epoch": 0.26, "learning_rate": 8.902352872987809e-06, "loss": 2.7009, "step": 2182 }, { "epoch": 0.26, "learning_rate": 8.901097381917925e-06, "loss": 2.4677, "step": 2183 }, { "epoch": 0.26, "learning_rate": 8.899841261879609e-06, "loss": 2.7227, "step": 2184 }, { "epoch": 0.26, "learning_rate": 8.898584513075387e-06, "loss": 2.4948, "step": 2185 }, { "epoch": 0.26, "learning_rate": 8.897327135707881e-06, "loss": 2.5652, "step": 2186 }, { "epoch": 0.26, "learning_rate": 8.896069129979814e-06, "loss": 2.4784, "step": 2187 }, { "epoch": 0.26, "learning_rate": 8.894810496094016e-06, "loss": 2.5692, "step": 2188 }, { "epoch": 0.26, "learning_rate": 8.893551234253414e-06, "loss": 2.4778, "step": 2189 }, { "epoch": 0.26, "learning_rate": 8.892291344661035e-06, "loss": 2.6541, "step": 2190 }, { "epoch": 0.26, "learning_rate": 8.89103082752001e-06, "loss": 2.5475, "step": 2191 }, { "epoch": 0.26, "learning_rate": 8.889769683033573e-06, "loss": 2.6381, "step": 2192 }, { "epoch": 0.26, "learning_rate": 8.888507911405055e-06, "loss": 2.6299, "step": 2193 }, { "epoch": 0.26, "learning_rate": 8.887245512837887e-06, "loss": 2.5083, "step": 2194 }, { "epoch": 0.26, "learning_rate": 8.885982487535607e-06, "loss": 2.7068, "step": 2195 }, { "epoch": 0.26, "learning_rate": 8.88471883570185e-06, "loss": 2.648, "step": 2196 }, { "epoch": 0.26, "learning_rate": 8.88345455754035e-06, "loss": 2.6323, "step": 2197 }, { "epoch": 0.26, "learning_rate": 8.882189653254951e-06, "loss": 2.6511, "step": 2198 }, { "epoch": 0.26, "learning_rate": 8.880924123049586e-06, "loss": 2.578, "step": 2199 }, { "epoch": 0.26, "learning_rate": 8.879657967128297e-06, "loss": 2.5624, "step": 2200 }, { "epoch": 0.26, "learning_rate": 8.878391185695223e-06, "loss": 2.5314, "step": 2201 }, { "epoch": 0.26, "learning_rate": 8.877123778954608e-06, "loss": 2.5884, "step": 2202 }, { "epoch": 0.26, "learning_rate": 8.875855747110792e-06, "loss": 2.7062, "step": 2203 }, { "epoch": 0.26, "learning_rate": 8.874587090368221e-06, "loss": 2.7647, "step": 2204 }, { "epoch": 0.26, "learning_rate": 8.873317808931433e-06, "loss": 2.663, "step": 2205 }, { "epoch": 0.27, "learning_rate": 8.872047903005079e-06, "loss": 2.4433, "step": 2206 }, { "epoch": 0.27, "learning_rate": 8.8707773727939e-06, "loss": 2.6787, "step": 2207 }, { "epoch": 0.27, "learning_rate": 8.869506218502742e-06, "loss": 2.6936, "step": 2208 }, { "epoch": 0.27, "learning_rate": 8.868234440336555e-06, "loss": 2.8175, "step": 2209 }, { "epoch": 0.27, "learning_rate": 8.86696203850038e-06, "loss": 2.7346, "step": 2210 }, { "epoch": 0.27, "learning_rate": 8.865689013199369e-06, "loss": 2.5446, "step": 2211 }, { "epoch": 0.27, "learning_rate": 8.86441536463877e-06, "loss": 2.546, "step": 2212 }, { "epoch": 0.27, "learning_rate": 8.863141093023928e-06, "loss": 2.4981, "step": 2213 }, { "epoch": 0.27, "learning_rate": 8.861866198560297e-06, "loss": 2.8057, "step": 2214 }, { "epoch": 0.27, "learning_rate": 8.860590681453424e-06, "loss": 2.7094, "step": 2215 }, { "epoch": 0.27, "learning_rate": 8.859314541908957e-06, "loss": 2.3175, "step": 2216 }, { "epoch": 0.27, "learning_rate": 8.858037780132649e-06, "loss": 2.4956, "step": 2217 }, { "epoch": 0.27, "learning_rate": 8.85676039633035e-06, "loss": 2.6197, "step": 2218 }, { "epoch": 0.27, "learning_rate": 8.85548239070801e-06, "loss": 2.6171, "step": 2219 }, { "epoch": 0.27, "learning_rate": 8.85420376347168e-06, "loss": 2.7136, "step": 2220 }, { "epoch": 0.27, "learning_rate": 8.852924514827512e-06, "loss": 2.509, "step": 2221 }, { "epoch": 0.27, "learning_rate": 8.851644644981756e-06, "loss": 2.5588, "step": 2222 }, { "epoch": 0.27, "learning_rate": 8.850364154140764e-06, "loss": 2.458, "step": 2223 }, { "epoch": 0.27, "learning_rate": 8.849083042510991e-06, "loss": 2.4914, "step": 2224 }, { "epoch": 0.27, "learning_rate": 8.847801310298985e-06, "loss": 2.6884, "step": 2225 }, { "epoch": 0.27, "learning_rate": 8.846518957711398e-06, "loss": 2.5802, "step": 2226 }, { "epoch": 0.27, "learning_rate": 8.845235984954985e-06, "loss": 2.596, "step": 2227 }, { "epoch": 0.27, "learning_rate": 8.843952392236595e-06, "loss": 2.6337, "step": 2228 }, { "epoch": 0.27, "learning_rate": 8.84266817976318e-06, "loss": 2.6232, "step": 2229 }, { "epoch": 0.27, "learning_rate": 8.841383347741794e-06, "loss": 2.5654, "step": 2230 }, { "epoch": 0.27, "learning_rate": 8.840097896379585e-06, "loss": 2.6835, "step": 2231 }, { "epoch": 0.27, "learning_rate": 8.838811825883808e-06, "loss": 2.602, "step": 2232 }, { "epoch": 0.27, "learning_rate": 8.837525136461814e-06, "loss": 2.6585, "step": 2233 }, { "epoch": 0.27, "learning_rate": 8.83623782832105e-06, "loss": 2.5441, "step": 2234 }, { "epoch": 0.27, "learning_rate": 8.834949901669073e-06, "loss": 2.5665, "step": 2235 }, { "epoch": 0.27, "learning_rate": 8.833661356713528e-06, "loss": 2.5135, "step": 2236 }, { "epoch": 0.27, "learning_rate": 8.83237219366217e-06, "loss": 2.5457, "step": 2237 }, { "epoch": 0.27, "learning_rate": 8.831082412722845e-06, "loss": 2.4427, "step": 2238 }, { "epoch": 0.27, "learning_rate": 8.829792014103505e-06, "loss": 2.551, "step": 2239 }, { "epoch": 0.27, "learning_rate": 8.8285009980122e-06, "loss": 2.6009, "step": 2240 }, { "epoch": 0.27, "learning_rate": 8.827209364657074e-06, "loss": 2.6982, "step": 2241 }, { "epoch": 0.27, "learning_rate": 8.825917114246382e-06, "loss": 2.5978, "step": 2242 }, { "epoch": 0.27, "learning_rate": 8.824624246988467e-06, "loss": 2.5223, "step": 2243 }, { "epoch": 0.27, "learning_rate": 8.823330763091775e-06, "loss": 2.5859, "step": 2244 }, { "epoch": 0.27, "learning_rate": 8.822036662764856e-06, "loss": 2.7149, "step": 2245 }, { "epoch": 0.27, "learning_rate": 8.820741946216357e-06, "loss": 2.6577, "step": 2246 }, { "epoch": 0.27, "learning_rate": 8.819446613655021e-06, "loss": 2.6481, "step": 2247 }, { "epoch": 0.27, "learning_rate": 8.81815066528969e-06, "loss": 2.7125, "step": 2248 }, { "epoch": 0.27, "learning_rate": 8.816854101329313e-06, "loss": 2.6123, "step": 2249 }, { "epoch": 0.27, "learning_rate": 8.81555692198293e-06, "loss": 2.5834, "step": 2250 }, { "epoch": 0.27, "learning_rate": 8.814259127459686e-06, "loss": 2.5848, "step": 2251 }, { "epoch": 0.27, "learning_rate": 8.81296071796882e-06, "loss": 2.531, "step": 2252 }, { "epoch": 0.27, "learning_rate": 8.811661693719673e-06, "loss": 2.5899, "step": 2253 }, { "epoch": 0.27, "learning_rate": 8.810362054921685e-06, "loss": 2.5189, "step": 2254 }, { "epoch": 0.27, "learning_rate": 8.809061801784395e-06, "loss": 2.4461, "step": 2255 }, { "epoch": 0.27, "learning_rate": 8.807760934517444e-06, "loss": 2.7421, "step": 2256 }, { "epoch": 0.27, "learning_rate": 8.806459453330565e-06, "loss": 2.7232, "step": 2257 }, { "epoch": 0.27, "learning_rate": 8.805157358433595e-06, "loss": 2.5685, "step": 2258 }, { "epoch": 0.27, "learning_rate": 8.80385465003647e-06, "loss": 2.5733, "step": 2259 }, { "epoch": 0.27, "learning_rate": 8.802551328349222e-06, "loss": 2.6334, "step": 2260 }, { "epoch": 0.27, "learning_rate": 8.801247393581987e-06, "loss": 2.6151, "step": 2261 }, { "epoch": 0.27, "learning_rate": 8.799942845944993e-06, "loss": 2.6007, "step": 2262 }, { "epoch": 0.27, "learning_rate": 8.79863768564857e-06, "loss": 2.6084, "step": 2263 }, { "epoch": 0.27, "learning_rate": 8.797331912903152e-06, "loss": 2.5446, "step": 2264 }, { "epoch": 0.27, "learning_rate": 8.796025527919263e-06, "loss": 2.718, "step": 2265 }, { "epoch": 0.27, "learning_rate": 8.794718530907529e-06, "loss": 2.5722, "step": 2266 }, { "epoch": 0.27, "learning_rate": 8.793410922078677e-06, "loss": 2.5749, "step": 2267 }, { "epoch": 0.27, "learning_rate": 8.792102701643532e-06, "loss": 2.386, "step": 2268 }, { "epoch": 0.27, "learning_rate": 8.790793869813014e-06, "loss": 2.7055, "step": 2269 }, { "epoch": 0.27, "learning_rate": 8.789484426798148e-06, "loss": 2.6045, "step": 2270 }, { "epoch": 0.27, "learning_rate": 8.788174372810048e-06, "loss": 2.5907, "step": 2271 }, { "epoch": 0.27, "learning_rate": 8.786863708059936e-06, "loss": 2.5085, "step": 2272 }, { "epoch": 0.27, "learning_rate": 8.785552432759127e-06, "loss": 2.6217, "step": 2273 }, { "epoch": 0.27, "learning_rate": 8.784240547119039e-06, "loss": 2.746, "step": 2274 }, { "epoch": 0.27, "learning_rate": 8.782928051351183e-06, "loss": 2.4063, "step": 2275 }, { "epoch": 0.27, "learning_rate": 8.78161494566717e-06, "loss": 2.662, "step": 2276 }, { "epoch": 0.27, "learning_rate": 8.780301230278711e-06, "loss": 2.6546, "step": 2277 }, { "epoch": 0.27, "learning_rate": 8.778986905397615e-06, "loss": 2.5244, "step": 2278 }, { "epoch": 0.27, "learning_rate": 8.77767197123579e-06, "loss": 2.5505, "step": 2279 }, { "epoch": 0.27, "learning_rate": 8.776356428005237e-06, "loss": 2.7441, "step": 2280 }, { "epoch": 0.27, "learning_rate": 8.775040275918063e-06, "loss": 2.69, "step": 2281 }, { "epoch": 0.27, "learning_rate": 8.77372351518647e-06, "loss": 2.5176, "step": 2282 }, { "epoch": 0.27, "learning_rate": 8.772406146022751e-06, "loss": 2.5723, "step": 2283 }, { "epoch": 0.27, "learning_rate": 8.771088168639312e-06, "loss": 2.5704, "step": 2284 }, { "epoch": 0.27, "learning_rate": 8.769769583248645e-06, "loss": 2.7373, "step": 2285 }, { "epoch": 0.27, "learning_rate": 8.768450390063342e-06, "loss": 2.5102, "step": 2286 }, { "epoch": 0.27, "learning_rate": 8.767130589296095e-06, "loss": 2.4319, "step": 2287 }, { "epoch": 0.27, "learning_rate": 8.765810181159696e-06, "loss": 2.6602, "step": 2288 }, { "epoch": 0.27, "learning_rate": 8.764489165867029e-06, "loss": 2.5159, "step": 2289 }, { "epoch": 0.28, "learning_rate": 8.763167543631084e-06, "loss": 2.6135, "step": 2290 }, { "epoch": 0.28, "learning_rate": 8.761845314664942e-06, "loss": 2.7723, "step": 2291 }, { "epoch": 0.28, "learning_rate": 8.760522479181784e-06, "loss": 2.6285, "step": 2292 }, { "epoch": 0.28, "learning_rate": 8.759199037394888e-06, "loss": 2.5177, "step": 2293 }, { "epoch": 0.28, "learning_rate": 8.757874989517631e-06, "loss": 2.6341, "step": 2294 }, { "epoch": 0.28, "learning_rate": 8.75655033576349e-06, "loss": 2.5947, "step": 2295 }, { "epoch": 0.28, "learning_rate": 8.755225076346035e-06, "loss": 2.5884, "step": 2296 }, { "epoch": 0.28, "learning_rate": 8.753899211478933e-06, "loss": 2.5412, "step": 2297 }, { "epoch": 0.28, "learning_rate": 8.752572741375956e-06, "loss": 2.6923, "step": 2298 }, { "epoch": 0.28, "learning_rate": 8.751245666250968e-06, "loss": 2.6304, "step": 2299 }, { "epoch": 0.28, "learning_rate": 8.74991798631793e-06, "loss": 2.4996, "step": 2300 }, { "epoch": 0.28, "learning_rate": 8.7485897017909e-06, "loss": 2.6367, "step": 2301 }, { "epoch": 0.28, "learning_rate": 8.74726081288404e-06, "loss": 2.703, "step": 2302 }, { "epoch": 0.28, "learning_rate": 8.745931319811603e-06, "loss": 2.4673, "step": 2303 }, { "epoch": 0.28, "learning_rate": 8.744601222787938e-06, "loss": 2.5757, "step": 2304 }, { "epoch": 0.28, "learning_rate": 8.7432705220275e-06, "loss": 2.6648, "step": 2305 }, { "epoch": 0.28, "learning_rate": 8.741939217744835e-06, "loss": 2.6826, "step": 2306 }, { "epoch": 0.28, "learning_rate": 8.740607310154583e-06, "loss": 2.7921, "step": 2307 }, { "epoch": 0.28, "learning_rate": 8.739274799471492e-06, "loss": 2.6572, "step": 2308 }, { "epoch": 0.28, "learning_rate": 8.737941685910395e-06, "loss": 2.2318, "step": 2309 }, { "epoch": 0.28, "learning_rate": 8.736607969686231e-06, "loss": 2.6085, "step": 2310 }, { "epoch": 0.28, "learning_rate": 8.735273651014031e-06, "loss": 2.6578, "step": 2311 }, { "epoch": 0.28, "learning_rate": 8.733938730108928e-06, "loss": 2.6034, "step": 2312 }, { "epoch": 0.28, "learning_rate": 8.73260320718615e-06, "loss": 2.6364, "step": 2313 }, { "epoch": 0.28, "learning_rate": 8.731267082461018e-06, "loss": 2.6456, "step": 2314 }, { "epoch": 0.28, "learning_rate": 8.729930356148956e-06, "loss": 2.5852, "step": 2315 }, { "epoch": 0.28, "learning_rate": 8.728593028465481e-06, "loss": 2.6869, "step": 2316 }, { "epoch": 0.28, "learning_rate": 8.72725509962621e-06, "loss": 2.5301, "step": 2317 }, { "epoch": 0.28, "learning_rate": 8.725916569846854e-06, "loss": 2.5863, "step": 2318 }, { "epoch": 0.28, "learning_rate": 8.724577439343223e-06, "loss": 2.5897, "step": 2319 }, { "epoch": 0.28, "learning_rate": 8.723237708331225e-06, "loss": 2.6298, "step": 2320 }, { "epoch": 0.28, "learning_rate": 8.721897377026859e-06, "loss": 2.7035, "step": 2321 }, { "epoch": 0.28, "learning_rate": 8.720556445646226e-06, "loss": 2.4774, "step": 2322 }, { "epoch": 0.28, "learning_rate": 8.719214914405525e-06, "loss": 2.4448, "step": 2323 }, { "epoch": 0.28, "learning_rate": 8.717872783521048e-06, "loss": 2.4175, "step": 2324 }, { "epoch": 0.28, "learning_rate": 8.716530053209182e-06, "loss": 2.4623, "step": 2325 }, { "epoch": 0.28, "learning_rate": 8.715186723686418e-06, "loss": 2.6693, "step": 2326 }, { "epoch": 0.28, "learning_rate": 8.713842795169334e-06, "loss": 2.7202, "step": 2327 }, { "epoch": 0.28, "learning_rate": 8.712498267874615e-06, "loss": 2.7234, "step": 2328 }, { "epoch": 0.28, "learning_rate": 8.711153142019035e-06, "loss": 2.4721, "step": 2329 }, { "epoch": 0.28, "learning_rate": 8.709807417819464e-06, "loss": 2.6127, "step": 2330 }, { "epoch": 0.28, "learning_rate": 8.708461095492876e-06, "loss": 2.4876, "step": 2331 }, { "epoch": 0.28, "learning_rate": 8.707114175256335e-06, "loss": 2.6058, "step": 2332 }, { "epoch": 0.28, "learning_rate": 8.705766657326999e-06, "loss": 2.3585, "step": 2333 }, { "epoch": 0.28, "learning_rate": 8.704418541922132e-06, "loss": 2.5525, "step": 2334 }, { "epoch": 0.28, "learning_rate": 8.703069829259087e-06, "loss": 2.4915, "step": 2335 }, { "epoch": 0.28, "learning_rate": 8.701720519555315e-06, "loss": 2.5493, "step": 2336 }, { "epoch": 0.28, "learning_rate": 8.700370613028364e-06, "loss": 2.6009, "step": 2337 }, { "epoch": 0.28, "learning_rate": 8.699020109895875e-06, "loss": 2.5307, "step": 2338 }, { "epoch": 0.28, "learning_rate": 8.69766901037559e-06, "loss": 2.3723, "step": 2339 }, { "epoch": 0.28, "learning_rate": 8.696317314685342e-06, "loss": 2.5767, "step": 2340 }, { "epoch": 0.28, "learning_rate": 8.694965023043067e-06, "loss": 2.5408, "step": 2341 }, { "epoch": 0.28, "learning_rate": 8.69361213566679e-06, "loss": 2.5031, "step": 2342 }, { "epoch": 0.28, "learning_rate": 8.692258652774636e-06, "loss": 2.4459, "step": 2343 }, { "epoch": 0.28, "learning_rate": 8.690904574584828e-06, "loss": 2.5701, "step": 2344 }, { "epoch": 0.28, "learning_rate": 8.689549901315677e-06, "loss": 2.3174, "step": 2345 }, { "epoch": 0.28, "learning_rate": 8.6881946331856e-06, "loss": 2.6292, "step": 2346 }, { "epoch": 0.28, "learning_rate": 8.6868387704131e-06, "loss": 2.5507, "step": 2347 }, { "epoch": 0.28, "learning_rate": 8.685482313216784e-06, "loss": 2.6359, "step": 2348 }, { "epoch": 0.28, "learning_rate": 8.684125261815352e-06, "loss": 2.5649, "step": 2349 }, { "epoch": 0.28, "learning_rate": 8.682767616427598e-06, "loss": 2.5765, "step": 2350 }, { "epoch": 0.28, "learning_rate": 8.681409377272414e-06, "loss": 2.7976, "step": 2351 }, { "epoch": 0.28, "learning_rate": 8.680050544568788e-06, "loss": 2.8242, "step": 2352 }, { "epoch": 0.28, "learning_rate": 8.6786911185358e-06, "loss": 2.5279, "step": 2353 }, { "epoch": 0.28, "learning_rate": 8.67733109939263e-06, "loss": 2.7454, "step": 2354 }, { "epoch": 0.28, "learning_rate": 8.675970487358552e-06, "loss": 2.7214, "step": 2355 }, { "epoch": 0.28, "learning_rate": 8.674609282652936e-06, "loss": 2.4745, "step": 2356 }, { "epoch": 0.28, "learning_rate": 8.673247485495247e-06, "loss": 2.7342, "step": 2357 }, { "epoch": 0.28, "learning_rate": 8.671885096105042e-06, "loss": 2.4902, "step": 2358 }, { "epoch": 0.28, "learning_rate": 8.670522114701983e-06, "loss": 2.7203, "step": 2359 }, { "epoch": 0.28, "learning_rate": 8.669158541505817e-06, "loss": 2.5739, "step": 2360 }, { "epoch": 0.28, "learning_rate": 8.667794376736395e-06, "loss": 2.5216, "step": 2361 }, { "epoch": 0.28, "learning_rate": 8.666429620613656e-06, "loss": 2.7359, "step": 2362 }, { "epoch": 0.28, "learning_rate": 8.665064273357638e-06, "loss": 2.547, "step": 2363 }, { "epoch": 0.28, "learning_rate": 8.663698335188477e-06, "loss": 2.5363, "step": 2364 }, { "epoch": 0.28, "learning_rate": 8.662331806326399e-06, "loss": 2.5336, "step": 2365 }, { "epoch": 0.28, "learning_rate": 8.660964686991725e-06, "loss": 2.6045, "step": 2366 }, { "epoch": 0.28, "learning_rate": 8.659596977404879e-06, "loss": 2.6891, "step": 2367 }, { "epoch": 0.28, "learning_rate": 8.65822867778637e-06, "loss": 2.523, "step": 2368 }, { "epoch": 0.28, "learning_rate": 8.656859788356811e-06, "loss": 2.6495, "step": 2369 }, { "epoch": 0.28, "learning_rate": 8.655490309336905e-06, "loss": 2.5656, "step": 2370 }, { "epoch": 0.28, "learning_rate": 8.65412024094745e-06, "loss": 2.5992, "step": 2371 }, { "epoch": 0.28, "learning_rate": 8.65274958340934e-06, "loss": 2.699, "step": 2372 }, { "epoch": 0.29, "learning_rate": 8.651378336943565e-06, "loss": 2.5365, "step": 2373 }, { "epoch": 0.29, "learning_rate": 8.65000650177121e-06, "loss": 2.5822, "step": 2374 }, { "epoch": 0.29, "learning_rate": 8.648634078113453e-06, "loss": 2.5401, "step": 2375 }, { "epoch": 0.29, "learning_rate": 8.647261066191569e-06, "loss": 2.5774, "step": 2376 }, { "epoch": 0.29, "learning_rate": 8.645887466226923e-06, "loss": 2.6625, "step": 2377 }, { "epoch": 0.29, "learning_rate": 8.644513278440984e-06, "loss": 2.5682, "step": 2378 }, { "epoch": 0.29, "learning_rate": 8.643138503055306e-06, "loss": 2.6275, "step": 2379 }, { "epoch": 0.29, "learning_rate": 8.641763140291546e-06, "loss": 2.5354, "step": 2380 }, { "epoch": 0.29, "learning_rate": 8.640387190371448e-06, "loss": 2.3807, "step": 2381 }, { "epoch": 0.29, "learning_rate": 8.639010653516858e-06, "loss": 2.6182, "step": 2382 }, { "epoch": 0.29, "learning_rate": 8.63763352994971e-06, "loss": 2.5359, "step": 2383 }, { "epoch": 0.29, "learning_rate": 8.636255819892037e-06, "loss": 2.6359, "step": 2384 }, { "epoch": 0.29, "learning_rate": 8.634877523565964e-06, "loss": 2.6336, "step": 2385 }, { "epoch": 0.29, "learning_rate": 8.633498641193713e-06, "loss": 2.6452, "step": 2386 }, { "epoch": 0.29, "learning_rate": 8.632119172997601e-06, "loss": 2.4194, "step": 2387 }, { "epoch": 0.29, "learning_rate": 8.630739119200035e-06, "loss": 2.5368, "step": 2388 }, { "epoch": 0.29, "learning_rate": 8.629358480023521e-06, "loss": 2.4869, "step": 2389 }, { "epoch": 0.29, "learning_rate": 8.627977255690658e-06, "loss": 2.4915, "step": 2390 }, { "epoch": 0.29, "learning_rate": 8.626595446424133e-06, "loss": 2.782, "step": 2391 }, { "epoch": 0.29, "learning_rate": 8.62521305244674e-06, "loss": 2.5767, "step": 2392 }, { "epoch": 0.29, "learning_rate": 8.623830073981361e-06, "loss": 2.446, "step": 2393 }, { "epoch": 0.29, "learning_rate": 8.622446511250964e-06, "loss": 2.4755, "step": 2394 }, { "epoch": 0.29, "learning_rate": 8.621062364478627e-06, "loss": 2.5466, "step": 2395 }, { "epoch": 0.29, "learning_rate": 8.61967763388751e-06, "loss": 2.4267, "step": 2396 }, { "epoch": 0.29, "learning_rate": 8.61829231970087e-06, "loss": 2.5937, "step": 2397 }, { "epoch": 0.29, "learning_rate": 8.616906422142061e-06, "loss": 2.5518, "step": 2398 }, { "epoch": 0.29, "learning_rate": 8.61551994143453e-06, "loss": 2.5754, "step": 2399 }, { "epoch": 0.29, "learning_rate": 8.614132877801817e-06, "loss": 2.7716, "step": 2400 }, { "epoch": 0.29, "learning_rate": 8.612745231467556e-06, "loss": 2.5672, "step": 2401 }, { "epoch": 0.29, "learning_rate": 8.611357002655475e-06, "loss": 2.6149, "step": 2402 }, { "epoch": 0.29, "learning_rate": 8.609968191589396e-06, "loss": 2.6132, "step": 2403 }, { "epoch": 0.29, "learning_rate": 8.608578798493237e-06, "loss": 2.6278, "step": 2404 }, { "epoch": 0.29, "learning_rate": 8.607188823591004e-06, "loss": 2.6757, "step": 2405 }, { "epoch": 0.29, "learning_rate": 8.605798267106805e-06, "loss": 2.7148, "step": 2406 }, { "epoch": 0.29, "learning_rate": 8.604407129264835e-06, "loss": 2.7476, "step": 2407 }, { "epoch": 0.29, "learning_rate": 8.603015410289387e-06, "loss": 2.5226, "step": 2408 }, { "epoch": 0.29, "learning_rate": 8.601623110404841e-06, "loss": 2.5611, "step": 2409 }, { "epoch": 0.29, "learning_rate": 8.600230229835682e-06, "loss": 2.6794, "step": 2410 }, { "epoch": 0.29, "learning_rate": 8.598836768806478e-06, "loss": 2.6658, "step": 2411 }, { "epoch": 0.29, "learning_rate": 8.597442727541898e-06, "loss": 2.6075, "step": 2412 }, { "epoch": 0.29, "learning_rate": 8.596048106266697e-06, "loss": 2.567, "step": 2413 }, { "epoch": 0.29, "learning_rate": 8.594652905205731e-06, "loss": 2.5864, "step": 2414 }, { "epoch": 0.29, "learning_rate": 8.593257124583946e-06, "loss": 2.5504, "step": 2415 }, { "epoch": 0.29, "learning_rate": 8.591860764626381e-06, "loss": 2.5646, "step": 2416 }, { "epoch": 0.29, "learning_rate": 8.590463825558169e-06, "loss": 2.6392, "step": 2417 }, { "epoch": 0.29, "learning_rate": 8.589066307604537e-06, "loss": 2.758, "step": 2418 }, { "epoch": 0.29, "learning_rate": 8.587668210990805e-06, "loss": 2.4847, "step": 2419 }, { "epoch": 0.29, "learning_rate": 8.586269535942386e-06, "loss": 2.5166, "step": 2420 }, { "epoch": 0.29, "learning_rate": 8.584870282684786e-06, "loss": 2.6342, "step": 2421 }, { "epoch": 0.29, "learning_rate": 8.583470451443605e-06, "loss": 2.6081, "step": 2422 }, { "epoch": 0.29, "learning_rate": 8.582070042444535e-06, "loss": 2.5615, "step": 2423 }, { "epoch": 0.29, "learning_rate": 8.580669055913364e-06, "loss": 2.5954, "step": 2424 }, { "epoch": 0.29, "learning_rate": 8.579267492075968e-06, "loss": 2.4868, "step": 2425 }, { "epoch": 0.29, "learning_rate": 8.577865351158324e-06, "loss": 2.4834, "step": 2426 }, { "epoch": 0.29, "learning_rate": 8.57646263338649e-06, "loss": 2.5618, "step": 2427 }, { "epoch": 0.29, "learning_rate": 8.575059338986632e-06, "loss": 2.4996, "step": 2428 }, { "epoch": 0.29, "learning_rate": 8.573655468184997e-06, "loss": 2.5122, "step": 2429 }, { "epoch": 0.29, "learning_rate": 8.57225102120793e-06, "loss": 2.4806, "step": 2430 }, { "epoch": 0.29, "learning_rate": 8.570845998281865e-06, "loss": 2.6045, "step": 2431 }, { "epoch": 0.29, "learning_rate": 8.569440399633337e-06, "loss": 2.4304, "step": 2432 }, { "epoch": 0.29, "learning_rate": 8.568034225488964e-06, "loss": 2.4538, "step": 2433 }, { "epoch": 0.29, "learning_rate": 8.566627476075467e-06, "loss": 2.64, "step": 2434 }, { "epoch": 0.29, "learning_rate": 8.565220151619648e-06, "loss": 2.6859, "step": 2435 }, { "epoch": 0.29, "learning_rate": 8.563812252348412e-06, "loss": 2.7395, "step": 2436 }, { "epoch": 0.29, "learning_rate": 8.56240377848875e-06, "loss": 2.5786, "step": 2437 }, { "epoch": 0.29, "learning_rate": 8.560994730267751e-06, "loss": 2.4372, "step": 2438 }, { "epoch": 0.29, "learning_rate": 8.559585107912593e-06, "loss": 2.7312, "step": 2439 }, { "epoch": 0.29, "learning_rate": 8.558174911650546e-06, "loss": 2.54, "step": 2440 }, { "epoch": 0.29, "learning_rate": 8.556764141708975e-06, "loss": 2.3839, "step": 2441 }, { "epoch": 0.29, "learning_rate": 8.555352798315339e-06, "loss": 2.3791, "step": 2442 }, { "epoch": 0.29, "learning_rate": 8.553940881697182e-06, "loss": 2.6749, "step": 2443 }, { "epoch": 0.29, "learning_rate": 8.552528392082147e-06, "loss": 2.7619, "step": 2444 }, { "epoch": 0.29, "learning_rate": 8.55111532969797e-06, "loss": 2.4611, "step": 2445 }, { "epoch": 0.29, "learning_rate": 8.549701694772475e-06, "loss": 2.5515, "step": 2446 }, { "epoch": 0.29, "learning_rate": 8.548287487533579e-06, "loss": 2.4892, "step": 2447 }, { "epoch": 0.29, "learning_rate": 8.546872708209297e-06, "loss": 2.4429, "step": 2448 }, { "epoch": 0.29, "learning_rate": 8.545457357027727e-06, "loss": 2.6093, "step": 2449 }, { "epoch": 0.29, "learning_rate": 8.544041434217067e-06, "loss": 2.7221, "step": 2450 }, { "epoch": 0.29, "learning_rate": 8.542624940005604e-06, "loss": 2.6011, "step": 2451 }, { "epoch": 0.29, "learning_rate": 8.541207874621718e-06, "loss": 2.5159, "step": 2452 }, { "epoch": 0.29, "learning_rate": 8.539790238293878e-06, "loss": 2.514, "step": 2453 }, { "epoch": 0.29, "learning_rate": 8.53837203125065e-06, "loss": 2.4945, "step": 2454 }, { "epoch": 0.29, "learning_rate": 8.536953253720687e-06, "loss": 2.4896, "step": 2455 }, { "epoch": 0.3, "learning_rate": 8.535533905932739e-06, "loss": 2.4572, "step": 2456 }, { "epoch": 0.3, "learning_rate": 8.534113988115645e-06, "loss": 2.7591, "step": 2457 }, { "epoch": 0.3, "learning_rate": 8.532693500498334e-06, "loss": 2.7264, "step": 2458 }, { "epoch": 0.3, "learning_rate": 8.53127244330983e-06, "loss": 2.6027, "step": 2459 }, { "epoch": 0.3, "learning_rate": 8.529850816779252e-06, "loss": 2.4524, "step": 2460 }, { "epoch": 0.3, "learning_rate": 8.528428621135802e-06, "loss": 2.6452, "step": 2461 }, { "epoch": 0.3, "learning_rate": 8.52700585660878e-06, "loss": 2.6584, "step": 2462 }, { "epoch": 0.3, "learning_rate": 8.525582523427578e-06, "loss": 2.6005, "step": 2463 }, { "epoch": 0.3, "learning_rate": 8.524158621821678e-06, "loss": 2.5459, "step": 2464 }, { "epoch": 0.3, "learning_rate": 8.52273415202065e-06, "loss": 2.6272, "step": 2465 }, { "epoch": 0.3, "learning_rate": 8.521309114254164e-06, "loss": 2.4999, "step": 2466 }, { "epoch": 0.3, "learning_rate": 8.519883508751972e-06, "loss": 2.6229, "step": 2467 }, { "epoch": 0.3, "learning_rate": 8.518457335743927e-06, "loss": 2.5676, "step": 2468 }, { "epoch": 0.3, "learning_rate": 8.517030595459966e-06, "loss": 2.4274, "step": 2469 }, { "epoch": 0.3, "learning_rate": 8.515603288130119e-06, "loss": 2.4998, "step": 2470 }, { "epoch": 0.3, "learning_rate": 8.514175413984513e-06, "loss": 2.6171, "step": 2471 }, { "epoch": 0.3, "learning_rate": 8.512746973253358e-06, "loss": 2.6117, "step": 2472 }, { "epoch": 0.3, "learning_rate": 8.511317966166963e-06, "loss": 2.6337, "step": 2473 }, { "epoch": 0.3, "learning_rate": 8.509888392955725e-06, "loss": 2.5162, "step": 2474 }, { "epoch": 0.3, "learning_rate": 8.508458253850126e-06, "loss": 2.6302, "step": 2475 }, { "epoch": 0.3, "learning_rate": 8.507027549080753e-06, "loss": 2.5069, "step": 2476 }, { "epoch": 0.3, "learning_rate": 8.505596278878272e-06, "loss": 2.5346, "step": 2477 }, { "epoch": 0.3, "learning_rate": 8.504164443473446e-06, "loss": 2.6742, "step": 2478 }, { "epoch": 0.3, "learning_rate": 8.502732043097128e-06, "loss": 2.468, "step": 2479 }, { "epoch": 0.3, "learning_rate": 8.50129907798026e-06, "loss": 2.4726, "step": 2480 }, { "epoch": 0.3, "learning_rate": 8.499865548353879e-06, "loss": 2.6581, "step": 2481 }, { "epoch": 0.3, "learning_rate": 8.49843145444911e-06, "loss": 2.5507, "step": 2482 }, { "epoch": 0.3, "learning_rate": 8.496996796497172e-06, "loss": 2.5632, "step": 2483 }, { "epoch": 0.3, "learning_rate": 8.49556157472937e-06, "loss": 2.6134, "step": 2484 }, { "epoch": 0.3, "learning_rate": 8.494125789377104e-06, "loss": 2.7207, "step": 2485 }, { "epoch": 0.3, "learning_rate": 8.492689440671865e-06, "loss": 2.6244, "step": 2486 }, { "epoch": 0.3, "learning_rate": 8.491252528845229e-06, "loss": 2.5673, "step": 2487 }, { "epoch": 0.3, "learning_rate": 8.489815054128874e-06, "loss": 2.6189, "step": 2488 }, { "epoch": 0.3, "learning_rate": 8.488377016754556e-06, "loss": 2.5662, "step": 2489 }, { "epoch": 0.3, "learning_rate": 8.48693841695413e-06, "loss": 2.5665, "step": 2490 }, { "epoch": 0.3, "learning_rate": 8.485499254959542e-06, "loss": 2.4691, "step": 2491 }, { "epoch": 0.3, "learning_rate": 8.484059531002822e-06, "loss": 2.4533, "step": 2492 }, { "epoch": 0.3, "learning_rate": 8.482619245316094e-06, "loss": 2.6268, "step": 2493 }, { "epoch": 0.3, "learning_rate": 8.481178398131578e-06, "loss": 2.6128, "step": 2494 }, { "epoch": 0.3, "learning_rate": 8.47973698968158e-06, "loss": 2.6875, "step": 2495 }, { "epoch": 0.3, "learning_rate": 8.478295020198488e-06, "loss": 2.5892, "step": 2496 }, { "epoch": 0.3, "learning_rate": 8.476852489914797e-06, "loss": 2.6404, "step": 2497 }, { "epoch": 0.3, "learning_rate": 8.475409399063081e-06, "loss": 2.629, "step": 2498 }, { "epoch": 0.3, "learning_rate": 8.473965747876007e-06, "loss": 2.6444, "step": 2499 }, { "epoch": 0.3, "learning_rate": 8.472521536586336e-06, "loss": 2.362, "step": 2500 }, { "epoch": 0.3, "learning_rate": 8.471076765426913e-06, "loss": 2.6292, "step": 2501 }, { "epoch": 0.3, "learning_rate": 8.469631434630677e-06, "loss": 2.6224, "step": 2502 }, { "epoch": 0.3, "learning_rate": 8.468185544430656e-06, "loss": 2.6199, "step": 2503 }, { "epoch": 0.3, "learning_rate": 8.46673909505997e-06, "loss": 2.6567, "step": 2504 }, { "epoch": 0.3, "learning_rate": 8.465292086751829e-06, "loss": 2.5208, "step": 2505 }, { "epoch": 0.3, "learning_rate": 8.46384451973953e-06, "loss": 2.571, "step": 2506 }, { "epoch": 0.3, "learning_rate": 8.462396394256462e-06, "loss": 2.7089, "step": 2507 }, { "epoch": 0.3, "learning_rate": 8.460947710536108e-06, "loss": 2.5557, "step": 2508 }, { "epoch": 0.3, "learning_rate": 8.459498468812032e-06, "loss": 2.6597, "step": 2509 }, { "epoch": 0.3, "learning_rate": 8.458048669317897e-06, "loss": 2.6636, "step": 2510 }, { "epoch": 0.3, "learning_rate": 8.45659831228745e-06, "loss": 2.5195, "step": 2511 }, { "epoch": 0.3, "learning_rate": 8.45514739795453e-06, "loss": 2.7085, "step": 2512 }, { "epoch": 0.3, "learning_rate": 8.45369592655307e-06, "loss": 2.3491, "step": 2513 }, { "epoch": 0.3, "learning_rate": 8.452243898317083e-06, "loss": 2.5634, "step": 2514 }, { "epoch": 0.3, "learning_rate": 8.450791313480679e-06, "loss": 2.6207, "step": 2515 }, { "epoch": 0.3, "learning_rate": 8.44933817227806e-06, "loss": 2.6451, "step": 2516 }, { "epoch": 0.3, "learning_rate": 8.447884474943509e-06, "loss": 2.7452, "step": 2517 }, { "epoch": 0.3, "learning_rate": 8.446430221711406e-06, "loss": 2.5703, "step": 2518 }, { "epoch": 0.3, "learning_rate": 8.444975412816216e-06, "loss": 2.5749, "step": 2519 }, { "epoch": 0.3, "learning_rate": 8.4435200484925e-06, "loss": 2.3245, "step": 2520 }, { "epoch": 0.3, "learning_rate": 8.442064128974901e-06, "loss": 2.7889, "step": 2521 }, { "epoch": 0.3, "learning_rate": 8.440607654498156e-06, "loss": 2.5646, "step": 2522 }, { "epoch": 0.3, "learning_rate": 8.43915062529709e-06, "loss": 2.4603, "step": 2523 }, { "epoch": 0.3, "learning_rate": 8.437693041606619e-06, "loss": 2.5879, "step": 2524 }, { "epoch": 0.3, "learning_rate": 8.436234903661744e-06, "loss": 2.655, "step": 2525 }, { "epoch": 0.3, "learning_rate": 8.434776211697559e-06, "loss": 2.4387, "step": 2526 }, { "epoch": 0.3, "learning_rate": 8.433316965949253e-06, "loss": 2.5422, "step": 2527 }, { "epoch": 0.3, "learning_rate": 8.43185716665209e-06, "loss": 2.655, "step": 2528 }, { "epoch": 0.3, "learning_rate": 8.430396814041436e-06, "loss": 2.5647, "step": 2529 }, { "epoch": 0.3, "learning_rate": 8.42893590835274e-06, "loss": 2.4441, "step": 2530 }, { "epoch": 0.3, "learning_rate": 8.427474449821543e-06, "loss": 2.7744, "step": 2531 }, { "epoch": 0.3, "learning_rate": 8.426012438683472e-06, "loss": 2.5379, "step": 2532 }, { "epoch": 0.3, "learning_rate": 8.424549875174248e-06, "loss": 2.4646, "step": 2533 }, { "epoch": 0.3, "learning_rate": 8.423086759529676e-06, "loss": 2.772, "step": 2534 }, { "epoch": 0.3, "learning_rate": 8.42162309198565e-06, "loss": 2.6128, "step": 2535 }, { "epoch": 0.3, "learning_rate": 8.42015887277816e-06, "loss": 2.62, "step": 2536 }, { "epoch": 0.3, "learning_rate": 8.418694102143274e-06, "loss": 2.6508, "step": 2537 }, { "epoch": 0.3, "learning_rate": 8.417228780317159e-06, "loss": 2.7049, "step": 2538 }, { "epoch": 0.31, "learning_rate": 8.41576290753607e-06, "loss": 2.634, "step": 2539 }, { "epoch": 0.31, "learning_rate": 8.41429648403634e-06, "loss": 2.5676, "step": 2540 }, { "epoch": 0.31, "learning_rate": 8.4128295100544e-06, "loss": 2.625, "step": 2541 }, { "epoch": 0.31, "learning_rate": 8.411361985826775e-06, "loss": 2.4087, "step": 2542 }, { "epoch": 0.31, "learning_rate": 8.409893911590063e-06, "loss": 2.5044, "step": 2543 }, { "epoch": 0.31, "learning_rate": 8.408425287580966e-06, "loss": 2.5427, "step": 2544 }, { "epoch": 0.31, "learning_rate": 8.406956114036265e-06, "loss": 2.6852, "step": 2545 }, { "epoch": 0.31, "learning_rate": 8.405486391192834e-06, "loss": 2.4742, "step": 2546 }, { "epoch": 0.31, "learning_rate": 8.404016119287633e-06, "loss": 2.6787, "step": 2547 }, { "epoch": 0.31, "learning_rate": 8.402545298557712e-06, "loss": 2.6733, "step": 2548 }, { "epoch": 0.31, "learning_rate": 8.401073929240211e-06, "loss": 2.5572, "step": 2549 }, { "epoch": 0.31, "learning_rate": 8.399602011572356e-06, "loss": 2.4537, "step": 2550 }, { "epoch": 0.31, "learning_rate": 8.398129545791463e-06, "loss": 2.6312, "step": 2551 }, { "epoch": 0.31, "learning_rate": 8.396656532134934e-06, "loss": 2.5922, "step": 2552 }, { "epoch": 0.31, "learning_rate": 8.395182970840261e-06, "loss": 2.5495, "step": 2553 }, { "epoch": 0.31, "learning_rate": 8.393708862145024e-06, "loss": 2.4656, "step": 2554 }, { "epoch": 0.31, "learning_rate": 8.392234206286894e-06, "loss": 2.5872, "step": 2555 }, { "epoch": 0.31, "learning_rate": 8.390759003503624e-06, "loss": 2.5661, "step": 2556 }, { "epoch": 0.31, "learning_rate": 8.389283254033061e-06, "loss": 2.5764, "step": 2557 }, { "epoch": 0.31, "learning_rate": 8.387806958113139e-06, "loss": 2.648, "step": 2558 }, { "epoch": 0.31, "learning_rate": 8.386330115981877e-06, "loss": 2.5034, "step": 2559 }, { "epoch": 0.31, "learning_rate": 8.384852727877386e-06, "loss": 2.5501, "step": 2560 }, { "epoch": 0.31, "learning_rate": 8.383374794037862e-06, "loss": 2.4438, "step": 2561 }, { "epoch": 0.31, "learning_rate": 8.381896314701589e-06, "loss": 2.6433, "step": 2562 }, { "epoch": 0.31, "learning_rate": 8.380417290106943e-06, "loss": 2.5714, "step": 2563 }, { "epoch": 0.31, "learning_rate": 8.378937720492384e-06, "loss": 2.4141, "step": 2564 }, { "epoch": 0.31, "learning_rate": 8.37745760609646e-06, "loss": 2.5779, "step": 2565 }, { "epoch": 0.31, "learning_rate": 8.375976947157808e-06, "loss": 2.604, "step": 2566 }, { "epoch": 0.31, "learning_rate": 8.374495743915153e-06, "loss": 2.5995, "step": 2567 }, { "epoch": 0.31, "learning_rate": 8.373013996607309e-06, "loss": 2.7605, "step": 2568 }, { "epoch": 0.31, "learning_rate": 8.371531705473172e-06, "loss": 2.6018, "step": 2569 }, { "epoch": 0.31, "learning_rate": 8.370048870751732e-06, "loss": 2.4328, "step": 2570 }, { "epoch": 0.31, "learning_rate": 8.368565492682064e-06, "loss": 2.5006, "step": 2571 }, { "epoch": 0.31, "learning_rate": 8.367081571503332e-06, "loss": 2.4701, "step": 2572 }, { "epoch": 0.31, "learning_rate": 8.365597107454786e-06, "loss": 2.5793, "step": 2573 }, { "epoch": 0.31, "learning_rate": 8.364112100775765e-06, "loss": 2.6341, "step": 2574 }, { "epoch": 0.31, "learning_rate": 8.36262655170569e-06, "loss": 2.5406, "step": 2575 }, { "epoch": 0.31, "learning_rate": 8.361140460484081e-06, "loss": 2.5491, "step": 2576 }, { "epoch": 0.31, "learning_rate": 8.359653827350533e-06, "loss": 2.3944, "step": 2577 }, { "epoch": 0.31, "learning_rate": 8.358166652544734e-06, "loss": 2.4618, "step": 2578 }, { "epoch": 0.31, "learning_rate": 8.356678936306463e-06, "loss": 2.773, "step": 2579 }, { "epoch": 0.31, "learning_rate": 8.355190678875577e-06, "loss": 2.5812, "step": 2580 }, { "epoch": 0.31, "learning_rate": 8.353701880492031e-06, "loss": 2.6375, "step": 2581 }, { "epoch": 0.31, "learning_rate": 8.352212541395859e-06, "loss": 2.5355, "step": 2582 }, { "epoch": 0.31, "learning_rate": 8.350722661827186e-06, "loss": 2.5235, "step": 2583 }, { "epoch": 0.31, "learning_rate": 8.349232242026221e-06, "loss": 2.6211, "step": 2584 }, { "epoch": 0.31, "learning_rate": 8.347741282233265e-06, "loss": 2.4973, "step": 2585 }, { "epoch": 0.31, "learning_rate": 8.346249782688705e-06, "loss": 2.5139, "step": 2586 }, { "epoch": 0.31, "learning_rate": 8.344757743633007e-06, "loss": 2.6732, "step": 2587 }, { "epoch": 0.31, "learning_rate": 8.343265165306736e-06, "loss": 2.5139, "step": 2588 }, { "epoch": 0.31, "learning_rate": 8.341772047950534e-06, "loss": 2.5775, "step": 2589 }, { "epoch": 0.31, "learning_rate": 8.34027839180514e-06, "loss": 2.4471, "step": 2590 }, { "epoch": 0.31, "learning_rate": 8.338784197111367e-06, "loss": 2.5801, "step": 2591 }, { "epoch": 0.31, "learning_rate": 8.337289464110128e-06, "loss": 2.5727, "step": 2592 }, { "epoch": 0.31, "learning_rate": 8.335794193042413e-06, "loss": 2.5963, "step": 2593 }, { "epoch": 0.31, "learning_rate": 8.334298384149305e-06, "loss": 2.6013, "step": 2594 }, { "epoch": 0.31, "learning_rate": 8.332802037671968e-06, "loss": 2.529, "step": 2595 }, { "epoch": 0.31, "learning_rate": 8.331305153851659e-06, "loss": 2.4846, "step": 2596 }, { "epoch": 0.31, "learning_rate": 8.329807732929715e-06, "loss": 2.57, "step": 2597 }, { "epoch": 0.31, "learning_rate": 8.328309775147567e-06, "loss": 2.6741, "step": 2598 }, { "epoch": 0.31, "learning_rate": 8.326811280746727e-06, "loss": 2.7164, "step": 2599 }, { "epoch": 0.31, "learning_rate": 8.325312249968795e-06, "loss": 2.4808, "step": 2600 }, { "epoch": 0.31, "learning_rate": 8.323812683055457e-06, "loss": 2.564, "step": 2601 }, { "epoch": 0.31, "learning_rate": 8.322312580248488e-06, "loss": 2.6342, "step": 2602 }, { "epoch": 0.31, "learning_rate": 8.320811941789746e-06, "loss": 2.668, "step": 2603 }, { "epoch": 0.31, "learning_rate": 8.319310767921174e-06, "loss": 2.5528, "step": 2604 }, { "epoch": 0.31, "learning_rate": 8.317809058884809e-06, "loss": 2.4981, "step": 2605 }, { "epoch": 0.31, "learning_rate": 8.316306814922769e-06, "loss": 2.3741, "step": 2606 }, { "epoch": 0.31, "learning_rate": 8.314804036277254e-06, "loss": 2.436, "step": 2607 }, { "epoch": 0.31, "learning_rate": 8.313300723190561e-06, "loss": 2.5505, "step": 2608 }, { "epoch": 0.31, "learning_rate": 8.311796875905061e-06, "loss": 2.635, "step": 2609 }, { "epoch": 0.31, "learning_rate": 8.310292494663222e-06, "loss": 2.671, "step": 2610 }, { "epoch": 0.31, "learning_rate": 8.308787579707591e-06, "loss": 2.5532, "step": 2611 }, { "epoch": 0.31, "learning_rate": 8.307282131280805e-06, "loss": 2.4858, "step": 2612 }, { "epoch": 0.31, "learning_rate": 8.305776149625584e-06, "loss": 2.5576, "step": 2613 }, { "epoch": 0.31, "learning_rate": 8.304269634984735e-06, "loss": 2.4927, "step": 2614 }, { "epoch": 0.31, "learning_rate": 8.30276258760115e-06, "loss": 2.5737, "step": 2615 }, { "epoch": 0.31, "learning_rate": 8.301255007717812e-06, "loss": 2.5424, "step": 2616 }, { "epoch": 0.31, "learning_rate": 8.299746895577785e-06, "loss": 2.6324, "step": 2617 }, { "epoch": 0.31, "learning_rate": 8.298238251424216e-06, "loss": 2.551, "step": 2618 }, { "epoch": 0.31, "learning_rate": 8.296729075500345e-06, "loss": 2.5114, "step": 2619 }, { "epoch": 0.31, "learning_rate": 8.295219368049494e-06, "loss": 2.5515, "step": 2620 }, { "epoch": 0.31, "learning_rate": 8.29370912931507e-06, "loss": 2.7195, "step": 2621 }, { "epoch": 0.31, "learning_rate": 8.292198359540566e-06, "loss": 2.5085, "step": 2622 }, { "epoch": 0.32, "learning_rate": 8.290687058969564e-06, "loss": 2.5845, "step": 2623 }, { "epoch": 0.32, "learning_rate": 8.289175227845727e-06, "loss": 2.6207, "step": 2624 }, { "epoch": 0.32, "learning_rate": 8.287662866412807e-06, "loss": 2.5274, "step": 2625 }, { "epoch": 0.32, "learning_rate": 8.286149974914637e-06, "loss": 2.3412, "step": 2626 }, { "epoch": 0.32, "learning_rate": 8.28463655359514e-06, "loss": 2.6722, "step": 2627 }, { "epoch": 0.32, "learning_rate": 8.283122602698324e-06, "loss": 2.5865, "step": 2628 }, { "epoch": 0.32, "learning_rate": 8.281608122468278e-06, "loss": 2.5272, "step": 2629 }, { "epoch": 0.32, "learning_rate": 8.280093113149182e-06, "loss": 2.4534, "step": 2630 }, { "epoch": 0.32, "learning_rate": 8.2785775749853e-06, "loss": 2.6454, "step": 2631 }, { "epoch": 0.32, "learning_rate": 8.277061508220975e-06, "loss": 2.6761, "step": 2632 }, { "epoch": 0.32, "learning_rate": 8.275544913100646e-06, "loss": 2.7751, "step": 2633 }, { "epoch": 0.32, "learning_rate": 8.274027789868828e-06, "loss": 2.6434, "step": 2634 }, { "epoch": 0.32, "learning_rate": 8.272510138770128e-06, "loss": 2.5789, "step": 2635 }, { "epoch": 0.32, "learning_rate": 8.270991960049231e-06, "loss": 2.5515, "step": 2636 }, { "epoch": 0.32, "learning_rate": 8.26947325395091e-06, "loss": 2.723, "step": 2637 }, { "epoch": 0.32, "learning_rate": 8.267954020720029e-06, "loss": 2.554, "step": 2638 }, { "epoch": 0.32, "learning_rate": 8.266434260601528e-06, "loss": 2.5653, "step": 2639 }, { "epoch": 0.32, "learning_rate": 8.264913973840439e-06, "loss": 2.7289, "step": 2640 }, { "epoch": 0.32, "learning_rate": 8.26339316068187e-06, "loss": 2.6784, "step": 2641 }, { "epoch": 0.32, "learning_rate": 8.261871821371026e-06, "loss": 2.6692, "step": 2642 }, { "epoch": 0.32, "learning_rate": 8.260349956153185e-06, "loss": 2.5945, "step": 2643 }, { "epoch": 0.32, "learning_rate": 8.258827565273717e-06, "loss": 2.7162, "step": 2644 }, { "epoch": 0.32, "learning_rate": 8.25730464897808e-06, "loss": 2.5601, "step": 2645 }, { "epoch": 0.32, "learning_rate": 8.255781207511804e-06, "loss": 2.6387, "step": 2646 }, { "epoch": 0.32, "learning_rate": 8.254257241120514e-06, "loss": 2.5941, "step": 2647 }, { "epoch": 0.32, "learning_rate": 8.252732750049918e-06, "loss": 2.6675, "step": 2648 }, { "epoch": 0.32, "learning_rate": 8.251207734545807e-06, "loss": 2.6384, "step": 2649 }, { "epoch": 0.32, "learning_rate": 8.249682194854059e-06, "loss": 2.5124, "step": 2650 }, { "epoch": 0.32, "learning_rate": 8.248156131220631e-06, "loss": 2.6139, "step": 2651 }, { "epoch": 0.32, "learning_rate": 8.24662954389157e-06, "loss": 2.627, "step": 2652 }, { "epoch": 0.32, "learning_rate": 8.245102433113005e-06, "loss": 2.6104, "step": 2653 }, { "epoch": 0.32, "learning_rate": 8.24357479913115e-06, "loss": 2.7312, "step": 2654 }, { "epoch": 0.32, "learning_rate": 8.242046642192304e-06, "loss": 2.553, "step": 2655 }, { "epoch": 0.32, "learning_rate": 8.240517962542849e-06, "loss": 2.5021, "step": 2656 }, { "epoch": 0.32, "learning_rate": 8.238988760429252e-06, "loss": 2.5739, "step": 2657 }, { "epoch": 0.32, "learning_rate": 8.237459036098064e-06, "loss": 2.6064, "step": 2658 }, { "epoch": 0.32, "learning_rate": 8.23592878979592e-06, "loss": 2.7111, "step": 2659 }, { "epoch": 0.32, "learning_rate": 8.234398021769541e-06, "loss": 2.6277, "step": 2660 }, { "epoch": 0.32, "learning_rate": 8.23286673226573e-06, "loss": 2.5882, "step": 2661 }, { "epoch": 0.32, "learning_rate": 8.23133492153137e-06, "loss": 2.7023, "step": 2662 }, { "epoch": 0.32, "learning_rate": 8.229802589813442e-06, "loss": 2.6135, "step": 2663 }, { "epoch": 0.32, "learning_rate": 8.228269737358993e-06, "loss": 2.3393, "step": 2664 }, { "epoch": 0.32, "learning_rate": 8.226736364415167e-06, "loss": 2.5233, "step": 2665 }, { "epoch": 0.32, "learning_rate": 8.225202471229187e-06, "loss": 2.5155, "step": 2666 }, { "epoch": 0.32, "learning_rate": 8.22366805804836e-06, "loss": 2.555, "step": 2667 }, { "epoch": 0.32, "learning_rate": 8.222133125120076e-06, "loss": 2.5612, "step": 2668 }, { "epoch": 0.32, "learning_rate": 8.220597672691812e-06, "loss": 2.6521, "step": 2669 }, { "epoch": 0.32, "learning_rate": 8.219061701011125e-06, "loss": 2.4864, "step": 2670 }, { "epoch": 0.32, "learning_rate": 8.217525210325662e-06, "loss": 2.5519, "step": 2671 }, { "epoch": 0.32, "learning_rate": 8.215988200883145e-06, "loss": 2.4437, "step": 2672 }, { "epoch": 0.32, "learning_rate": 8.214450672931385e-06, "loss": 2.41, "step": 2673 }, { "epoch": 0.32, "learning_rate": 8.212912626718273e-06, "loss": 2.6167, "step": 2674 }, { "epoch": 0.32, "learning_rate": 8.21137406249179e-06, "loss": 2.642, "step": 2675 }, { "epoch": 0.32, "learning_rate": 8.209834980499995e-06, "loss": 2.8119, "step": 2676 }, { "epoch": 0.32, "learning_rate": 8.20829538099103e-06, "loss": 2.6948, "step": 2677 }, { "epoch": 0.32, "learning_rate": 8.206755264213128e-06, "loss": 2.5394, "step": 2678 }, { "epoch": 0.32, "learning_rate": 8.205214630414594e-06, "loss": 2.6643, "step": 2679 }, { "epoch": 0.32, "learning_rate": 8.203673479843824e-06, "loss": 2.3948, "step": 2680 }, { "epoch": 0.32, "learning_rate": 8.202131812749296e-06, "loss": 2.5228, "step": 2681 }, { "epoch": 0.32, "learning_rate": 8.200589629379572e-06, "loss": 2.5046, "step": 2682 }, { "epoch": 0.32, "learning_rate": 8.199046929983294e-06, "loss": 2.6575, "step": 2683 }, { "epoch": 0.32, "learning_rate": 8.19750371480919e-06, "loss": 2.5759, "step": 2684 }, { "epoch": 0.32, "learning_rate": 8.195959984106072e-06, "loss": 2.6241, "step": 2685 }, { "epoch": 0.32, "learning_rate": 8.19441573812283e-06, "loss": 2.5886, "step": 2686 }, { "epoch": 0.32, "learning_rate": 8.192870977108443e-06, "loss": 2.594, "step": 2687 }, { "epoch": 0.32, "learning_rate": 8.191325701311971e-06, "loss": 2.581, "step": 2688 }, { "epoch": 0.32, "learning_rate": 8.189779910982556e-06, "loss": 2.6978, "step": 2689 }, { "epoch": 0.32, "learning_rate": 8.188233606369422e-06, "loss": 2.5803, "step": 2690 }, { "epoch": 0.32, "learning_rate": 8.18668678772188e-06, "loss": 2.642, "step": 2691 }, { "epoch": 0.32, "learning_rate": 8.185139455289322e-06, "loss": 2.6413, "step": 2692 }, { "epoch": 0.32, "learning_rate": 8.183591609321217e-06, "loss": 2.6384, "step": 2693 }, { "epoch": 0.32, "learning_rate": 8.182043250067128e-06, "loss": 2.4781, "step": 2694 }, { "epoch": 0.32, "learning_rate": 8.180494377776694e-06, "loss": 2.6023, "step": 2695 }, { "epoch": 0.32, "learning_rate": 8.178944992699632e-06, "loss": 2.5401, "step": 2696 }, { "epoch": 0.32, "learning_rate": 8.177395095085754e-06, "loss": 2.6168, "step": 2697 }, { "epoch": 0.32, "learning_rate": 8.175844685184942e-06, "loss": 2.4881, "step": 2698 }, { "epoch": 0.32, "learning_rate": 8.174293763247172e-06, "loss": 2.5601, "step": 2699 }, { "epoch": 0.32, "learning_rate": 8.172742329522493e-06, "loss": 2.4295, "step": 2700 }, { "epoch": 0.32, "learning_rate": 8.171190384261043e-06, "loss": 2.5413, "step": 2701 }, { "epoch": 0.32, "learning_rate": 8.169637927713037e-06, "loss": 2.589, "step": 2702 }, { "epoch": 0.32, "learning_rate": 8.16808496012878e-06, "loss": 2.5369, "step": 2703 }, { "epoch": 0.32, "learning_rate": 8.166531481758649e-06, "loss": 2.5705, "step": 2704 }, { "epoch": 0.32, "learning_rate": 8.164977492853113e-06, "loss": 2.527, "step": 2705 }, { "epoch": 0.33, "learning_rate": 8.163422993662718e-06, "loss": 2.6226, "step": 2706 }, { "epoch": 0.33, "learning_rate": 8.161867984438094e-06, "loss": 2.7103, "step": 2707 }, { "epoch": 0.33, "learning_rate": 8.160312465429952e-06, "loss": 2.6387, "step": 2708 }, { "epoch": 0.33, "learning_rate": 8.158756436889088e-06, "loss": 2.4585, "step": 2709 }, { "epoch": 0.33, "learning_rate": 8.157199899066379e-06, "loss": 2.6166, "step": 2710 }, { "epoch": 0.33, "learning_rate": 8.15564285221278e-06, "loss": 2.6646, "step": 2711 }, { "epoch": 0.33, "learning_rate": 8.154085296579335e-06, "loss": 2.5158, "step": 2712 }, { "epoch": 0.33, "learning_rate": 8.152527232417163e-06, "loss": 2.6282, "step": 2713 }, { "epoch": 0.33, "learning_rate": 8.150968659977472e-06, "loss": 2.5294, "step": 2714 }, { "epoch": 0.33, "learning_rate": 8.149409579511545e-06, "loss": 2.5221, "step": 2715 }, { "epoch": 0.33, "learning_rate": 8.147849991270753e-06, "loss": 2.4804, "step": 2716 }, { "epoch": 0.33, "learning_rate": 8.146289895506546e-06, "loss": 2.5638, "step": 2717 }, { "epoch": 0.33, "learning_rate": 8.144729292470454e-06, "loss": 2.5047, "step": 2718 }, { "epoch": 0.33, "learning_rate": 8.143168182414094e-06, "loss": 2.5307, "step": 2719 }, { "epoch": 0.33, "learning_rate": 8.141606565589157e-06, "loss": 2.4673, "step": 2720 }, { "epoch": 0.33, "learning_rate": 8.140044442247425e-06, "loss": 2.7557, "step": 2721 }, { "epoch": 0.33, "learning_rate": 8.138481812640755e-06, "loss": 2.3536, "step": 2722 }, { "epoch": 0.33, "learning_rate": 8.136918677021088e-06, "loss": 2.5491, "step": 2723 }, { "epoch": 0.33, "learning_rate": 8.135355035640445e-06, "loss": 2.4149, "step": 2724 }, { "epoch": 0.33, "learning_rate": 8.13379088875093e-06, "loss": 2.4424, "step": 2725 }, { "epoch": 0.33, "learning_rate": 8.132226236604728e-06, "loss": 2.5938, "step": 2726 }, { "epoch": 0.33, "learning_rate": 8.130661079454108e-06, "loss": 2.5032, "step": 2727 }, { "epoch": 0.33, "learning_rate": 8.129095417551416e-06, "loss": 2.5452, "step": 2728 }, { "epoch": 0.33, "learning_rate": 8.127529251149081e-06, "loss": 2.6004, "step": 2729 }, { "epoch": 0.33, "learning_rate": 8.125962580499616e-06, "loss": 2.3647, "step": 2730 }, { "epoch": 0.33, "learning_rate": 8.124395405855609e-06, "loss": 2.6357, "step": 2731 }, { "epoch": 0.33, "learning_rate": 8.122827727469737e-06, "loss": 2.6049, "step": 2732 }, { "epoch": 0.33, "learning_rate": 8.121259545594756e-06, "loss": 2.545, "step": 2733 }, { "epoch": 0.33, "learning_rate": 8.119690860483497e-06, "loss": 2.4327, "step": 2734 }, { "epoch": 0.33, "learning_rate": 8.11812167238888e-06, "loss": 2.5694, "step": 2735 }, { "epoch": 0.33, "learning_rate": 8.116551981563903e-06, "loss": 2.536, "step": 2736 }, { "epoch": 0.33, "learning_rate": 8.114981788261642e-06, "loss": 2.6239, "step": 2737 }, { "epoch": 0.33, "learning_rate": 8.113411092735262e-06, "loss": 2.4997, "step": 2738 }, { "epoch": 0.33, "learning_rate": 8.111839895238e-06, "loss": 2.4794, "step": 2739 }, { "epoch": 0.33, "learning_rate": 8.110268196023179e-06, "loss": 2.5425, "step": 2740 }, { "epoch": 0.33, "learning_rate": 8.108695995344202e-06, "loss": 2.4319, "step": 2741 }, { "epoch": 0.33, "learning_rate": 8.107123293454555e-06, "loss": 2.4695, "step": 2742 }, { "epoch": 0.33, "learning_rate": 8.1055500906078e-06, "loss": 2.3558, "step": 2743 }, { "epoch": 0.33, "learning_rate": 8.103976387057579e-06, "loss": 2.6216, "step": 2744 }, { "epoch": 0.33, "learning_rate": 8.102402183057624e-06, "loss": 2.7285, "step": 2745 }, { "epoch": 0.33, "learning_rate": 8.100827478861741e-06, "loss": 2.6063, "step": 2746 }, { "epoch": 0.33, "learning_rate": 8.099252274723814e-06, "loss": 2.4137, "step": 2747 }, { "epoch": 0.33, "learning_rate": 8.097676570897814e-06, "loss": 2.496, "step": 2748 }, { "epoch": 0.33, "learning_rate": 8.096100367637787e-06, "loss": 2.5072, "step": 2749 }, { "epoch": 0.33, "learning_rate": 8.094523665197862e-06, "loss": 2.7217, "step": 2750 }, { "epoch": 0.33, "learning_rate": 8.092946463832251e-06, "loss": 2.4987, "step": 2751 }, { "epoch": 0.33, "learning_rate": 8.091368763795244e-06, "loss": 2.4136, "step": 2752 }, { "epoch": 0.33, "learning_rate": 8.089790565341208e-06, "loss": 2.4752, "step": 2753 }, { "epoch": 0.33, "learning_rate": 8.088211868724595e-06, "loss": 2.5046, "step": 2754 }, { "epoch": 0.33, "learning_rate": 8.086632674199939e-06, "loss": 2.6758, "step": 2755 }, { "epoch": 0.33, "learning_rate": 8.085052982021849e-06, "loss": 2.6192, "step": 2756 }, { "epoch": 0.33, "learning_rate": 8.083472792445014e-06, "loss": 2.6245, "step": 2757 }, { "epoch": 0.33, "learning_rate": 8.081892105724212e-06, "loss": 2.6182, "step": 2758 }, { "epoch": 0.33, "learning_rate": 8.080310922114287e-06, "loss": 2.5678, "step": 2759 }, { "epoch": 0.33, "learning_rate": 8.078729241870177e-06, "loss": 2.6756, "step": 2760 }, { "epoch": 0.33, "learning_rate": 8.077147065246895e-06, "loss": 2.4666, "step": 2761 }, { "epoch": 0.33, "learning_rate": 8.075564392499527e-06, "loss": 2.6777, "step": 2762 }, { "epoch": 0.33, "learning_rate": 8.07398122388325e-06, "loss": 2.6701, "step": 2763 }, { "epoch": 0.33, "learning_rate": 8.072397559653314e-06, "loss": 2.6755, "step": 2764 }, { "epoch": 0.33, "learning_rate": 8.070813400065051e-06, "loss": 2.6468, "step": 2765 }, { "epoch": 0.33, "learning_rate": 8.069228745373875e-06, "loss": 2.6097, "step": 2766 }, { "epoch": 0.33, "learning_rate": 8.067643595835274e-06, "loss": 2.5563, "step": 2767 }, { "epoch": 0.33, "learning_rate": 8.066057951704821e-06, "loss": 2.6363, "step": 2768 }, { "epoch": 0.33, "learning_rate": 8.06447181323817e-06, "loss": 2.5664, "step": 2769 }, { "epoch": 0.33, "learning_rate": 8.062885180691046e-06, "loss": 2.5854, "step": 2770 }, { "epoch": 0.33, "learning_rate": 8.061298054319267e-06, "loss": 2.7208, "step": 2771 }, { "epoch": 0.33, "learning_rate": 8.059710434378717e-06, "loss": 2.6048, "step": 2772 }, { "epoch": 0.33, "learning_rate": 8.058122321125368e-06, "loss": 2.6209, "step": 2773 }, { "epoch": 0.33, "learning_rate": 8.056533714815268e-06, "loss": 2.6068, "step": 2774 }, { "epoch": 0.33, "learning_rate": 8.054944615704548e-06, "loss": 2.563, "step": 2775 }, { "epoch": 0.33, "learning_rate": 8.053355024049415e-06, "loss": 2.6052, "step": 2776 }, { "epoch": 0.33, "learning_rate": 8.051764940106157e-06, "loss": 2.5926, "step": 2777 }, { "epoch": 0.33, "learning_rate": 8.05017436413114e-06, "loss": 2.4734, "step": 2778 }, { "epoch": 0.33, "learning_rate": 8.04858329638081e-06, "loss": 2.4617, "step": 2779 }, { "epoch": 0.33, "learning_rate": 8.046991737111696e-06, "loss": 2.4535, "step": 2780 }, { "epoch": 0.33, "learning_rate": 8.045399686580399e-06, "loss": 2.7043, "step": 2781 }, { "epoch": 0.33, "learning_rate": 8.043807145043604e-06, "loss": 2.691, "step": 2782 }, { "epoch": 0.33, "learning_rate": 8.042214112758075e-06, "loss": 2.5659, "step": 2783 }, { "epoch": 0.33, "learning_rate": 8.040620589980654e-06, "loss": 2.6798, "step": 2784 }, { "epoch": 0.33, "learning_rate": 8.039026576968262e-06, "loss": 2.5984, "step": 2785 }, { "epoch": 0.33, "learning_rate": 8.037432073977902e-06, "loss": 2.3856, "step": 2786 }, { "epoch": 0.33, "learning_rate": 8.03583708126665e-06, "loss": 2.6073, "step": 2787 }, { "epoch": 0.33, "learning_rate": 8.034241599091666e-06, "loss": 2.572, "step": 2788 }, { "epoch": 0.34, "learning_rate": 8.032645627710188e-06, "loss": 2.6734, "step": 2789 }, { "epoch": 0.34, "learning_rate": 8.03104916737953e-06, "loss": 2.5634, "step": 2790 }, { "epoch": 0.34, "learning_rate": 8.02945221835709e-06, "loss": 2.5344, "step": 2791 }, { "epoch": 0.34, "learning_rate": 8.027854780900339e-06, "loss": 2.5693, "step": 2792 }, { "epoch": 0.34, "learning_rate": 8.02625685526683e-06, "loss": 2.5066, "step": 2793 }, { "epoch": 0.34, "learning_rate": 8.024658441714197e-06, "loss": 2.4872, "step": 2794 }, { "epoch": 0.34, "learning_rate": 8.023059540500149e-06, "loss": 2.7201, "step": 2795 }, { "epoch": 0.34, "learning_rate": 8.021460151882472e-06, "loss": 2.4534, "step": 2796 }, { "epoch": 0.34, "learning_rate": 8.019860276119036e-06, "loss": 2.5352, "step": 2797 }, { "epoch": 0.34, "learning_rate": 8.018259913467785e-06, "loss": 2.4837, "step": 2798 }, { "epoch": 0.34, "learning_rate": 8.016659064186742e-06, "loss": 2.715, "step": 2799 }, { "epoch": 0.34, "learning_rate": 8.015057728534015e-06, "loss": 2.5463, "step": 2800 }, { "epoch": 0.34, "learning_rate": 8.01345590676778e-06, "loss": 2.5789, "step": 2801 }, { "epoch": 0.34, "learning_rate": 8.011853599146297e-06, "loss": 2.6799, "step": 2802 }, { "epoch": 0.34, "learning_rate": 8.010250805927907e-06, "loss": 2.651, "step": 2803 }, { "epoch": 0.34, "learning_rate": 8.008647527371022e-06, "loss": 2.4357, "step": 2804 }, { "epoch": 0.34, "learning_rate": 8.007043763734139e-06, "loss": 2.6758, "step": 2805 }, { "epoch": 0.34, "learning_rate": 8.00543951527583e-06, "loss": 2.6267, "step": 2806 }, { "epoch": 0.34, "learning_rate": 8.003834782254747e-06, "loss": 2.5666, "step": 2807 }, { "epoch": 0.34, "learning_rate": 8.002229564929616e-06, "loss": 2.2994, "step": 2808 }, { "epoch": 0.34, "learning_rate": 8.000623863559245e-06, "loss": 2.4898, "step": 2809 }, { "epoch": 0.34, "learning_rate": 7.999017678402518e-06, "loss": 2.8418, "step": 2810 }, { "epoch": 0.34, "learning_rate": 7.997411009718401e-06, "loss": 2.5341, "step": 2811 }, { "epoch": 0.34, "learning_rate": 7.995803857765934e-06, "loss": 2.4653, "step": 2812 }, { "epoch": 0.34, "learning_rate": 7.994196222804234e-06, "loss": 2.8119, "step": 2813 }, { "epoch": 0.34, "learning_rate": 7.992588105092498e-06, "loss": 2.5161, "step": 2814 }, { "epoch": 0.34, "learning_rate": 7.990979504890003e-06, "loss": 2.5044, "step": 2815 }, { "epoch": 0.34, "learning_rate": 7.989370422456098e-06, "loss": 2.7166, "step": 2816 }, { "epoch": 0.34, "learning_rate": 7.987760858050216e-06, "loss": 2.5338, "step": 2817 }, { "epoch": 0.34, "learning_rate": 7.986150811931864e-06, "loss": 2.5608, "step": 2818 }, { "epoch": 0.34, "learning_rate": 7.984540284360626e-06, "loss": 2.5387, "step": 2819 }, { "epoch": 0.34, "learning_rate": 7.982929275596164e-06, "loss": 2.5447, "step": 2820 }, { "epoch": 0.34, "learning_rate": 7.981317785898225e-06, "loss": 2.5504, "step": 2821 }, { "epoch": 0.34, "learning_rate": 7.979705815526621e-06, "loss": 2.6578, "step": 2822 }, { "epoch": 0.34, "learning_rate": 7.97809336474125e-06, "loss": 2.5047, "step": 2823 }, { "epoch": 0.34, "learning_rate": 7.976480433802085e-06, "loss": 2.5139, "step": 2824 }, { "epoch": 0.34, "learning_rate": 7.974867022969176e-06, "loss": 2.6403, "step": 2825 }, { "epoch": 0.34, "learning_rate": 7.973253132502652e-06, "loss": 2.676, "step": 2826 }, { "epoch": 0.34, "learning_rate": 7.971638762662717e-06, "loss": 2.5525, "step": 2827 }, { "epoch": 0.34, "learning_rate": 7.970023913709652e-06, "loss": 2.6945, "step": 2828 }, { "epoch": 0.34, "learning_rate": 7.968408585903823e-06, "loss": 2.5899, "step": 2829 }, { "epoch": 0.34, "learning_rate": 7.96679277950566e-06, "loss": 2.5245, "step": 2830 }, { "epoch": 0.34, "learning_rate": 7.965176494775684e-06, "loss": 2.556, "step": 2831 }, { "epoch": 0.34, "learning_rate": 7.96355973197448e-06, "loss": 2.5199, "step": 2832 }, { "epoch": 0.34, "learning_rate": 7.961942491362719e-06, "loss": 2.543, "step": 2833 }, { "epoch": 0.34, "learning_rate": 7.960324773201147e-06, "loss": 2.5165, "step": 2834 }, { "epoch": 0.34, "learning_rate": 7.958706577750586e-06, "loss": 2.6465, "step": 2835 }, { "epoch": 0.34, "learning_rate": 7.957087905271934e-06, "loss": 2.5395, "step": 2836 }, { "epoch": 0.34, "learning_rate": 7.955468756026168e-06, "loss": 2.5309, "step": 2837 }, { "epoch": 0.34, "learning_rate": 7.953849130274344e-06, "loss": 2.5853, "step": 2838 }, { "epoch": 0.34, "learning_rate": 7.952229028277588e-06, "loss": 2.5978, "step": 2839 }, { "epoch": 0.34, "learning_rate": 7.95060845029711e-06, "loss": 2.4975, "step": 2840 }, { "epoch": 0.34, "learning_rate": 7.94898739659419e-06, "loss": 2.5247, "step": 2841 }, { "epoch": 0.34, "learning_rate": 7.94736586743019e-06, "loss": 2.527, "step": 2842 }, { "epoch": 0.34, "learning_rate": 7.94574386306655e-06, "loss": 2.5681, "step": 2843 }, { "epoch": 0.34, "learning_rate": 7.944121383764775e-06, "loss": 2.4952, "step": 2844 }, { "epoch": 0.34, "learning_rate": 7.942498429786466e-06, "loss": 2.456, "step": 2845 }, { "epoch": 0.34, "learning_rate": 7.94087500139328e-06, "loss": 2.7886, "step": 2846 }, { "epoch": 0.34, "learning_rate": 7.939251098846968e-06, "loss": 2.5056, "step": 2847 }, { "epoch": 0.34, "learning_rate": 7.937626722409342e-06, "loss": 2.3708, "step": 2848 }, { "epoch": 0.34, "learning_rate": 7.936001872342303e-06, "loss": 2.6743, "step": 2849 }, { "epoch": 0.34, "learning_rate": 7.93437654890782e-06, "loss": 2.5541, "step": 2850 }, { "epoch": 0.34, "learning_rate": 7.932750752367947e-06, "loss": 2.4163, "step": 2851 }, { "epoch": 0.34, "learning_rate": 7.931124482984802e-06, "loss": 2.6016, "step": 2852 }, { "epoch": 0.34, "learning_rate": 7.929497741020592e-06, "loss": 2.579, "step": 2853 }, { "epoch": 0.34, "learning_rate": 7.92787052673759e-06, "loss": 2.7825, "step": 2854 }, { "epoch": 0.34, "learning_rate": 7.926242840398152e-06, "loss": 2.5535, "step": 2855 }, { "epoch": 0.34, "learning_rate": 7.924614682264707e-06, "loss": 2.5667, "step": 2856 }, { "epoch": 0.34, "learning_rate": 7.922986052599759e-06, "loss": 2.6106, "step": 2857 }, { "epoch": 0.34, "learning_rate": 7.921356951665894e-06, "loss": 2.6688, "step": 2858 }, { "epoch": 0.34, "learning_rate": 7.919727379725763e-06, "loss": 2.4968, "step": 2859 }, { "epoch": 0.34, "learning_rate": 7.918097337042106e-06, "loss": 2.5996, "step": 2860 }, { "epoch": 0.34, "learning_rate": 7.91646682387773e-06, "loss": 2.5838, "step": 2861 }, { "epoch": 0.34, "learning_rate": 7.914835840495518e-06, "loss": 2.542, "step": 2862 }, { "epoch": 0.34, "learning_rate": 7.913204387158435e-06, "loss": 2.5822, "step": 2863 }, { "epoch": 0.34, "learning_rate": 7.911572464129515e-06, "loss": 2.407, "step": 2864 }, { "epoch": 0.34, "learning_rate": 7.909940071671874e-06, "loss": 2.6295, "step": 2865 }, { "epoch": 0.34, "learning_rate": 7.908307210048695e-06, "loss": 2.461, "step": 2866 }, { "epoch": 0.34, "learning_rate": 7.906673879523249e-06, "loss": 2.4688, "step": 2867 }, { "epoch": 0.34, "learning_rate": 7.905040080358869e-06, "loss": 2.5864, "step": 2868 }, { "epoch": 0.34, "learning_rate": 7.903405812818974e-06, "loss": 2.5513, "step": 2869 }, { "epoch": 0.34, "learning_rate": 7.901771077167051e-06, "loss": 2.5014, "step": 2870 }, { "epoch": 0.34, "learning_rate": 7.900135873666672e-06, "loss": 2.606, "step": 2871 }, { "epoch": 0.35, "learning_rate": 7.898500202581474e-06, "loss": 2.7239, "step": 2872 }, { "epoch": 0.35, "learning_rate": 7.896864064175176e-06, "loss": 2.5848, "step": 2873 }, { "epoch": 0.35, "learning_rate": 7.895227458711567e-06, "loss": 2.6267, "step": 2874 }, { "epoch": 0.35, "learning_rate": 7.89359038645452e-06, "loss": 2.5691, "step": 2875 }, { "epoch": 0.35, "learning_rate": 7.891952847667973e-06, "loss": 2.6508, "step": 2876 }, { "epoch": 0.35, "learning_rate": 7.890314842615948e-06, "loss": 2.4033, "step": 2877 }, { "epoch": 0.35, "learning_rate": 7.888676371562534e-06, "loss": 2.5467, "step": 2878 }, { "epoch": 0.35, "learning_rate": 7.887037434771902e-06, "loss": 2.6814, "step": 2879 }, { "epoch": 0.35, "learning_rate": 7.885398032508296e-06, "loss": 2.6065, "step": 2880 }, { "epoch": 0.35, "learning_rate": 7.883758165036032e-06, "loss": 2.5961, "step": 2881 }, { "epoch": 0.35, "learning_rate": 7.882117832619506e-06, "loss": 2.7195, "step": 2882 }, { "epoch": 0.35, "learning_rate": 7.880477035523187e-06, "loss": 2.6041, "step": 2883 }, { "epoch": 0.35, "learning_rate": 7.878835774011615e-06, "loss": 2.4418, "step": 2884 }, { "epoch": 0.35, "learning_rate": 7.877194048349413e-06, "loss": 2.515, "step": 2885 }, { "epoch": 0.35, "learning_rate": 7.875551858801268e-06, "loss": 2.4094, "step": 2886 }, { "epoch": 0.35, "learning_rate": 7.873909205631951e-06, "loss": 2.5801, "step": 2887 }, { "epoch": 0.35, "learning_rate": 7.872266089106309e-06, "loss": 2.7062, "step": 2888 }, { "epoch": 0.35, "learning_rate": 7.870622509489251e-06, "loss": 2.5632, "step": 2889 }, { "epoch": 0.35, "learning_rate": 7.868978467045777e-06, "loss": 2.5447, "step": 2890 }, { "epoch": 0.35, "learning_rate": 7.867333962040948e-06, "loss": 2.6751, "step": 2891 }, { "epoch": 0.35, "learning_rate": 7.865688994739907e-06, "loss": 2.51, "step": 2892 }, { "epoch": 0.35, "learning_rate": 7.864043565407871e-06, "loss": 2.7387, "step": 2893 }, { "epoch": 0.35, "learning_rate": 7.862397674310127e-06, "loss": 2.7214, "step": 2894 }, { "epoch": 0.35, "learning_rate": 7.860751321712043e-06, "loss": 2.4684, "step": 2895 }, { "epoch": 0.35, "learning_rate": 7.859104507879058e-06, "loss": 2.5351, "step": 2896 }, { "epoch": 0.35, "learning_rate": 7.857457233076684e-06, "loss": 2.6763, "step": 2897 }, { "epoch": 0.35, "learning_rate": 7.85580949757051e-06, "loss": 2.6832, "step": 2898 }, { "epoch": 0.35, "learning_rate": 7.854161301626196e-06, "loss": 2.5517, "step": 2899 }, { "epoch": 0.35, "learning_rate": 7.85251264550948e-06, "loss": 2.4681, "step": 2900 }, { "epoch": 0.35, "learning_rate": 7.850863529486172e-06, "loss": 2.5925, "step": 2901 }, { "epoch": 0.35, "learning_rate": 7.849213953822158e-06, "loss": 2.6068, "step": 2902 }, { "epoch": 0.35, "learning_rate": 7.847563918783393e-06, "loss": 2.5288, "step": 2903 }, { "epoch": 0.35, "learning_rate": 7.845913424635915e-06, "loss": 2.521, "step": 2904 }, { "epoch": 0.35, "learning_rate": 7.844262471645827e-06, "loss": 2.4423, "step": 2905 }, { "epoch": 0.35, "learning_rate": 7.842611060079312e-06, "loss": 2.3436, "step": 2906 }, { "epoch": 0.35, "learning_rate": 7.840959190202623e-06, "loss": 2.6797, "step": 2907 }, { "epoch": 0.35, "learning_rate": 7.83930686228209e-06, "loss": 2.7181, "step": 2908 }, { "epoch": 0.35, "learning_rate": 7.837654076584115e-06, "loss": 2.5138, "step": 2909 }, { "epoch": 0.35, "learning_rate": 7.836000833375174e-06, "loss": 2.6641, "step": 2910 }, { "epoch": 0.35, "learning_rate": 7.834347132921817e-06, "loss": 2.5491, "step": 2911 }, { "epoch": 0.35, "learning_rate": 7.832692975490668e-06, "loss": 2.4358, "step": 2912 }, { "epoch": 0.35, "learning_rate": 7.831038361348425e-06, "loss": 2.6112, "step": 2913 }, { "epoch": 0.35, "learning_rate": 7.829383290761859e-06, "loss": 2.7002, "step": 2914 }, { "epoch": 0.35, "learning_rate": 7.827727763997815e-06, "loss": 2.4583, "step": 2915 }, { "epoch": 0.35, "learning_rate": 7.826071781323208e-06, "loss": 2.5323, "step": 2916 }, { "epoch": 0.35, "learning_rate": 7.824415343005035e-06, "loss": 2.4228, "step": 2917 }, { "epoch": 0.35, "learning_rate": 7.822758449310357e-06, "loss": 2.4258, "step": 2918 }, { "epoch": 0.35, "learning_rate": 7.821101100506317e-06, "loss": 2.6686, "step": 2919 }, { "epoch": 0.35, "learning_rate": 7.819443296860121e-06, "loss": 2.6419, "step": 2920 }, { "epoch": 0.35, "learning_rate": 7.817785038639058e-06, "loss": 2.7657, "step": 2921 }, { "epoch": 0.35, "learning_rate": 7.816126326110487e-06, "loss": 2.5512, "step": 2922 }, { "epoch": 0.35, "learning_rate": 7.814467159541841e-06, "loss": 2.651, "step": 2923 }, { "epoch": 0.35, "learning_rate": 7.812807539200622e-06, "loss": 2.4833, "step": 2924 }, { "epoch": 0.35, "learning_rate": 7.811147465354408e-06, "loss": 2.5305, "step": 2925 }, { "epoch": 0.35, "learning_rate": 7.809486938270853e-06, "loss": 2.7539, "step": 2926 }, { "epoch": 0.35, "learning_rate": 7.80782595821768e-06, "loss": 2.445, "step": 2927 }, { "epoch": 0.35, "learning_rate": 7.806164525462687e-06, "loss": 2.501, "step": 2928 }, { "epoch": 0.35, "learning_rate": 7.804502640273743e-06, "loss": 2.7106, "step": 2929 }, { "epoch": 0.35, "learning_rate": 7.802840302918794e-06, "loss": 2.7369, "step": 2930 }, { "epoch": 0.35, "learning_rate": 7.801177513665856e-06, "loss": 2.5599, "step": 2931 }, { "epoch": 0.35, "learning_rate": 7.799514272783014e-06, "loss": 2.3928, "step": 2932 }, { "epoch": 0.35, "learning_rate": 7.797850580538435e-06, "loss": 2.4631, "step": 2933 }, { "epoch": 0.35, "learning_rate": 7.796186437200352e-06, "loss": 2.6008, "step": 2934 }, { "epoch": 0.35, "learning_rate": 7.79452184303707e-06, "loss": 2.3959, "step": 2935 }, { "epoch": 0.35, "learning_rate": 7.792856798316975e-06, "loss": 2.7049, "step": 2936 }, { "epoch": 0.35, "learning_rate": 7.791191303308513e-06, "loss": 2.6206, "step": 2937 }, { "epoch": 0.35, "learning_rate": 7.789525358280216e-06, "loss": 2.6765, "step": 2938 }, { "epoch": 0.35, "learning_rate": 7.787858963500676e-06, "loss": 2.4868, "step": 2939 }, { "epoch": 0.35, "learning_rate": 7.786192119238568e-06, "loss": 2.5133, "step": 2940 }, { "epoch": 0.35, "learning_rate": 7.784524825762632e-06, "loss": 2.6607, "step": 2941 }, { "epoch": 0.35, "learning_rate": 7.782857083341685e-06, "loss": 2.6656, "step": 2942 }, { "epoch": 0.35, "learning_rate": 7.781188892244613e-06, "loss": 2.447, "step": 2943 }, { "epoch": 0.35, "learning_rate": 7.779520252740378e-06, "loss": 2.3656, "step": 2944 }, { "epoch": 0.35, "learning_rate": 7.777851165098012e-06, "loss": 2.3781, "step": 2945 }, { "epoch": 0.35, "learning_rate": 7.776181629586618e-06, "loss": 2.5658, "step": 2946 }, { "epoch": 0.35, "learning_rate": 7.774511646475376e-06, "loss": 2.6343, "step": 2947 }, { "epoch": 0.35, "learning_rate": 7.772841216033534e-06, "loss": 2.5894, "step": 2948 }, { "epoch": 0.35, "learning_rate": 7.771170338530411e-06, "loss": 2.6371, "step": 2949 }, { "epoch": 0.35, "learning_rate": 7.769499014235401e-06, "loss": 2.5845, "step": 2950 }, { "epoch": 0.35, "learning_rate": 7.767827243417971e-06, "loss": 2.6005, "step": 2951 }, { "epoch": 0.35, "learning_rate": 7.766155026347657e-06, "loss": 2.5869, "step": 2952 }, { "epoch": 0.35, "learning_rate": 7.764482363294068e-06, "loss": 2.5016, "step": 2953 }, { "epoch": 0.35, "learning_rate": 7.762809254526884e-06, "loss": 2.5446, "step": 2954 }, { "epoch": 0.35, "learning_rate": 7.761135700315863e-06, "loss": 2.6095, "step": 2955 }, { "epoch": 0.36, "learning_rate": 7.759461700930824e-06, "loss": 2.6276, "step": 2956 }, { "epoch": 0.36, "learning_rate": 7.757787256641666e-06, "loss": 2.5471, "step": 2957 }, { "epoch": 0.36, "learning_rate": 7.756112367718356e-06, "loss": 2.482, "step": 2958 }, { "epoch": 0.36, "learning_rate": 7.754437034430935e-06, "loss": 2.4878, "step": 2959 }, { "epoch": 0.36, "learning_rate": 7.752761257049517e-06, "loss": 2.3928, "step": 2960 }, { "epoch": 0.36, "learning_rate": 7.751085035844281e-06, "loss": 2.5217, "step": 2961 }, { "epoch": 0.36, "learning_rate": 7.749408371085484e-06, "loss": 2.61, "step": 2962 }, { "epoch": 0.36, "learning_rate": 7.747731263043453e-06, "loss": 2.5169, "step": 2963 }, { "epoch": 0.36, "learning_rate": 7.746053711988584e-06, "loss": 2.6868, "step": 2964 }, { "epoch": 0.36, "learning_rate": 7.744375718191347e-06, "loss": 2.4561, "step": 2965 }, { "epoch": 0.36, "learning_rate": 7.74269728192228e-06, "loss": 2.5379, "step": 2966 }, { "epoch": 0.36, "learning_rate": 7.741018403452e-06, "loss": 2.6429, "step": 2967 }, { "epoch": 0.36, "learning_rate": 7.739339083051186e-06, "loss": 2.5006, "step": 2968 }, { "epoch": 0.36, "learning_rate": 7.737659320990598e-06, "loss": 2.5228, "step": 2969 }, { "epoch": 0.36, "learning_rate": 7.735979117541054e-06, "loss": 2.4733, "step": 2970 }, { "epoch": 0.36, "learning_rate": 7.734298472973454e-06, "loss": 2.727, "step": 2971 }, { "epoch": 0.36, "learning_rate": 7.732617387558769e-06, "loss": 2.5065, "step": 2972 }, { "epoch": 0.36, "learning_rate": 7.730935861568034e-06, "loss": 2.3727, "step": 2973 }, { "epoch": 0.36, "learning_rate": 7.729253895272362e-06, "loss": 2.5114, "step": 2974 }, { "epoch": 0.36, "learning_rate": 7.727571488942931e-06, "loss": 2.5958, "step": 2975 }, { "epoch": 0.36, "learning_rate": 7.725888642850995e-06, "loss": 2.6005, "step": 2976 }, { "epoch": 0.36, "learning_rate": 7.724205357267877e-06, "loss": 2.4978, "step": 2977 }, { "epoch": 0.36, "learning_rate": 7.722521632464972e-06, "loss": 2.5824, "step": 2978 }, { "epoch": 0.36, "learning_rate": 7.72083746871374e-06, "loss": 2.4628, "step": 2979 }, { "epoch": 0.36, "learning_rate": 7.719152866285722e-06, "loss": 2.5842, "step": 2980 }, { "epoch": 0.36, "learning_rate": 7.717467825452518e-06, "loss": 2.5439, "step": 2981 }, { "epoch": 0.36, "learning_rate": 7.715782346485809e-06, "loss": 2.5301, "step": 2982 }, { "epoch": 0.36, "learning_rate": 7.714096429657344e-06, "loss": 2.5519, "step": 2983 }, { "epoch": 0.36, "learning_rate": 7.712410075238936e-06, "loss": 2.6597, "step": 2984 }, { "epoch": 0.36, "learning_rate": 7.710723283502476e-06, "loss": 2.5035, "step": 2985 }, { "epoch": 0.36, "learning_rate": 7.709036054719926e-06, "loss": 2.4965, "step": 2986 }, { "epoch": 0.36, "learning_rate": 7.707348389163309e-06, "loss": 2.5823, "step": 2987 }, { "epoch": 0.36, "learning_rate": 7.70566028710473e-06, "loss": 2.4176, "step": 2988 }, { "epoch": 0.36, "learning_rate": 7.703971748816358e-06, "loss": 2.558, "step": 2989 }, { "epoch": 0.36, "learning_rate": 7.702282774570434e-06, "loss": 2.5089, "step": 2990 }, { "epoch": 0.36, "learning_rate": 7.700593364639269e-06, "loss": 2.5334, "step": 2991 }, { "epoch": 0.36, "learning_rate": 7.698903519295242e-06, "loss": 2.3934, "step": 2992 }, { "epoch": 0.36, "learning_rate": 7.697213238810806e-06, "loss": 2.7482, "step": 2993 }, { "epoch": 0.36, "learning_rate": 7.695522523458484e-06, "loss": 2.7303, "step": 2994 }, { "epoch": 0.36, "learning_rate": 7.693831373510864e-06, "loss": 2.5855, "step": 2995 }, { "epoch": 0.36, "learning_rate": 7.692139789240611e-06, "loss": 2.4197, "step": 2996 }, { "epoch": 0.36, "learning_rate": 7.690447770920456e-06, "loss": 2.627, "step": 2997 }, { "epoch": 0.36, "learning_rate": 7.6887553188232e-06, "loss": 2.6645, "step": 2998 }, { "epoch": 0.36, "learning_rate": 7.687062433221715e-06, "loss": 2.6122, "step": 2999 }, { "epoch": 0.36, "learning_rate": 7.685369114388943e-06, "loss": 2.5169, "step": 3000 }, { "epoch": 0.36, "learning_rate": 7.683675362597893e-06, "loss": 2.5068, "step": 3001 }, { "epoch": 0.36, "learning_rate": 7.681981178121652e-06, "loss": 2.5219, "step": 3002 }, { "epoch": 0.36, "learning_rate": 7.680286561233365e-06, "loss": 2.6009, "step": 3003 }, { "epoch": 0.36, "learning_rate": 7.678591512206254e-06, "loss": 2.5132, "step": 3004 }, { "epoch": 0.36, "learning_rate": 7.676896031313612e-06, "loss": 2.5926, "step": 3005 }, { "epoch": 0.36, "learning_rate": 7.675200118828796e-06, "loss": 2.5614, "step": 3006 }, { "epoch": 0.36, "learning_rate": 7.673503775025237e-06, "loss": 2.6382, "step": 3007 }, { "epoch": 0.36, "learning_rate": 7.671807000176434e-06, "loss": 2.5241, "step": 3008 }, { "epoch": 0.36, "learning_rate": 7.670109794555955e-06, "loss": 2.4602, "step": 3009 }, { "epoch": 0.36, "learning_rate": 7.668412158437442e-06, "loss": 2.5793, "step": 3010 }, { "epoch": 0.36, "learning_rate": 7.666714092094596e-06, "loss": 2.5783, "step": 3011 }, { "epoch": 0.36, "learning_rate": 7.665015595801198e-06, "loss": 2.4706, "step": 3012 }, { "epoch": 0.36, "learning_rate": 7.663316669831092e-06, "loss": 2.601, "step": 3013 }, { "epoch": 0.36, "learning_rate": 7.661617314458194e-06, "loss": 2.6002, "step": 3014 }, { "epoch": 0.36, "learning_rate": 7.659917529956491e-06, "loss": 2.3782, "step": 3015 }, { "epoch": 0.36, "learning_rate": 7.658217316600033e-06, "loss": 2.7325, "step": 3016 }, { "epoch": 0.36, "learning_rate": 7.656516674662948e-06, "loss": 2.7176, "step": 3017 }, { "epoch": 0.36, "learning_rate": 7.654815604419424e-06, "loss": 2.598, "step": 3018 }, { "epoch": 0.36, "learning_rate": 7.653114106143723e-06, "loss": 2.5905, "step": 3019 }, { "epoch": 0.36, "learning_rate": 7.651412180110176e-06, "loss": 2.5564, "step": 3020 }, { "epoch": 0.36, "learning_rate": 7.649709826593182e-06, "loss": 2.5066, "step": 3021 }, { "epoch": 0.36, "learning_rate": 7.648007045867208e-06, "loss": 2.6303, "step": 3022 }, { "epoch": 0.36, "learning_rate": 7.646303838206791e-06, "loss": 2.512, "step": 3023 }, { "epoch": 0.36, "learning_rate": 7.644600203886537e-06, "loss": 2.6508, "step": 3024 }, { "epoch": 0.36, "learning_rate": 7.642896143181123e-06, "loss": 2.5663, "step": 3025 }, { "epoch": 0.36, "learning_rate": 7.641191656365288e-06, "loss": 2.4999, "step": 3026 }, { "epoch": 0.36, "learning_rate": 7.639486743713849e-06, "loss": 2.73, "step": 3027 }, { "epoch": 0.36, "learning_rate": 7.637781405501682e-06, "loss": 2.4688, "step": 3028 }, { "epoch": 0.36, "learning_rate": 7.636075642003738e-06, "loss": 2.4947, "step": 3029 }, { "epoch": 0.36, "learning_rate": 7.634369453495036e-06, "loss": 2.6289, "step": 3030 }, { "epoch": 0.36, "learning_rate": 7.632662840250661e-06, "loss": 2.4107, "step": 3031 }, { "epoch": 0.36, "learning_rate": 7.630955802545768e-06, "loss": 2.6414, "step": 3032 }, { "epoch": 0.36, "learning_rate": 7.629248340655582e-06, "loss": 2.6906, "step": 3033 }, { "epoch": 0.36, "learning_rate": 7.627540454855391e-06, "loss": 2.575, "step": 3034 }, { "epoch": 0.36, "learning_rate": 7.6258321454205586e-06, "loss": 2.5484, "step": 3035 }, { "epoch": 0.36, "learning_rate": 7.6241234126265115e-06, "loss": 2.6002, "step": 3036 }, { "epoch": 0.36, "learning_rate": 7.622414256748747e-06, "loss": 2.5317, "step": 3037 }, { "epoch": 0.36, "learning_rate": 7.6207046780628295e-06, "loss": 2.6132, "step": 3038 }, { "epoch": 0.37, "learning_rate": 7.618994676844391e-06, "loss": 2.6884, "step": 3039 }, { "epoch": 0.37, "learning_rate": 7.617284253369135e-06, "loss": 2.5946, "step": 3040 }, { "epoch": 0.37, "learning_rate": 7.615573407912827e-06, "loss": 2.5349, "step": 3041 }, { "epoch": 0.37, "learning_rate": 7.6138621407513084e-06, "loss": 2.5247, "step": 3042 }, { "epoch": 0.37, "learning_rate": 7.6121504521604805e-06, "loss": 2.5267, "step": 3043 }, { "epoch": 0.37, "learning_rate": 7.61043834241632e-06, "loss": 2.4852, "step": 3044 }, { "epoch": 0.37, "learning_rate": 7.608725811794866e-06, "loss": 2.4774, "step": 3045 }, { "epoch": 0.37, "learning_rate": 7.607012860572227e-06, "loss": 2.656, "step": 3046 }, { "epoch": 0.37, "learning_rate": 7.60529948902458e-06, "loss": 2.5886, "step": 3047 }, { "epoch": 0.37, "learning_rate": 7.603585697428169e-06, "loss": 2.6306, "step": 3048 }, { "epoch": 0.37, "learning_rate": 7.601871486059309e-06, "loss": 2.6293, "step": 3049 }, { "epoch": 0.37, "learning_rate": 7.600156855194376e-06, "loss": 2.5962, "step": 3050 }, { "epoch": 0.37, "learning_rate": 7.598441805109822e-06, "loss": 2.478, "step": 3051 }, { "epoch": 0.37, "learning_rate": 7.596726336082158e-06, "loss": 2.5075, "step": 3052 }, { "epoch": 0.37, "learning_rate": 7.595010448387967e-06, "loss": 2.7038, "step": 3053 }, { "epoch": 0.37, "learning_rate": 7.593294142303902e-06, "loss": 2.3905, "step": 3054 }, { "epoch": 0.37, "learning_rate": 7.591577418106678e-06, "loss": 2.4451, "step": 3055 }, { "epoch": 0.37, "learning_rate": 7.589860276073082e-06, "loss": 2.6799, "step": 3056 }, { "epoch": 0.37, "learning_rate": 7.588142716479965e-06, "loss": 2.3405, "step": 3057 }, { "epoch": 0.37, "learning_rate": 7.586424739604248e-06, "loss": 2.7073, "step": 3058 }, { "epoch": 0.37, "learning_rate": 7.584706345722914e-06, "loss": 2.5276, "step": 3059 }, { "epoch": 0.37, "learning_rate": 7.5829875351130224e-06, "loss": 2.3663, "step": 3060 }, { "epoch": 0.37, "learning_rate": 7.581268308051692e-06, "loss": 2.5418, "step": 3061 }, { "epoch": 0.37, "learning_rate": 7.579548664816112e-06, "loss": 2.3754, "step": 3062 }, { "epoch": 0.37, "learning_rate": 7.5778286056835395e-06, "loss": 2.586, "step": 3063 }, { "epoch": 0.37, "learning_rate": 7.576108130931292e-06, "loss": 2.5898, "step": 3064 }, { "epoch": 0.37, "learning_rate": 7.5743872408367645e-06, "loss": 2.5478, "step": 3065 }, { "epoch": 0.37, "learning_rate": 7.572665935677412e-06, "loss": 2.472, "step": 3066 }, { "epoch": 0.37, "learning_rate": 7.57094421573076e-06, "loss": 2.6841, "step": 3067 }, { "epoch": 0.37, "learning_rate": 7.569222081274396e-06, "loss": 2.416, "step": 3068 }, { "epoch": 0.37, "learning_rate": 7.567499532585978e-06, "loss": 2.7056, "step": 3069 }, { "epoch": 0.37, "learning_rate": 7.565776569943231e-06, "loss": 2.6592, "step": 3070 }, { "epoch": 0.37, "learning_rate": 7.564053193623944e-06, "loss": 2.2394, "step": 3071 }, { "epoch": 0.37, "learning_rate": 7.562329403905976e-06, "loss": 2.6694, "step": 3072 }, { "epoch": 0.37, "learning_rate": 7.5606052010672525e-06, "loss": 2.5527, "step": 3073 }, { "epoch": 0.37, "learning_rate": 7.558880585385762e-06, "loss": 2.6286, "step": 3074 }, { "epoch": 0.37, "learning_rate": 7.557155557139563e-06, "loss": 2.6077, "step": 3075 }, { "epoch": 0.37, "learning_rate": 7.555430116606778e-06, "loss": 2.6389, "step": 3076 }, { "epoch": 0.37, "learning_rate": 7.553704264065598e-06, "loss": 2.5701, "step": 3077 }, { "epoch": 0.37, "learning_rate": 7.5519779997942825e-06, "loss": 2.5976, "step": 3078 }, { "epoch": 0.37, "learning_rate": 7.550251324071152e-06, "loss": 2.5225, "step": 3079 }, { "epoch": 0.37, "learning_rate": 7.548524237174595e-06, "loss": 2.7193, "step": 3080 }, { "epoch": 0.37, "learning_rate": 7.5467967393830686e-06, "loss": 2.5269, "step": 3081 }, { "epoch": 0.37, "learning_rate": 7.545068830975096e-06, "loss": 2.7224, "step": 3082 }, { "epoch": 0.37, "learning_rate": 7.543340512229263e-06, "loss": 2.4984, "step": 3083 }, { "epoch": 0.37, "learning_rate": 7.5416117834242254e-06, "loss": 2.575, "step": 3084 }, { "epoch": 0.37, "learning_rate": 7.5398826448387055e-06, "loss": 2.6468, "step": 3085 }, { "epoch": 0.37, "learning_rate": 7.538153096751486e-06, "loss": 2.5131, "step": 3086 }, { "epoch": 0.37, "learning_rate": 7.536423139441421e-06, "loss": 2.5475, "step": 3087 }, { "epoch": 0.37, "learning_rate": 7.534692773187431e-06, "loss": 2.4431, "step": 3088 }, { "epoch": 0.37, "learning_rate": 7.532961998268498e-06, "loss": 2.7499, "step": 3089 }, { "epoch": 0.37, "learning_rate": 7.531230814963675e-06, "loss": 2.5988, "step": 3090 }, { "epoch": 0.37, "learning_rate": 7.529499223552075e-06, "loss": 2.4, "step": 3091 }, { "epoch": 0.37, "learning_rate": 7.527767224312883e-06, "loss": 2.6532, "step": 3092 }, { "epoch": 0.37, "learning_rate": 7.526034817525345e-06, "loss": 2.6422, "step": 3093 }, { "epoch": 0.37, "learning_rate": 7.524302003468774e-06, "loss": 2.6479, "step": 3094 }, { "epoch": 0.37, "learning_rate": 7.522568782422553e-06, "loss": 2.4361, "step": 3095 }, { "epoch": 0.37, "learning_rate": 7.520835154666121e-06, "loss": 2.6634, "step": 3096 }, { "epoch": 0.37, "learning_rate": 7.519101120478993e-06, "loss": 2.5177, "step": 3097 }, { "epoch": 0.37, "learning_rate": 7.517366680140743e-06, "loss": 2.6319, "step": 3098 }, { "epoch": 0.37, "learning_rate": 7.515631833931012e-06, "loss": 2.6566, "step": 3099 }, { "epoch": 0.37, "learning_rate": 7.513896582129507e-06, "loss": 2.7131, "step": 3100 }, { "epoch": 0.37, "learning_rate": 7.5121609250160024e-06, "loss": 2.5292, "step": 3101 }, { "epoch": 0.37, "learning_rate": 7.510424862870334e-06, "loss": 2.6434, "step": 3102 }, { "epoch": 0.37, "learning_rate": 7.508688395972403e-06, "loss": 2.5826, "step": 3103 }, { "epoch": 0.37, "learning_rate": 7.50695152460218e-06, "loss": 2.6154, "step": 3104 }, { "epoch": 0.37, "learning_rate": 7.505214249039696e-06, "loss": 2.4873, "step": 3105 }, { "epoch": 0.37, "learning_rate": 7.503476569565052e-06, "loss": 2.5442, "step": 3106 }, { "epoch": 0.37, "learning_rate": 7.501738486458411e-06, "loss": 2.5804, "step": 3107 }, { "epoch": 0.37, "learning_rate": 7.500000000000001e-06, "loss": 2.6347, "step": 3108 }, { "epoch": 0.37, "learning_rate": 7.498261110470116e-06, "loss": 2.6056, "step": 3109 }, { "epoch": 0.37, "learning_rate": 7.496521818149114e-06, "loss": 2.4335, "step": 3110 }, { "epoch": 0.37, "learning_rate": 7.49478212331742e-06, "loss": 2.4643, "step": 3111 }, { "epoch": 0.37, "learning_rate": 7.493042026255522e-06, "loss": 2.4925, "step": 3112 }, { "epoch": 0.37, "learning_rate": 7.4913015272439725e-06, "loss": 2.6064, "step": 3113 }, { "epoch": 0.37, "learning_rate": 7.489560626563392e-06, "loss": 2.641, "step": 3114 }, { "epoch": 0.37, "learning_rate": 7.48781932449446e-06, "loss": 2.5651, "step": 3115 }, { "epoch": 0.37, "learning_rate": 7.4860776213179264e-06, "loss": 2.6674, "step": 3116 }, { "epoch": 0.37, "learning_rate": 7.484335517314603e-06, "loss": 2.6051, "step": 3117 }, { "epoch": 0.37, "learning_rate": 7.482593012765368e-06, "loss": 2.6486, "step": 3118 }, { "epoch": 0.37, "learning_rate": 7.480850107951162e-06, "loss": 2.7443, "step": 3119 }, { "epoch": 0.37, "learning_rate": 7.479106803152991e-06, "loss": 2.6005, "step": 3120 }, { "epoch": 0.37, "learning_rate": 7.477363098651925e-06, "loss": 2.5229, "step": 3121 }, { "epoch": 0.38, "learning_rate": 7.4756189947291e-06, "loss": 2.5671, "step": 3122 }, { "epoch": 0.38, "learning_rate": 7.473874491665715e-06, "loss": 2.4166, "step": 3123 }, { "epoch": 0.38, "learning_rate": 7.472129589743034e-06, "loss": 2.5951, "step": 3124 }, { "epoch": 0.38, "learning_rate": 7.470384289242385e-06, "loss": 2.402, "step": 3125 }, { "epoch": 0.38, "learning_rate": 7.468638590445159e-06, "loss": 2.5425, "step": 3126 }, { "epoch": 0.38, "learning_rate": 7.466892493632816e-06, "loss": 2.6248, "step": 3127 }, { "epoch": 0.38, "learning_rate": 7.465145999086874e-06, "loss": 2.6268, "step": 3128 }, { "epoch": 0.38, "learning_rate": 7.463399107088917e-06, "loss": 2.6184, "step": 3129 }, { "epoch": 0.38, "learning_rate": 7.461651817920595e-06, "loss": 2.417, "step": 3130 }, { "epoch": 0.38, "learning_rate": 7.459904131863623e-06, "loss": 2.6385, "step": 3131 }, { "epoch": 0.38, "learning_rate": 7.458156049199775e-06, "loss": 2.5573, "step": 3132 }, { "epoch": 0.38, "learning_rate": 7.456407570210894e-06, "loss": 2.5578, "step": 3133 }, { "epoch": 0.38, "learning_rate": 7.454658695178885e-06, "loss": 2.3566, "step": 3134 }, { "epoch": 0.38, "learning_rate": 7.452909424385712e-06, "loss": 2.6145, "step": 3135 }, { "epoch": 0.38, "learning_rate": 7.451159758113414e-06, "loss": 2.4296, "step": 3136 }, { "epoch": 0.38, "learning_rate": 7.449409696644083e-06, "loss": 2.4347, "step": 3137 }, { "epoch": 0.38, "learning_rate": 7.447659240259881e-06, "loss": 2.4913, "step": 3138 }, { "epoch": 0.38, "learning_rate": 7.4459083892430315e-06, "loss": 2.5592, "step": 3139 }, { "epoch": 0.38, "learning_rate": 7.44415714387582e-06, "loss": 2.5811, "step": 3140 }, { "epoch": 0.38, "learning_rate": 7.442405504440598e-06, "loss": 2.6652, "step": 3141 }, { "epoch": 0.38, "learning_rate": 7.440653471219782e-06, "loss": 2.5482, "step": 3142 }, { "epoch": 0.38, "learning_rate": 7.438901044495846e-06, "loss": 2.6439, "step": 3143 }, { "epoch": 0.38, "learning_rate": 7.4371482245513345e-06, "loss": 2.5798, "step": 3144 }, { "epoch": 0.38, "learning_rate": 7.435395011668853e-06, "loss": 2.4018, "step": 3145 }, { "epoch": 0.38, "learning_rate": 7.433641406131065e-06, "loss": 2.6193, "step": 3146 }, { "epoch": 0.38, "learning_rate": 7.431887408220705e-06, "loss": 2.6327, "step": 3147 }, { "epoch": 0.38, "learning_rate": 7.430133018220567e-06, "loss": 2.5548, "step": 3148 }, { "epoch": 0.38, "learning_rate": 7.428378236413509e-06, "loss": 2.6812, "step": 3149 }, { "epoch": 0.38, "learning_rate": 7.426623063082452e-06, "loss": 2.6538, "step": 3150 }, { "epoch": 0.38, "learning_rate": 7.424867498510381e-06, "loss": 2.6022, "step": 3151 }, { "epoch": 0.38, "learning_rate": 7.4231115429803405e-06, "loss": 2.5677, "step": 3152 }, { "epoch": 0.38, "learning_rate": 7.421355196775444e-06, "loss": 2.663, "step": 3153 }, { "epoch": 0.38, "learning_rate": 7.41959846017886e-06, "loss": 2.6133, "step": 3154 }, { "epoch": 0.38, "learning_rate": 7.417841333473832e-06, "loss": 2.6399, "step": 3155 }, { "epoch": 0.38, "learning_rate": 7.416083816943653e-06, "loss": 2.732, "step": 3156 }, { "epoch": 0.38, "learning_rate": 7.414325910871688e-06, "loss": 2.6252, "step": 3157 }, { "epoch": 0.38, "learning_rate": 7.41256761554136e-06, "loss": 2.5641, "step": 3158 }, { "epoch": 0.38, "learning_rate": 7.410808931236155e-06, "loss": 2.4764, "step": 3159 }, { "epoch": 0.38, "learning_rate": 7.409049858239627e-06, "loss": 2.4578, "step": 3160 }, { "epoch": 0.38, "learning_rate": 7.407290396835387e-06, "loss": 2.4636, "step": 3161 }, { "epoch": 0.38, "learning_rate": 7.405530547307112e-06, "loss": 2.5102, "step": 3162 }, { "epoch": 0.38, "learning_rate": 7.403770309938537e-06, "loss": 2.5542, "step": 3163 }, { "epoch": 0.38, "learning_rate": 7.4020096850134635e-06, "loss": 2.4984, "step": 3164 }, { "epoch": 0.38, "learning_rate": 7.400248672815755e-06, "loss": 2.7014, "step": 3165 }, { "epoch": 0.38, "learning_rate": 7.398487273629339e-06, "loss": 2.5029, "step": 3166 }, { "epoch": 0.38, "learning_rate": 7.396725487738201e-06, "loss": 2.5174, "step": 3167 }, { "epoch": 0.38, "learning_rate": 7.394963315426393e-06, "loss": 2.5466, "step": 3168 }, { "epoch": 0.38, "learning_rate": 7.393200756978025e-06, "loss": 2.5507, "step": 3169 }, { "epoch": 0.38, "learning_rate": 7.391437812677274e-06, "loss": 2.7138, "step": 3170 }, { "epoch": 0.38, "learning_rate": 7.389674482808375e-06, "loss": 2.6353, "step": 3171 }, { "epoch": 0.38, "learning_rate": 7.38791076765563e-06, "loss": 2.4847, "step": 3172 }, { "epoch": 0.38, "learning_rate": 7.3861466675034e-06, "loss": 2.3597, "step": 3173 }, { "epoch": 0.38, "learning_rate": 7.384382182636105e-06, "loss": 2.6277, "step": 3174 }, { "epoch": 0.38, "learning_rate": 7.382617313338234e-06, "loss": 2.6321, "step": 3175 }, { "epoch": 0.38, "learning_rate": 7.380852059894331e-06, "loss": 2.6686, "step": 3176 }, { "epoch": 0.38, "learning_rate": 7.379086422589009e-06, "loss": 2.6114, "step": 3177 }, { "epoch": 0.38, "learning_rate": 7.377320401706937e-06, "loss": 2.6719, "step": 3178 }, { "epoch": 0.38, "learning_rate": 7.375553997532851e-06, "loss": 2.517, "step": 3179 }, { "epoch": 0.38, "learning_rate": 7.37378721035154e-06, "loss": 2.4126, "step": 3180 }, { "epoch": 0.38, "learning_rate": 7.372020040447866e-06, "loss": 2.5419, "step": 3181 }, { "epoch": 0.38, "learning_rate": 7.370252488106744e-06, "loss": 2.5483, "step": 3182 }, { "epoch": 0.38, "learning_rate": 7.368484553613157e-06, "loss": 2.5974, "step": 3183 }, { "epoch": 0.38, "learning_rate": 7.3667162372521436e-06, "loss": 2.6297, "step": 3184 }, { "epoch": 0.38, "learning_rate": 7.36494753930881e-06, "loss": 2.6335, "step": 3185 }, { "epoch": 0.38, "learning_rate": 7.363178460068319e-06, "loss": 2.429, "step": 3186 }, { "epoch": 0.38, "learning_rate": 7.361408999815895e-06, "loss": 2.4682, "step": 3187 }, { "epoch": 0.38, "learning_rate": 7.359639158836828e-06, "loss": 2.3934, "step": 3188 }, { "epoch": 0.38, "learning_rate": 7.357868937416467e-06, "loss": 2.5834, "step": 3189 }, { "epoch": 0.38, "learning_rate": 7.356098335840221e-06, "loss": 2.6682, "step": 3190 }, { "epoch": 0.38, "learning_rate": 7.3543273543935645e-06, "loss": 2.5951, "step": 3191 }, { "epoch": 0.38, "learning_rate": 7.352555993362025e-06, "loss": 2.5319, "step": 3192 }, { "epoch": 0.38, "learning_rate": 7.350784253031202e-06, "loss": 2.5352, "step": 3193 }, { "epoch": 0.38, "learning_rate": 7.349012133686748e-06, "loss": 2.4875, "step": 3194 }, { "epoch": 0.38, "learning_rate": 7.3472396356143806e-06, "loss": 2.7119, "step": 3195 }, { "epoch": 0.38, "learning_rate": 7.345466759099875e-06, "loss": 2.5444, "step": 3196 }, { "epoch": 0.38, "learning_rate": 7.343693504429071e-06, "loss": 2.424, "step": 3197 }, { "epoch": 0.38, "learning_rate": 7.341919871887868e-06, "loss": 2.6463, "step": 3198 }, { "epoch": 0.38, "learning_rate": 7.340145861762226e-06, "loss": 2.5197, "step": 3199 }, { "epoch": 0.38, "learning_rate": 7.3383714743381664e-06, "loss": 2.4189, "step": 3200 }, { "epoch": 0.38, "learning_rate": 7.3365967099017725e-06, "loss": 2.4497, "step": 3201 }, { "epoch": 0.38, "learning_rate": 7.3348215687391844e-06, "loss": 2.5978, "step": 3202 }, { "epoch": 0.38, "learning_rate": 7.333046051136606e-06, "loss": 2.7241, "step": 3203 }, { "epoch": 0.38, "learning_rate": 7.331270157380304e-06, "loss": 2.4933, "step": 3204 }, { "epoch": 0.39, "learning_rate": 7.329493887756599e-06, "loss": 2.6976, "step": 3205 }, { "epoch": 0.39, "learning_rate": 7.327717242551882e-06, "loss": 2.6631, "step": 3206 }, { "epoch": 0.39, "learning_rate": 7.325940222052594e-06, "loss": 2.6559, "step": 3207 }, { "epoch": 0.39, "learning_rate": 7.324162826545245e-06, "loss": 2.6597, "step": 3208 }, { "epoch": 0.39, "learning_rate": 7.3223850563163985e-06, "loss": 2.6216, "step": 3209 }, { "epoch": 0.39, "learning_rate": 7.3206069116526855e-06, "loss": 2.5557, "step": 3210 }, { "epoch": 0.39, "learning_rate": 7.318828392840791e-06, "loss": 2.435, "step": 3211 }, { "epoch": 0.39, "learning_rate": 7.317049500167466e-06, "loss": 2.4956, "step": 3212 }, { "epoch": 0.39, "learning_rate": 7.315270233919516e-06, "loss": 2.4526, "step": 3213 }, { "epoch": 0.39, "learning_rate": 7.313490594383812e-06, "loss": 2.544, "step": 3214 }, { "epoch": 0.39, "learning_rate": 7.3117105818472786e-06, "loss": 2.726, "step": 3215 }, { "epoch": 0.39, "learning_rate": 7.309930196596909e-06, "loss": 2.7468, "step": 3216 }, { "epoch": 0.39, "learning_rate": 7.308149438919752e-06, "loss": 2.7192, "step": 3217 }, { "epoch": 0.39, "learning_rate": 7.306368309102914e-06, "loss": 2.4523, "step": 3218 }, { "epoch": 0.39, "learning_rate": 7.304586807433567e-06, "loss": 2.6558, "step": 3219 }, { "epoch": 0.39, "learning_rate": 7.302804934198937e-06, "loss": 2.4579, "step": 3220 }, { "epoch": 0.39, "learning_rate": 7.301022689686313e-06, "loss": 2.6612, "step": 3221 }, { "epoch": 0.39, "learning_rate": 7.299240074183047e-06, "loss": 2.5375, "step": 3222 }, { "epoch": 0.39, "learning_rate": 7.297457087976546e-06, "loss": 2.5869, "step": 3223 }, { "epoch": 0.39, "learning_rate": 7.295673731354278e-06, "loss": 2.6784, "step": 3224 }, { "epoch": 0.39, "learning_rate": 7.2938900046037705e-06, "loss": 2.6059, "step": 3225 }, { "epoch": 0.39, "learning_rate": 7.292105908012612e-06, "loss": 2.416, "step": 3226 }, { "epoch": 0.39, "learning_rate": 7.29032144186845e-06, "loss": 2.5658, "step": 3227 }, { "epoch": 0.39, "learning_rate": 7.28853660645899e-06, "loss": 2.6764, "step": 3228 }, { "epoch": 0.39, "learning_rate": 7.286751402072002e-06, "loss": 2.6524, "step": 3229 }, { "epoch": 0.39, "learning_rate": 7.2849658289953084e-06, "loss": 2.6203, "step": 3230 }, { "epoch": 0.39, "learning_rate": 7.283179887516797e-06, "loss": 2.7371, "step": 3231 }, { "epoch": 0.39, "learning_rate": 7.28139357792441e-06, "loss": 2.513, "step": 3232 }, { "epoch": 0.39, "learning_rate": 7.2796069005061545e-06, "loss": 2.6752, "step": 3233 }, { "epoch": 0.39, "learning_rate": 7.277819855550091e-06, "loss": 2.514, "step": 3234 }, { "epoch": 0.39, "learning_rate": 7.2760324433443455e-06, "loss": 2.6619, "step": 3235 }, { "epoch": 0.39, "learning_rate": 7.2742446641770985e-06, "loss": 2.6035, "step": 3236 }, { "epoch": 0.39, "learning_rate": 7.272456518336589e-06, "loss": 2.6032, "step": 3237 }, { "epoch": 0.39, "learning_rate": 7.270668006111121e-06, "loss": 2.6293, "step": 3238 }, { "epoch": 0.39, "learning_rate": 7.268879127789051e-06, "loss": 2.7696, "step": 3239 }, { "epoch": 0.39, "learning_rate": 7.267089883658798e-06, "loss": 2.5116, "step": 3240 }, { "epoch": 0.39, "learning_rate": 7.265300274008841e-06, "loss": 2.4573, "step": 3241 }, { "epoch": 0.39, "learning_rate": 7.263510299127714e-06, "loss": 2.5243, "step": 3242 }, { "epoch": 0.39, "learning_rate": 7.261719959304012e-06, "loss": 2.5355, "step": 3243 }, { "epoch": 0.39, "learning_rate": 7.259929254826393e-06, "loss": 2.6284, "step": 3244 }, { "epoch": 0.39, "learning_rate": 7.258138185983563e-06, "loss": 2.4836, "step": 3245 }, { "epoch": 0.39, "learning_rate": 7.256346753064299e-06, "loss": 2.6707, "step": 3246 }, { "epoch": 0.39, "learning_rate": 7.254554956357431e-06, "loss": 2.5784, "step": 3247 }, { "epoch": 0.39, "learning_rate": 7.252762796151843e-06, "loss": 2.5519, "step": 3248 }, { "epoch": 0.39, "learning_rate": 7.250970272736489e-06, "loss": 2.3794, "step": 3249 }, { "epoch": 0.39, "learning_rate": 7.249177386400369e-06, "loss": 2.5234, "step": 3250 }, { "epoch": 0.39, "learning_rate": 7.2473841374325516e-06, "loss": 2.5567, "step": 3251 }, { "epoch": 0.39, "learning_rate": 7.2455905261221585e-06, "loss": 2.4524, "step": 3252 }, { "epoch": 0.39, "learning_rate": 7.243796552758371e-06, "loss": 2.7544, "step": 3253 }, { "epoch": 0.39, "learning_rate": 7.242002217630428e-06, "loss": 2.5569, "step": 3254 }, { "epoch": 0.39, "learning_rate": 7.2402075210276304e-06, "loss": 2.521, "step": 3255 }, { "epoch": 0.39, "learning_rate": 7.238412463239332e-06, "loss": 2.5745, "step": 3256 }, { "epoch": 0.39, "learning_rate": 7.236617044554948e-06, "loss": 2.5726, "step": 3257 }, { "epoch": 0.39, "learning_rate": 7.234821265263952e-06, "loss": 2.7212, "step": 3258 }, { "epoch": 0.39, "learning_rate": 7.2330251256558724e-06, "loss": 2.5722, "step": 3259 }, { "epoch": 0.39, "learning_rate": 7.231228626020303e-06, "loss": 2.6385, "step": 3260 }, { "epoch": 0.39, "learning_rate": 7.2294317666468875e-06, "loss": 2.546, "step": 3261 }, { "epoch": 0.39, "learning_rate": 7.227634547825332e-06, "loss": 2.512, "step": 3262 }, { "epoch": 0.39, "learning_rate": 7.225836969845398e-06, "loss": 2.5028, "step": 3263 }, { "epoch": 0.39, "learning_rate": 7.224039032996909e-06, "loss": 2.4587, "step": 3264 }, { "epoch": 0.39, "learning_rate": 7.222240737569741e-06, "loss": 2.6003, "step": 3265 }, { "epoch": 0.39, "learning_rate": 7.220442083853834e-06, "loss": 2.6241, "step": 3266 }, { "epoch": 0.39, "learning_rate": 7.2186430721391796e-06, "loss": 2.5696, "step": 3267 }, { "epoch": 0.39, "learning_rate": 7.216843702715831e-06, "loss": 2.4726, "step": 3268 }, { "epoch": 0.39, "learning_rate": 7.215043975873899e-06, "loss": 2.593, "step": 3269 }, { "epoch": 0.39, "learning_rate": 7.213243891903549e-06, "loss": 2.6046, "step": 3270 }, { "epoch": 0.39, "learning_rate": 7.211443451095007e-06, "loss": 2.4617, "step": 3271 }, { "epoch": 0.39, "learning_rate": 7.209642653738555e-06, "loss": 2.3496, "step": 3272 }, { "epoch": 0.39, "learning_rate": 7.207841500124535e-06, "loss": 2.4933, "step": 3273 }, { "epoch": 0.39, "learning_rate": 7.206039990543341e-06, "loss": 2.5011, "step": 3274 }, { "epoch": 0.39, "learning_rate": 7.204238125285432e-06, "loss": 2.4039, "step": 3275 }, { "epoch": 0.39, "learning_rate": 7.202435904641316e-06, "loss": 2.6036, "step": 3276 }, { "epoch": 0.39, "learning_rate": 7.200633328901565e-06, "loss": 2.5698, "step": 3277 }, { "epoch": 0.39, "learning_rate": 7.198830398356807e-06, "loss": 2.5325, "step": 3278 }, { "epoch": 0.39, "learning_rate": 7.197027113297722e-06, "loss": 2.4972, "step": 3279 }, { "epoch": 0.39, "learning_rate": 7.195223474015054e-06, "loss": 2.4004, "step": 3280 }, { "epoch": 0.39, "learning_rate": 7.193419480799601e-06, "loss": 2.5698, "step": 3281 }, { "epoch": 0.39, "learning_rate": 7.191615133942215e-06, "loss": 2.5352, "step": 3282 }, { "epoch": 0.39, "learning_rate": 7.1898104337338145e-06, "loss": 2.7194, "step": 3283 }, { "epoch": 0.39, "learning_rate": 7.188005380465365e-06, "loss": 2.5107, "step": 3284 }, { "epoch": 0.39, "learning_rate": 7.186199974427892e-06, "loss": 2.537, "step": 3285 }, { "epoch": 0.39, "learning_rate": 7.18439421591248e-06, "loss": 2.4788, "step": 3286 }, { "epoch": 0.39, "learning_rate": 7.1825881052102675e-06, "loss": 2.7171, "step": 3287 }, { "epoch": 0.4, "learning_rate": 7.180781642612453e-06, "loss": 2.4893, "step": 3288 }, { "epoch": 0.4, "learning_rate": 7.17897482841029e-06, "loss": 2.6121, "step": 3289 }, { "epoch": 0.4, "learning_rate": 7.177167662895087e-06, "loss": 2.68, "step": 3290 }, { "epoch": 0.4, "learning_rate": 7.175360146358212e-06, "loss": 2.5491, "step": 3291 }, { "epoch": 0.4, "learning_rate": 7.173552279091087e-06, "loss": 2.5489, "step": 3292 }, { "epoch": 0.4, "learning_rate": 7.1717440613851916e-06, "loss": 2.3796, "step": 3293 }, { "epoch": 0.4, "learning_rate": 7.169935493532065e-06, "loss": 2.5513, "step": 3294 }, { "epoch": 0.4, "learning_rate": 7.168126575823299e-06, "loss": 2.6148, "step": 3295 }, { "epoch": 0.4, "learning_rate": 7.166317308550541e-06, "loss": 2.4997, "step": 3296 }, { "epoch": 0.4, "learning_rate": 7.164507692005498e-06, "loss": 2.5133, "step": 3297 }, { "epoch": 0.4, "learning_rate": 7.162697726479931e-06, "loss": 2.426, "step": 3298 }, { "epoch": 0.4, "learning_rate": 7.16088741226566e-06, "loss": 2.5029, "step": 3299 }, { "epoch": 0.4, "learning_rate": 7.159076749654559e-06, "loss": 2.566, "step": 3300 }, { "epoch": 0.4, "learning_rate": 7.157265738938557e-06, "loss": 2.5352, "step": 3301 }, { "epoch": 0.4, "learning_rate": 7.1554543804096425e-06, "loss": 2.5181, "step": 3302 }, { "epoch": 0.4, "learning_rate": 7.153642674359855e-06, "loss": 2.5259, "step": 3303 }, { "epoch": 0.4, "learning_rate": 7.151830621081297e-06, "loss": 2.5003, "step": 3304 }, { "epoch": 0.4, "learning_rate": 7.1500182208661214e-06, "loss": 2.4168, "step": 3305 }, { "epoch": 0.4, "learning_rate": 7.148205474006542e-06, "loss": 2.5064, "step": 3306 }, { "epoch": 0.4, "learning_rate": 7.146392380794821e-06, "loss": 2.51, "step": 3307 }, { "epoch": 0.4, "learning_rate": 7.144578941523283e-06, "loss": 2.6186, "step": 3308 }, { "epoch": 0.4, "learning_rate": 7.142765156484306e-06, "loss": 2.7698, "step": 3309 }, { "epoch": 0.4, "learning_rate": 7.140951025970324e-06, "loss": 2.5073, "step": 3310 }, { "epoch": 0.4, "learning_rate": 7.139136550273828e-06, "loss": 2.5513, "step": 3311 }, { "epoch": 0.4, "learning_rate": 7.137321729687361e-06, "loss": 2.6306, "step": 3312 }, { "epoch": 0.4, "learning_rate": 7.135506564503525e-06, "loss": 2.6023, "step": 3313 }, { "epoch": 0.4, "learning_rate": 7.1336910550149775e-06, "loss": 2.5843, "step": 3314 }, { "epoch": 0.4, "learning_rate": 7.131875201514429e-06, "loss": 2.5588, "step": 3315 }, { "epoch": 0.4, "learning_rate": 7.130059004294647e-06, "loss": 2.5233, "step": 3316 }, { "epoch": 0.4, "learning_rate": 7.128242463648456e-06, "loss": 2.3727, "step": 3317 }, { "epoch": 0.4, "learning_rate": 7.126425579868733e-06, "loss": 2.4892, "step": 3318 }, { "epoch": 0.4, "learning_rate": 7.124608353248412e-06, "loss": 2.5658, "step": 3319 }, { "epoch": 0.4, "learning_rate": 7.122790784080482e-06, "loss": 2.6595, "step": 3320 }, { "epoch": 0.4, "learning_rate": 7.120972872657986e-06, "loss": 2.5787, "step": 3321 }, { "epoch": 0.4, "learning_rate": 7.119154619274027e-06, "loss": 2.6978, "step": 3322 }, { "epoch": 0.4, "learning_rate": 7.117336024221755e-06, "loss": 2.4182, "step": 3323 }, { "epoch": 0.4, "learning_rate": 7.115517087794381e-06, "loss": 2.5343, "step": 3324 }, { "epoch": 0.4, "learning_rate": 7.11369781028517e-06, "loss": 2.5621, "step": 3325 }, { "epoch": 0.4, "learning_rate": 7.111878191987441e-06, "loss": 2.5746, "step": 3326 }, { "epoch": 0.4, "learning_rate": 7.110058233194569e-06, "loss": 2.5858, "step": 3327 }, { "epoch": 0.4, "learning_rate": 7.108237934199983e-06, "loss": 2.5498, "step": 3328 }, { "epoch": 0.4, "learning_rate": 7.106417295297169e-06, "loss": 2.5795, "step": 3329 }, { "epoch": 0.4, "learning_rate": 7.104596316779663e-06, "loss": 2.4783, "step": 3330 }, { "epoch": 0.4, "learning_rate": 7.102774998941061e-06, "loss": 2.6812, "step": 3331 }, { "epoch": 0.4, "learning_rate": 7.10095334207501e-06, "loss": 2.3636, "step": 3332 }, { "epoch": 0.4, "learning_rate": 7.099131346475213e-06, "loss": 2.606, "step": 3333 }, { "epoch": 0.4, "learning_rate": 7.097309012435431e-06, "loss": 2.7828, "step": 3334 }, { "epoch": 0.4, "learning_rate": 7.095486340249473e-06, "loss": 2.3757, "step": 3335 }, { "epoch": 0.4, "learning_rate": 7.093663330211208e-06, "loss": 2.3866, "step": 3336 }, { "epoch": 0.4, "learning_rate": 7.091839982614555e-06, "loss": 2.6594, "step": 3337 }, { "epoch": 0.4, "learning_rate": 7.090016297753492e-06, "loss": 2.5154, "step": 3338 }, { "epoch": 0.4, "learning_rate": 7.088192275922046e-06, "loss": 2.4907, "step": 3339 }, { "epoch": 0.4, "learning_rate": 7.086367917414307e-06, "loss": 2.5544, "step": 3340 }, { "epoch": 0.4, "learning_rate": 7.084543222524408e-06, "loss": 2.3842, "step": 3341 }, { "epoch": 0.4, "learning_rate": 7.082718191546546e-06, "loss": 2.5327, "step": 3342 }, { "epoch": 0.4, "learning_rate": 7.080892824774965e-06, "loss": 2.5057, "step": 3343 }, { "epoch": 0.4, "learning_rate": 7.079067122503969e-06, "loss": 2.7276, "step": 3344 }, { "epoch": 0.4, "learning_rate": 7.07724108502791e-06, "loss": 2.6554, "step": 3345 }, { "epoch": 0.4, "learning_rate": 7.075414712641203e-06, "loss": 2.6792, "step": 3346 }, { "epoch": 0.4, "learning_rate": 7.073588005638308e-06, "loss": 2.5875, "step": 3347 }, { "epoch": 0.4, "learning_rate": 7.071760964313739e-06, "loss": 2.5652, "step": 3348 }, { "epoch": 0.4, "learning_rate": 7.0699335889620746e-06, "loss": 2.5507, "step": 3349 }, { "epoch": 0.4, "learning_rate": 7.0681058798779335e-06, "loss": 2.3991, "step": 3350 }, { "epoch": 0.4, "learning_rate": 7.066277837355999e-06, "loss": 2.5742, "step": 3351 }, { "epoch": 0.4, "learning_rate": 7.064449461691003e-06, "loss": 2.5156, "step": 3352 }, { "epoch": 0.4, "learning_rate": 7.0626207531777305e-06, "loss": 2.3594, "step": 3353 }, { "epoch": 0.4, "learning_rate": 7.060791712111021e-06, "loss": 2.5027, "step": 3354 }, { "epoch": 0.4, "learning_rate": 7.0589623387857705e-06, "loss": 2.4226, "step": 3355 }, { "epoch": 0.4, "learning_rate": 7.057132633496924e-06, "loss": 2.5909, "step": 3356 }, { "epoch": 0.4, "learning_rate": 7.055302596539485e-06, "loss": 2.5679, "step": 3357 }, { "epoch": 0.4, "learning_rate": 7.053472228208506e-06, "loss": 2.5209, "step": 3358 }, { "epoch": 0.4, "learning_rate": 7.0516415287990945e-06, "loss": 2.6139, "step": 3359 }, { "epoch": 0.4, "learning_rate": 7.049810498606413e-06, "loss": 2.622, "step": 3360 }, { "epoch": 0.4, "learning_rate": 7.047979137925674e-06, "loss": 2.65, "step": 3361 }, { "epoch": 0.4, "learning_rate": 7.046147447052146e-06, "loss": 2.574, "step": 3362 }, { "epoch": 0.4, "learning_rate": 7.044315426281151e-06, "loss": 2.4838, "step": 3363 }, { "epoch": 0.4, "learning_rate": 7.042483075908062e-06, "loss": 2.5026, "step": 3364 }, { "epoch": 0.4, "learning_rate": 7.040650396228306e-06, "loss": 2.4315, "step": 3365 }, { "epoch": 0.4, "learning_rate": 7.038817387537364e-06, "loss": 2.6086, "step": 3366 }, { "epoch": 0.4, "learning_rate": 7.036984050130771e-06, "loss": 2.5921, "step": 3367 }, { "epoch": 0.4, "learning_rate": 7.03515038430411e-06, "loss": 2.6474, "step": 3368 }, { "epoch": 0.4, "learning_rate": 7.033316390353022e-06, "loss": 2.4734, "step": 3369 }, { "epoch": 0.4, "learning_rate": 7.031482068573201e-06, "loss": 2.418, "step": 3370 }, { "epoch": 0.4, "learning_rate": 7.029647419260388e-06, "loss": 2.4721, "step": 3371 }, { "epoch": 0.41, "learning_rate": 7.027812442710385e-06, "loss": 2.595, "step": 3372 }, { "epoch": 0.41, "learning_rate": 7.0259771392190405e-06, "loss": 2.3401, "step": 3373 }, { "epoch": 0.41, "learning_rate": 7.024141509082259e-06, "loss": 2.529, "step": 3374 }, { "epoch": 0.41, "learning_rate": 7.022305552595996e-06, "loss": 2.5277, "step": 3375 }, { "epoch": 0.41, "learning_rate": 7.020469270056258e-06, "loss": 2.5605, "step": 3376 }, { "epoch": 0.41, "learning_rate": 7.018632661759112e-06, "loss": 2.5286, "step": 3377 }, { "epoch": 0.41, "learning_rate": 7.016795728000666e-06, "loss": 2.6061, "step": 3378 }, { "epoch": 0.41, "learning_rate": 7.014958469077087e-06, "loss": 2.5439, "step": 3379 }, { "epoch": 0.41, "learning_rate": 7.013120885284599e-06, "loss": 2.6058, "step": 3380 }, { "epoch": 0.41, "learning_rate": 7.011282976919467e-06, "loss": 2.494, "step": 3381 }, { "epoch": 0.41, "learning_rate": 7.0094447442780156e-06, "loss": 2.7405, "step": 3382 }, { "epoch": 0.41, "learning_rate": 7.007606187656623e-06, "loss": 2.4808, "step": 3383 }, { "epoch": 0.41, "learning_rate": 7.005767307351714e-06, "loss": 2.56, "step": 3384 }, { "epoch": 0.41, "learning_rate": 7.003928103659771e-06, "loss": 2.4512, "step": 3385 }, { "epoch": 0.41, "learning_rate": 7.002088576877325e-06, "loss": 2.3884, "step": 3386 }, { "epoch": 0.41, "learning_rate": 7.00024872730096e-06, "loss": 2.5553, "step": 3387 }, { "epoch": 0.41, "learning_rate": 6.9984085552273136e-06, "loss": 2.4752, "step": 3388 }, { "epoch": 0.41, "learning_rate": 6.996568060953075e-06, "loss": 2.5007, "step": 3389 }, { "epoch": 0.41, "learning_rate": 6.994727244774981e-06, "loss": 2.438, "step": 3390 }, { "epoch": 0.41, "learning_rate": 6.992886106989827e-06, "loss": 2.7247, "step": 3391 }, { "epoch": 0.41, "learning_rate": 6.991044647894456e-06, "loss": 2.5372, "step": 3392 }, { "epoch": 0.41, "learning_rate": 6.989202867785762e-06, "loss": 2.5679, "step": 3393 }, { "epoch": 0.41, "learning_rate": 6.987360766960697e-06, "loss": 2.7698, "step": 3394 }, { "epoch": 0.41, "learning_rate": 6.985518345716256e-06, "loss": 2.3488, "step": 3395 }, { "epoch": 0.41, "learning_rate": 6.983675604349492e-06, "loss": 2.544, "step": 3396 }, { "epoch": 0.41, "learning_rate": 6.981832543157507e-06, "loss": 2.4098, "step": 3397 }, { "epoch": 0.41, "learning_rate": 6.9799891624374565e-06, "loss": 2.4566, "step": 3398 }, { "epoch": 0.41, "learning_rate": 6.978145462486544e-06, "loss": 2.5263, "step": 3399 }, { "epoch": 0.41, "learning_rate": 6.9763014436020285e-06, "loss": 2.5483, "step": 3400 }, { "epoch": 0.41, "learning_rate": 6.9744571060812185e-06, "loss": 2.5378, "step": 3401 }, { "epoch": 0.41, "learning_rate": 6.972612450221471e-06, "loss": 2.6029, "step": 3402 }, { "epoch": 0.41, "learning_rate": 6.9707674763202e-06, "loss": 2.471, "step": 3403 }, { "epoch": 0.41, "learning_rate": 6.968922184674868e-06, "loss": 2.489, "step": 3404 }, { "epoch": 0.41, "learning_rate": 6.967076575582989e-06, "loss": 2.4791, "step": 3405 }, { "epoch": 0.41, "learning_rate": 6.965230649342127e-06, "loss": 2.4615, "step": 3406 }, { "epoch": 0.41, "learning_rate": 6.963384406249898e-06, "loss": 2.5226, "step": 3407 }, { "epoch": 0.41, "learning_rate": 6.96153784660397e-06, "loss": 2.4778, "step": 3408 }, { "epoch": 0.41, "learning_rate": 6.959690970702059e-06, "loss": 2.5375, "step": 3409 }, { "epoch": 0.41, "learning_rate": 6.957843778841937e-06, "loss": 2.6204, "step": 3410 }, { "epoch": 0.41, "learning_rate": 6.955996271321423e-06, "loss": 2.4206, "step": 3411 }, { "epoch": 0.41, "learning_rate": 6.954148448438389e-06, "loss": 2.5351, "step": 3412 }, { "epoch": 0.41, "learning_rate": 6.9523003104907565e-06, "loss": 2.6069, "step": 3413 }, { "epoch": 0.41, "learning_rate": 6.950451857776495e-06, "loss": 2.7543, "step": 3414 }, { "epoch": 0.41, "learning_rate": 6.948603090593632e-06, "loss": 2.5575, "step": 3415 }, { "epoch": 0.41, "learning_rate": 6.946754009240241e-06, "loss": 2.4693, "step": 3416 }, { "epoch": 0.41, "learning_rate": 6.944904614014445e-06, "loss": 2.5934, "step": 3417 }, { "epoch": 0.41, "learning_rate": 6.943054905214421e-06, "loss": 2.5002, "step": 3418 }, { "epoch": 0.41, "learning_rate": 6.941204883138395e-06, "loss": 2.6119, "step": 3419 }, { "epoch": 0.41, "learning_rate": 6.9393545480846405e-06, "loss": 2.4744, "step": 3420 }, { "epoch": 0.41, "learning_rate": 6.9375039003514876e-06, "loss": 2.4601, "step": 3421 }, { "epoch": 0.41, "learning_rate": 6.935652940237313e-06, "loss": 2.6223, "step": 3422 }, { "epoch": 0.41, "learning_rate": 6.933801668040544e-06, "loss": 2.6702, "step": 3423 }, { "epoch": 0.41, "learning_rate": 6.9319500840596596e-06, "loss": 2.4057, "step": 3424 }, { "epoch": 0.41, "learning_rate": 6.930098188593185e-06, "loss": 2.7331, "step": 3425 }, { "epoch": 0.41, "learning_rate": 6.9282459819397016e-06, "loss": 2.4977, "step": 3426 }, { "epoch": 0.41, "learning_rate": 6.926393464397838e-06, "loss": 2.5082, "step": 3427 }, { "epoch": 0.41, "learning_rate": 6.924540636266272e-06, "loss": 2.4777, "step": 3428 }, { "epoch": 0.41, "learning_rate": 6.922687497843734e-06, "loss": 2.5447, "step": 3429 }, { "epoch": 0.41, "learning_rate": 6.920834049429002e-06, "loss": 2.4544, "step": 3430 }, { "epoch": 0.41, "learning_rate": 6.918980291320902e-06, "loss": 2.6058, "step": 3431 }, { "epoch": 0.41, "learning_rate": 6.917126223818315e-06, "loss": 2.4188, "step": 3432 }, { "epoch": 0.41, "learning_rate": 6.9152718472201715e-06, "loss": 2.5214, "step": 3433 }, { "epoch": 0.41, "learning_rate": 6.913417161825449e-06, "loss": 2.438, "step": 3434 }, { "epoch": 0.41, "learning_rate": 6.911562167933176e-06, "loss": 2.537, "step": 3435 }, { "epoch": 0.41, "learning_rate": 6.909706865842429e-06, "loss": 2.5084, "step": 3436 }, { "epoch": 0.41, "learning_rate": 6.907851255852336e-06, "loss": 2.5394, "step": 3437 }, { "epoch": 0.41, "learning_rate": 6.905995338262075e-06, "loss": 2.627, "step": 3438 }, { "epoch": 0.41, "learning_rate": 6.904139113370875e-06, "loss": 2.4779, "step": 3439 }, { "epoch": 0.41, "learning_rate": 6.902282581478009e-06, "loss": 2.5839, "step": 3440 }, { "epoch": 0.41, "learning_rate": 6.9004257428828044e-06, "loss": 2.6905, "step": 3441 }, { "epoch": 0.41, "learning_rate": 6.8985685978846385e-06, "loss": 2.436, "step": 3442 }, { "epoch": 0.41, "learning_rate": 6.896711146782933e-06, "loss": 2.4503, "step": 3443 }, { "epoch": 0.41, "learning_rate": 6.894853389877163e-06, "loss": 2.7182, "step": 3444 }, { "epoch": 0.41, "learning_rate": 6.892995327466854e-06, "loss": 2.394, "step": 3445 }, { "epoch": 0.41, "learning_rate": 6.891136959851576e-06, "loss": 2.3424, "step": 3446 }, { "epoch": 0.41, "learning_rate": 6.889278287330955e-06, "loss": 2.4091, "step": 3447 }, { "epoch": 0.41, "learning_rate": 6.887419310204657e-06, "loss": 2.4229, "step": 3448 }, { "epoch": 0.41, "learning_rate": 6.885560028772406e-06, "loss": 2.56, "step": 3449 }, { "epoch": 0.41, "learning_rate": 6.88370044333397e-06, "loss": 2.4882, "step": 3450 }, { "epoch": 0.41, "learning_rate": 6.881840554189167e-06, "loss": 2.6487, "step": 3451 }, { "epoch": 0.41, "learning_rate": 6.879980361637865e-06, "loss": 2.4626, "step": 3452 }, { "epoch": 0.41, "learning_rate": 6.878119865979982e-06, "loss": 2.5608, "step": 3453 }, { "epoch": 0.41, "learning_rate": 6.876259067515478e-06, "loss": 2.6365, "step": 3454 }, { "epoch": 0.42, "learning_rate": 6.874397966544371e-06, "loss": 2.6155, "step": 3455 }, { "epoch": 0.42, "learning_rate": 6.872536563366724e-06, "loss": 2.5183, "step": 3456 }, { "epoch": 0.42, "learning_rate": 6.870674858282647e-06, "loss": 2.5987, "step": 3457 }, { "epoch": 0.42, "learning_rate": 6.868812851592299e-06, "loss": 2.5776, "step": 3458 }, { "epoch": 0.42, "learning_rate": 6.866950543595891e-06, "loss": 2.3885, "step": 3459 }, { "epoch": 0.42, "learning_rate": 6.86508793459368e-06, "loss": 2.4621, "step": 3460 }, { "epoch": 0.42, "learning_rate": 6.863225024885968e-06, "loss": 2.4538, "step": 3461 }, { "epoch": 0.42, "learning_rate": 6.861361814773114e-06, "loss": 2.6471, "step": 3462 }, { "epoch": 0.42, "learning_rate": 6.85949830455552e-06, "loss": 2.5987, "step": 3463 }, { "epoch": 0.42, "learning_rate": 6.857634494533636e-06, "loss": 2.4264, "step": 3464 }, { "epoch": 0.42, "learning_rate": 6.8557703850079605e-06, "loss": 2.577, "step": 3465 }, { "epoch": 0.42, "learning_rate": 6.8539059762790425e-06, "loss": 2.598, "step": 3466 }, { "epoch": 0.42, "learning_rate": 6.852041268647478e-06, "loss": 2.5505, "step": 3467 }, { "epoch": 0.42, "learning_rate": 6.8501762624139125e-06, "loss": 2.539, "step": 3468 }, { "epoch": 0.42, "learning_rate": 6.848310957879036e-06, "loss": 2.6697, "step": 3469 }, { "epoch": 0.42, "learning_rate": 6.846445355343591e-06, "loss": 2.5349, "step": 3470 }, { "epoch": 0.42, "learning_rate": 6.844579455108362e-06, "loss": 2.4591, "step": 3471 }, { "epoch": 0.42, "learning_rate": 6.842713257474191e-06, "loss": 2.505, "step": 3472 }, { "epoch": 0.42, "learning_rate": 6.8408467627419575e-06, "loss": 2.5075, "step": 3473 }, { "epoch": 0.42, "learning_rate": 6.838979971212598e-06, "loss": 2.7163, "step": 3474 }, { "epoch": 0.42, "learning_rate": 6.837112883187089e-06, "loss": 2.4738, "step": 3475 }, { "epoch": 0.42, "learning_rate": 6.835245498966461e-06, "loss": 2.4947, "step": 3476 }, { "epoch": 0.42, "learning_rate": 6.833377818851789e-06, "loss": 2.5098, "step": 3477 }, { "epoch": 0.42, "learning_rate": 6.8315098431441955e-06, "loss": 2.4884, "step": 3478 }, { "epoch": 0.42, "learning_rate": 6.829641572144854e-06, "loss": 2.5255, "step": 3479 }, { "epoch": 0.42, "learning_rate": 6.8277730061549806e-06, "loss": 2.6656, "step": 3480 }, { "epoch": 0.42, "learning_rate": 6.825904145475842e-06, "loss": 2.5295, "step": 3481 }, { "epoch": 0.42, "learning_rate": 6.824034990408753e-06, "loss": 2.4591, "step": 3482 }, { "epoch": 0.42, "learning_rate": 6.8221655412550746e-06, "loss": 2.5537, "step": 3483 }, { "epoch": 0.42, "learning_rate": 6.820295798316214e-06, "loss": 2.5295, "step": 3484 }, { "epoch": 0.42, "learning_rate": 6.81842576189363e-06, "loss": 2.4957, "step": 3485 }, { "epoch": 0.42, "learning_rate": 6.816555432288824e-06, "loss": 2.4792, "step": 3486 }, { "epoch": 0.42, "learning_rate": 6.814684809803347e-06, "loss": 2.7786, "step": 3487 }, { "epoch": 0.42, "learning_rate": 6.8128138947387966e-06, "loss": 2.5126, "step": 3488 }, { "epoch": 0.42, "learning_rate": 6.810942687396818e-06, "loss": 2.5993, "step": 3489 }, { "epoch": 0.42, "learning_rate": 6.8090711880791025e-06, "loss": 2.4943, "step": 3490 }, { "epoch": 0.42, "learning_rate": 6.807199397087391e-06, "loss": 2.6227, "step": 3491 }, { "epoch": 0.42, "learning_rate": 6.805327314723469e-06, "loss": 2.4049, "step": 3492 }, { "epoch": 0.42, "learning_rate": 6.803454941289168e-06, "loss": 2.4009, "step": 3493 }, { "epoch": 0.42, "learning_rate": 6.801582277086371e-06, "loss": 2.6056, "step": 3494 }, { "epoch": 0.42, "learning_rate": 6.7997093224170045e-06, "loss": 2.3961, "step": 3495 }, { "epoch": 0.42, "learning_rate": 6.79783607758304e-06, "loss": 2.4373, "step": 3496 }, { "epoch": 0.42, "learning_rate": 6.795962542886501e-06, "loss": 2.5217, "step": 3497 }, { "epoch": 0.42, "learning_rate": 6.794088718629451e-06, "loss": 2.4587, "step": 3498 }, { "epoch": 0.42, "learning_rate": 6.792214605114009e-06, "loss": 2.3403, "step": 3499 }, { "epoch": 0.42, "learning_rate": 6.790340202642333e-06, "loss": 2.6014, "step": 3500 }, { "epoch": 0.42, "learning_rate": 6.7884655115166285e-06, "loss": 2.5895, "step": 3501 }, { "epoch": 0.42, "learning_rate": 6.786590532039152e-06, "loss": 2.4506, "step": 3502 }, { "epoch": 0.42, "learning_rate": 6.784715264512205e-06, "loss": 2.7009, "step": 3503 }, { "epoch": 0.42, "learning_rate": 6.78283970923813e-06, "loss": 2.5024, "step": 3504 }, { "epoch": 0.42, "learning_rate": 6.7809638665193235e-06, "loss": 2.6888, "step": 3505 }, { "epoch": 0.42, "learning_rate": 6.7790877366582255e-06, "loss": 2.4187, "step": 3506 }, { "epoch": 0.42, "learning_rate": 6.777211319957318e-06, "loss": 2.4443, "step": 3507 }, { "epoch": 0.42, "learning_rate": 6.775334616719136e-06, "loss": 2.5614, "step": 3508 }, { "epoch": 0.42, "learning_rate": 6.773457627246256e-06, "loss": 2.5991, "step": 3509 }, { "epoch": 0.42, "learning_rate": 6.771580351841304e-06, "loss": 2.5444, "step": 3510 }, { "epoch": 0.42, "learning_rate": 6.769702790806949e-06, "loss": 2.5674, "step": 3511 }, { "epoch": 0.42, "learning_rate": 6.76782494444591e-06, "loss": 2.5935, "step": 3512 }, { "epoch": 0.42, "learning_rate": 6.765946813060946e-06, "loss": 2.5608, "step": 3513 }, { "epoch": 0.42, "learning_rate": 6.764068396954868e-06, "loss": 2.7615, "step": 3514 }, { "epoch": 0.42, "learning_rate": 6.76218969643053e-06, "loss": 2.612, "step": 3515 }, { "epoch": 0.42, "learning_rate": 6.760310711790831e-06, "loss": 2.5248, "step": 3516 }, { "epoch": 0.42, "learning_rate": 6.75843144333872e-06, "loss": 2.4135, "step": 3517 }, { "epoch": 0.42, "learning_rate": 6.756551891377185e-06, "loss": 2.525, "step": 3518 }, { "epoch": 0.42, "learning_rate": 6.7546720562092664e-06, "loss": 2.4553, "step": 3519 }, { "epoch": 0.42, "learning_rate": 6.752791938138046e-06, "loss": 2.5535, "step": 3520 }, { "epoch": 0.42, "learning_rate": 6.7509115374666515e-06, "loss": 2.4303, "step": 3521 }, { "epoch": 0.42, "learning_rate": 6.74903085449826e-06, "loss": 2.5413, "step": 3522 }, { "epoch": 0.42, "learning_rate": 6.747149889536089e-06, "loss": 2.5923, "step": 3523 }, { "epoch": 0.42, "learning_rate": 6.7452686428834045e-06, "loss": 2.6194, "step": 3524 }, { "epoch": 0.42, "learning_rate": 6.743387114843518e-06, "loss": 2.4902, "step": 3525 }, { "epoch": 0.42, "learning_rate": 6.741505305719785e-06, "loss": 2.511, "step": 3526 }, { "epoch": 0.42, "learning_rate": 6.739623215815607e-06, "loss": 2.5482, "step": 3527 }, { "epoch": 0.42, "learning_rate": 6.737740845434432e-06, "loss": 2.4535, "step": 3528 }, { "epoch": 0.42, "learning_rate": 6.7358581948797495e-06, "loss": 2.4784, "step": 3529 }, { "epoch": 0.42, "learning_rate": 6.733975264455097e-06, "loss": 2.3545, "step": 3530 }, { "epoch": 0.42, "learning_rate": 6.7320920544640585e-06, "loss": 2.4496, "step": 3531 }, { "epoch": 0.42, "learning_rate": 6.73020856521026e-06, "loss": 2.5349, "step": 3532 }, { "epoch": 0.42, "learning_rate": 6.7283247969973756e-06, "loss": 2.5711, "step": 3533 }, { "epoch": 0.42, "learning_rate": 6.7264407501291195e-06, "loss": 2.5519, "step": 3534 }, { "epoch": 0.42, "learning_rate": 6.724556424909256e-06, "loss": 2.5586, "step": 3535 }, { "epoch": 0.42, "learning_rate": 6.722671821641591e-06, "loss": 2.4885, "step": 3536 }, { "epoch": 0.42, "learning_rate": 6.720786940629977e-06, "loss": 2.6116, "step": 3537 }, { "epoch": 0.43, "learning_rate": 6.718901782178312e-06, "loss": 2.7089, "step": 3538 }, { "epoch": 0.43, "learning_rate": 6.717016346590536e-06, "loss": 2.5655, "step": 3539 }, { "epoch": 0.43, "learning_rate": 6.715130634170636e-06, "loss": 2.5051, "step": 3540 }, { "epoch": 0.43, "learning_rate": 6.7132446452226405e-06, "loss": 2.5019, "step": 3541 }, { "epoch": 0.43, "learning_rate": 6.711358380050628e-06, "loss": 2.6083, "step": 3542 }, { "epoch": 0.43, "learning_rate": 6.709471838958715e-06, "loss": 2.7503, "step": 3543 }, { "epoch": 0.43, "learning_rate": 6.707585022251068e-06, "loss": 2.6002, "step": 3544 }, { "epoch": 0.43, "learning_rate": 6.705697930231898e-06, "loss": 2.4639, "step": 3545 }, { "epoch": 0.43, "learning_rate": 6.703810563205454e-06, "loss": 2.5349, "step": 3546 }, { "epoch": 0.43, "learning_rate": 6.7019229214760365e-06, "loss": 2.6932, "step": 3547 }, { "epoch": 0.43, "learning_rate": 6.700035005347983e-06, "loss": 2.3157, "step": 3548 }, { "epoch": 0.43, "learning_rate": 6.698146815125685e-06, "loss": 2.4562, "step": 3549 }, { "epoch": 0.43, "learning_rate": 6.696258351113569e-06, "loss": 2.5796, "step": 3550 }, { "epoch": 0.43, "learning_rate": 6.694369613616113e-06, "loss": 2.6003, "step": 3551 }, { "epoch": 0.43, "learning_rate": 6.692480602937832e-06, "loss": 2.4744, "step": 3552 }, { "epoch": 0.43, "learning_rate": 6.690591319383289e-06, "loss": 2.6278, "step": 3553 }, { "epoch": 0.43, "learning_rate": 6.68870176325709e-06, "loss": 2.5808, "step": 3554 }, { "epoch": 0.43, "learning_rate": 6.68681193486389e-06, "loss": 2.5646, "step": 3555 }, { "epoch": 0.43, "learning_rate": 6.6849218345083785e-06, "loss": 2.4373, "step": 3556 }, { "epoch": 0.43, "learning_rate": 6.683031462495296e-06, "loss": 2.4639, "step": 3557 }, { "epoch": 0.43, "learning_rate": 6.681140819129424e-06, "loss": 2.5158, "step": 3558 }, { "epoch": 0.43, "learning_rate": 6.679249904715588e-06, "loss": 2.4793, "step": 3559 }, { "epoch": 0.43, "learning_rate": 6.677358719558655e-06, "loss": 2.6138, "step": 3560 }, { "epoch": 0.43, "learning_rate": 6.675467263963544e-06, "loss": 2.7053, "step": 3561 }, { "epoch": 0.43, "learning_rate": 6.6735755382352074e-06, "loss": 2.5928, "step": 3562 }, { "epoch": 0.43, "learning_rate": 6.671683542678646e-06, "loss": 2.589, "step": 3563 }, { "epoch": 0.43, "learning_rate": 6.6697912775989045e-06, "loss": 2.73, "step": 3564 }, { "epoch": 0.43, "learning_rate": 6.66789874330107e-06, "loss": 2.5841, "step": 3565 }, { "epoch": 0.43, "learning_rate": 6.666005940090271e-06, "loss": 2.5886, "step": 3566 }, { "epoch": 0.43, "learning_rate": 6.664112868271686e-06, "loss": 2.4859, "step": 3567 }, { "epoch": 0.43, "learning_rate": 6.662219528150529e-06, "loss": 2.5956, "step": 3568 }, { "epoch": 0.43, "learning_rate": 6.660325920032061e-06, "loss": 2.5993, "step": 3569 }, { "epoch": 0.43, "learning_rate": 6.658432044221584e-06, "loss": 2.3985, "step": 3570 }, { "epoch": 0.43, "learning_rate": 6.656537901024448e-06, "loss": 2.4631, "step": 3571 }, { "epoch": 0.43, "learning_rate": 6.654643490746042e-06, "loss": 2.4616, "step": 3572 }, { "epoch": 0.43, "learning_rate": 6.6527488136917995e-06, "loss": 2.6352, "step": 3573 }, { "epoch": 0.43, "learning_rate": 6.650853870167196e-06, "loss": 2.5351, "step": 3574 }, { "epoch": 0.43, "learning_rate": 6.648958660477751e-06, "loss": 2.5779, "step": 3575 }, { "epoch": 0.43, "learning_rate": 6.647063184929025e-06, "loss": 2.5388, "step": 3576 }, { "epoch": 0.43, "learning_rate": 6.645167443826624e-06, "loss": 2.6739, "step": 3577 }, { "epoch": 0.43, "learning_rate": 6.643271437476196e-06, "loss": 2.5951, "step": 3578 }, { "epoch": 0.43, "learning_rate": 6.641375166183432e-06, "loss": 2.4106, "step": 3579 }, { "epoch": 0.43, "learning_rate": 6.6394786302540645e-06, "loss": 2.6302, "step": 3580 }, { "epoch": 0.43, "learning_rate": 6.6375818299938685e-06, "loss": 2.5257, "step": 3581 }, { "epoch": 0.43, "learning_rate": 6.635684765708662e-06, "loss": 2.4935, "step": 3582 }, { "epoch": 0.43, "learning_rate": 6.633787437704308e-06, "loss": 2.7234, "step": 3583 }, { "epoch": 0.43, "learning_rate": 6.6318898462867086e-06, "loss": 2.6244, "step": 3584 }, { "epoch": 0.43, "learning_rate": 6.629991991761811e-06, "loss": 2.4376, "step": 3585 }, { "epoch": 0.43, "learning_rate": 6.6280938744356025e-06, "loss": 2.6211, "step": 3586 }, { "epoch": 0.43, "learning_rate": 6.6261954946141134e-06, "loss": 2.616, "step": 3587 }, { "epoch": 0.43, "learning_rate": 6.624296852603419e-06, "loss": 2.6237, "step": 3588 }, { "epoch": 0.43, "learning_rate": 6.622397948709632e-06, "loss": 2.4744, "step": 3589 }, { "epoch": 0.43, "learning_rate": 6.6204987832389115e-06, "loss": 2.3844, "step": 3590 }, { "epoch": 0.43, "learning_rate": 6.6185993564974585e-06, "loss": 2.4213, "step": 3591 }, { "epoch": 0.43, "learning_rate": 6.616699668791512e-06, "loss": 2.5316, "step": 3592 }, { "epoch": 0.43, "learning_rate": 6.614799720427357e-06, "loss": 2.4745, "step": 3593 }, { "epoch": 0.43, "learning_rate": 6.612899511711322e-06, "loss": 2.4829, "step": 3594 }, { "epoch": 0.43, "learning_rate": 6.610999042949771e-06, "loss": 2.505, "step": 3595 }, { "epoch": 0.43, "learning_rate": 6.609098314449116e-06, "loss": 2.676, "step": 3596 }, { "epoch": 0.43, "learning_rate": 6.607197326515808e-06, "loss": 2.7384, "step": 3597 }, { "epoch": 0.43, "learning_rate": 6.605296079456342e-06, "loss": 2.532, "step": 3598 }, { "epoch": 0.43, "learning_rate": 6.603394573577253e-06, "loss": 2.3399, "step": 3599 }, { "epoch": 0.43, "learning_rate": 6.601492809185118e-06, "loss": 2.5882, "step": 3600 }, { "epoch": 0.43, "learning_rate": 6.599590786586554e-06, "loss": 2.5883, "step": 3601 }, { "epoch": 0.43, "learning_rate": 6.597688506088224e-06, "loss": 2.4541, "step": 3602 }, { "epoch": 0.43, "learning_rate": 6.595785967996828e-06, "loss": 2.5639, "step": 3603 }, { "epoch": 0.43, "learning_rate": 6.593883172619111e-06, "loss": 2.4487, "step": 3604 }, { "epoch": 0.43, "learning_rate": 6.591980120261857e-06, "loss": 2.6249, "step": 3605 }, { "epoch": 0.43, "learning_rate": 6.5900768112318936e-06, "loss": 2.6483, "step": 3606 }, { "epoch": 0.43, "learning_rate": 6.588173245836087e-06, "loss": 2.5078, "step": 3607 }, { "epoch": 0.43, "learning_rate": 6.586269424381349e-06, "loss": 2.6789, "step": 3608 }, { "epoch": 0.43, "learning_rate": 6.584365347174626e-06, "loss": 2.6752, "step": 3609 }, { "epoch": 0.43, "learning_rate": 6.582461014522913e-06, "loss": 2.6031, "step": 3610 }, { "epoch": 0.43, "learning_rate": 6.580556426733242e-06, "loss": 2.4531, "step": 3611 }, { "epoch": 0.43, "learning_rate": 6.578651584112687e-06, "loss": 2.5375, "step": 3612 }, { "epoch": 0.43, "learning_rate": 6.576746486968363e-06, "loss": 2.5404, "step": 3613 }, { "epoch": 0.43, "learning_rate": 6.574841135607426e-06, "loss": 2.6264, "step": 3614 }, { "epoch": 0.43, "learning_rate": 6.572935530337073e-06, "loss": 2.5931, "step": 3615 }, { "epoch": 0.43, "learning_rate": 6.571029671464542e-06, "loss": 2.6492, "step": 3616 }, { "epoch": 0.43, "learning_rate": 6.569123559297113e-06, "loss": 2.5023, "step": 3617 }, { "epoch": 0.43, "learning_rate": 6.567217194142104e-06, "loss": 2.4458, "step": 3618 }, { "epoch": 0.43, "learning_rate": 6.565310576306877e-06, "loss": 2.4768, "step": 3619 }, { "epoch": 0.43, "learning_rate": 6.563403706098833e-06, "loss": 2.531, "step": 3620 }, { "epoch": 0.44, "learning_rate": 6.561496583825413e-06, "loss": 2.3396, "step": 3621 }, { "epoch": 0.44, "learning_rate": 6.559589209794102e-06, "loss": 2.5596, "step": 3622 }, { "epoch": 0.44, "learning_rate": 6.5576815843124205e-06, "loss": 2.5697, "step": 3623 }, { "epoch": 0.44, "learning_rate": 6.5557737076879335e-06, "loss": 2.6553, "step": 3624 }, { "epoch": 0.44, "learning_rate": 6.553865580228246e-06, "loss": 2.6455, "step": 3625 }, { "epoch": 0.44, "learning_rate": 6.551957202241001e-06, "loss": 2.4026, "step": 3626 }, { "epoch": 0.44, "learning_rate": 6.550048574033885e-06, "loss": 2.623, "step": 3627 }, { "epoch": 0.44, "learning_rate": 6.5481396959146225e-06, "loss": 2.5947, "step": 3628 }, { "epoch": 0.44, "learning_rate": 6.54623056819098e-06, "loss": 2.5972, "step": 3629 }, { "epoch": 0.44, "learning_rate": 6.544321191170764e-06, "loss": 2.4611, "step": 3630 }, { "epoch": 0.44, "learning_rate": 6.5424115651618195e-06, "loss": 2.6117, "step": 3631 }, { "epoch": 0.44, "learning_rate": 6.540501690472032e-06, "loss": 2.4188, "step": 3632 }, { "epoch": 0.44, "learning_rate": 6.5385915674093295e-06, "loss": 2.6753, "step": 3633 }, { "epoch": 0.44, "learning_rate": 6.536681196281678e-06, "loss": 2.5817, "step": 3634 }, { "epoch": 0.44, "learning_rate": 6.534770577397084e-06, "loss": 2.5957, "step": 3635 }, { "epoch": 0.44, "learning_rate": 6.532859711063594e-06, "loss": 2.622, "step": 3636 }, { "epoch": 0.44, "learning_rate": 6.530948597589293e-06, "loss": 2.6513, "step": 3637 }, { "epoch": 0.44, "learning_rate": 6.529037237282309e-06, "loss": 2.4837, "step": 3638 }, { "epoch": 0.44, "learning_rate": 6.527125630450808e-06, "loss": 2.3508, "step": 3639 }, { "epoch": 0.44, "learning_rate": 6.5252137774029955e-06, "loss": 2.5426, "step": 3640 }, { "epoch": 0.44, "learning_rate": 6.523301678447113e-06, "loss": 2.7029, "step": 3641 }, { "epoch": 0.44, "learning_rate": 6.5213893338914515e-06, "loss": 2.4754, "step": 3642 }, { "epoch": 0.44, "learning_rate": 6.5194767440443315e-06, "loss": 2.5594, "step": 3643 }, { "epoch": 0.44, "learning_rate": 6.517563909214119e-06, "loss": 2.6044, "step": 3644 }, { "epoch": 0.44, "learning_rate": 6.515650829709217e-06, "loss": 2.4836, "step": 3645 }, { "epoch": 0.44, "learning_rate": 6.513737505838069e-06, "loss": 2.4863, "step": 3646 }, { "epoch": 0.44, "learning_rate": 6.511823937909158e-06, "loss": 2.4536, "step": 3647 }, { "epoch": 0.44, "learning_rate": 6.509910126231003e-06, "loss": 2.6277, "step": 3648 }, { "epoch": 0.44, "learning_rate": 6.507996071112168e-06, "loss": 2.6093, "step": 3649 }, { "epoch": 0.44, "learning_rate": 6.5060817728612544e-06, "loss": 2.6891, "step": 3650 }, { "epoch": 0.44, "learning_rate": 6.5041672317868984e-06, "loss": 2.5324, "step": 3651 }, { "epoch": 0.44, "learning_rate": 6.502252448197782e-06, "loss": 2.625, "step": 3652 }, { "epoch": 0.44, "learning_rate": 6.500337422402619e-06, "loss": 2.6434, "step": 3653 }, { "epoch": 0.44, "learning_rate": 6.498422154710171e-06, "loss": 2.5062, "step": 3654 }, { "epoch": 0.44, "learning_rate": 6.49650664542923e-06, "loss": 2.7233, "step": 3655 }, { "epoch": 0.44, "learning_rate": 6.4945908948686355e-06, "loss": 2.7268, "step": 3656 }, { "epoch": 0.44, "learning_rate": 6.492674903337257e-06, "loss": 2.5823, "step": 3657 }, { "epoch": 0.44, "learning_rate": 6.490758671144006e-06, "loss": 2.4805, "step": 3658 }, { "epoch": 0.44, "learning_rate": 6.48884219859784e-06, "loss": 2.5523, "step": 3659 }, { "epoch": 0.44, "learning_rate": 6.486925486007743e-06, "loss": 2.5479, "step": 3660 }, { "epoch": 0.44, "learning_rate": 6.485008533682748e-06, "loss": 2.5667, "step": 3661 }, { "epoch": 0.44, "learning_rate": 6.4830913419319205e-06, "loss": 2.3752, "step": 3662 }, { "epoch": 0.44, "learning_rate": 6.481173911064367e-06, "loss": 2.597, "step": 3663 }, { "epoch": 0.44, "learning_rate": 6.479256241389231e-06, "loss": 2.6501, "step": 3664 }, { "epoch": 0.44, "learning_rate": 6.4773383332156985e-06, "loss": 2.5663, "step": 3665 }, { "epoch": 0.44, "learning_rate": 6.47542018685299e-06, "loss": 2.6456, "step": 3666 }, { "epoch": 0.44, "learning_rate": 6.473501802610364e-06, "loss": 2.5619, "step": 3667 }, { "epoch": 0.44, "learning_rate": 6.471583180797121e-06, "loss": 2.6434, "step": 3668 }, { "epoch": 0.44, "learning_rate": 6.469664321722595e-06, "loss": 2.6267, "step": 3669 }, { "epoch": 0.44, "learning_rate": 6.467745225696164e-06, "loss": 2.4389, "step": 3670 }, { "epoch": 0.44, "learning_rate": 6.465825893027238e-06, "loss": 2.517, "step": 3671 }, { "epoch": 0.44, "learning_rate": 6.463906324025272e-06, "loss": 2.537, "step": 3672 }, { "epoch": 0.44, "learning_rate": 6.4619865189997536e-06, "loss": 2.4526, "step": 3673 }, { "epoch": 0.44, "learning_rate": 6.460066478260209e-06, "loss": 2.6329, "step": 3674 }, { "epoch": 0.44, "learning_rate": 6.458146202116206e-06, "loss": 2.5594, "step": 3675 }, { "epoch": 0.44, "learning_rate": 6.456225690877345e-06, "loss": 2.5028, "step": 3676 }, { "epoch": 0.44, "learning_rate": 6.454304944853269e-06, "loss": 2.4956, "step": 3677 }, { "epoch": 0.44, "learning_rate": 6.452383964353659e-06, "loss": 2.4796, "step": 3678 }, { "epoch": 0.44, "learning_rate": 6.4504627496882284e-06, "loss": 2.7503, "step": 3679 }, { "epoch": 0.44, "learning_rate": 6.448541301166737e-06, "loss": 2.4559, "step": 3680 }, { "epoch": 0.44, "learning_rate": 6.44661961909897e-06, "loss": 2.5203, "step": 3681 }, { "epoch": 0.44, "learning_rate": 6.4446977037947635e-06, "loss": 2.5451, "step": 3682 }, { "epoch": 0.44, "learning_rate": 6.442775555563984e-06, "loss": 2.4295, "step": 3683 }, { "epoch": 0.44, "learning_rate": 6.440853174716535e-06, "loss": 2.7933, "step": 3684 }, { "epoch": 0.44, "learning_rate": 6.438930561562361e-06, "loss": 2.4571, "step": 3685 }, { "epoch": 0.44, "learning_rate": 6.437007716411441e-06, "loss": 2.5555, "step": 3686 }, { "epoch": 0.44, "learning_rate": 6.435084639573792e-06, "loss": 2.6315, "step": 3687 }, { "epoch": 0.44, "learning_rate": 6.43316133135947e-06, "loss": 2.6183, "step": 3688 }, { "epoch": 0.44, "learning_rate": 6.4312377920785685e-06, "loss": 2.5398, "step": 3689 }, { "epoch": 0.44, "learning_rate": 6.429314022041216e-06, "loss": 2.3666, "step": 3690 }, { "epoch": 0.44, "learning_rate": 6.427390021557579e-06, "loss": 2.4387, "step": 3691 }, { "epoch": 0.44, "learning_rate": 6.4254657909378615e-06, "loss": 2.5695, "step": 3692 }, { "epoch": 0.44, "learning_rate": 6.4235413304923025e-06, "loss": 2.4248, "step": 3693 }, { "epoch": 0.44, "learning_rate": 6.421616640531183e-06, "loss": 2.633, "step": 3694 }, { "epoch": 0.44, "learning_rate": 6.419691721364817e-06, "loss": 2.621, "step": 3695 }, { "epoch": 0.44, "learning_rate": 6.417766573303557e-06, "loss": 2.5487, "step": 3696 }, { "epoch": 0.44, "learning_rate": 6.415841196657792e-06, "loss": 2.4969, "step": 3697 }, { "epoch": 0.44, "learning_rate": 6.4139155917379445e-06, "loss": 2.5071, "step": 3698 }, { "epoch": 0.44, "learning_rate": 6.411989758854482e-06, "loss": 2.7043, "step": 3699 }, { "epoch": 0.44, "learning_rate": 6.410063698317901e-06, "loss": 2.6105, "step": 3700 }, { "epoch": 0.44, "learning_rate": 6.408137410438738e-06, "loss": 2.5549, "step": 3701 }, { "epoch": 0.44, "learning_rate": 6.406210895527567e-06, "loss": 2.629, "step": 3702 }, { "epoch": 0.44, "learning_rate": 6.404284153894995e-06, "loss": 2.2953, "step": 3703 }, { "epoch": 0.44, "learning_rate": 6.402357185851669e-06, "loss": 2.3908, "step": 3704 }, { "epoch": 0.45, "learning_rate": 6.40042999170827e-06, "loss": 2.5741, "step": 3705 }, { "epoch": 0.45, "learning_rate": 6.39850257177552e-06, "loss": 2.601, "step": 3706 }, { "epoch": 0.45, "learning_rate": 6.396574926364172e-06, "loss": 2.5252, "step": 3707 }, { "epoch": 0.45, "learning_rate": 6.394647055785017e-06, "loss": 2.5862, "step": 3708 }, { "epoch": 0.45, "learning_rate": 6.3927189603488835e-06, "loss": 2.6775, "step": 3709 }, { "epoch": 0.45, "learning_rate": 6.3907906403666355e-06, "loss": 2.6005, "step": 3710 }, { "epoch": 0.45, "learning_rate": 6.388862096149173e-06, "loss": 2.4173, "step": 3711 }, { "epoch": 0.45, "learning_rate": 6.386933328007434e-06, "loss": 2.5111, "step": 3712 }, { "epoch": 0.45, "learning_rate": 6.385004336252392e-06, "loss": 2.5264, "step": 3713 }, { "epoch": 0.45, "learning_rate": 6.383075121195051e-06, "loss": 2.5429, "step": 3714 }, { "epoch": 0.45, "learning_rate": 6.381145683146459e-06, "loss": 2.5776, "step": 3715 }, { "epoch": 0.45, "learning_rate": 6.379216022417695e-06, "loss": 2.4665, "step": 3716 }, { "epoch": 0.45, "learning_rate": 6.377286139319878e-06, "loss": 2.3581, "step": 3717 }, { "epoch": 0.45, "learning_rate": 6.375356034164159e-06, "loss": 2.5014, "step": 3718 }, { "epoch": 0.45, "learning_rate": 6.373425707261725e-06, "loss": 2.7837, "step": 3719 }, { "epoch": 0.45, "learning_rate": 6.371495158923801e-06, "loss": 2.7078, "step": 3720 }, { "epoch": 0.45, "learning_rate": 6.369564389461644e-06, "loss": 2.4752, "step": 3721 }, { "epoch": 0.45, "learning_rate": 6.367633399186554e-06, "loss": 2.4045, "step": 3722 }, { "epoch": 0.45, "learning_rate": 6.365702188409859e-06, "loss": 2.5954, "step": 3723 }, { "epoch": 0.45, "learning_rate": 6.363770757442927e-06, "loss": 2.5643, "step": 3724 }, { "epoch": 0.45, "learning_rate": 6.3618391065971565e-06, "loss": 2.4706, "step": 3725 }, { "epoch": 0.45, "learning_rate": 6.359907236183988e-06, "loss": 2.466, "step": 3726 }, { "epoch": 0.45, "learning_rate": 6.357975146514893e-06, "loss": 2.6247, "step": 3727 }, { "epoch": 0.45, "learning_rate": 6.3560428379013795e-06, "loss": 2.5249, "step": 3728 }, { "epoch": 0.45, "learning_rate": 6.354110310654992e-06, "loss": 2.4566, "step": 3729 }, { "epoch": 0.45, "learning_rate": 6.352177565087308e-06, "loss": 2.4077, "step": 3730 }, { "epoch": 0.45, "learning_rate": 6.350244601509943e-06, "loss": 2.7088, "step": 3731 }, { "epoch": 0.45, "learning_rate": 6.348311420234542e-06, "loss": 2.7253, "step": 3732 }, { "epoch": 0.45, "learning_rate": 6.346378021572795e-06, "loss": 2.5939, "step": 3733 }, { "epoch": 0.45, "learning_rate": 6.344444405836414e-06, "loss": 2.8125, "step": 3734 }, { "epoch": 0.45, "learning_rate": 6.34251057333716e-06, "loss": 2.4783, "step": 3735 }, { "epoch": 0.45, "learning_rate": 6.340576524386819e-06, "loss": 2.4292, "step": 3736 }, { "epoch": 0.45, "learning_rate": 6.338642259297214e-06, "loss": 2.5913, "step": 3737 }, { "epoch": 0.45, "learning_rate": 6.336707778380207e-06, "loss": 2.4744, "step": 3738 }, { "epoch": 0.45, "learning_rate": 6.3347730819476875e-06, "loss": 2.5118, "step": 3739 }, { "epoch": 0.45, "learning_rate": 6.332838170311586e-06, "loss": 2.6141, "step": 3740 }, { "epoch": 0.45, "learning_rate": 6.330903043783867e-06, "loss": 2.5305, "step": 3741 }, { "epoch": 0.45, "learning_rate": 6.328967702676528e-06, "loss": 2.4725, "step": 3742 }, { "epoch": 0.45, "learning_rate": 6.327032147301596e-06, "loss": 2.5415, "step": 3743 }, { "epoch": 0.45, "learning_rate": 6.325096377971145e-06, "loss": 2.4754, "step": 3744 }, { "epoch": 0.45, "learning_rate": 6.323160394997273e-06, "loss": 2.5013, "step": 3745 }, { "epoch": 0.45, "learning_rate": 6.321224198692115e-06, "loss": 2.5, "step": 3746 }, { "epoch": 0.45, "learning_rate": 6.319287789367844e-06, "loss": 2.5858, "step": 3747 }, { "epoch": 0.45, "learning_rate": 6.31735116733666e-06, "loss": 2.6736, "step": 3748 }, { "epoch": 0.45, "learning_rate": 6.315414332910807e-06, "loss": 2.6039, "step": 3749 }, { "epoch": 0.45, "learning_rate": 6.313477286402557e-06, "loss": 2.2934, "step": 3750 }, { "epoch": 0.45, "learning_rate": 6.311540028124214e-06, "loss": 2.4773, "step": 3751 }, { "epoch": 0.45, "learning_rate": 6.309602558388122e-06, "loss": 2.5347, "step": 3752 }, { "epoch": 0.45, "learning_rate": 6.307664877506657e-06, "loss": 2.5361, "step": 3753 }, { "epoch": 0.45, "learning_rate": 6.305726985792227e-06, "loss": 2.6407, "step": 3754 }, { "epoch": 0.45, "learning_rate": 6.303788883557276e-06, "loss": 2.5262, "step": 3755 }, { "epoch": 0.45, "learning_rate": 6.301850571114282e-06, "loss": 2.5746, "step": 3756 }, { "epoch": 0.45, "learning_rate": 6.2999120487757535e-06, "loss": 2.5742, "step": 3757 }, { "epoch": 0.45, "learning_rate": 6.297973316854241e-06, "loss": 2.7387, "step": 3758 }, { "epoch": 0.45, "learning_rate": 6.296034375662321e-06, "loss": 2.5202, "step": 3759 }, { "epoch": 0.45, "learning_rate": 6.294095225512604e-06, "loss": 2.5415, "step": 3760 }, { "epoch": 0.45, "learning_rate": 6.29215586671774e-06, "loss": 2.7613, "step": 3761 }, { "epoch": 0.45, "learning_rate": 6.290216299590407e-06, "loss": 2.5604, "step": 3762 }, { "epoch": 0.45, "learning_rate": 6.288276524443319e-06, "loss": 2.4239, "step": 3763 }, { "epoch": 0.45, "learning_rate": 6.286336541589224e-06, "loss": 2.5269, "step": 3764 }, { "epoch": 0.45, "learning_rate": 6.2843963513409015e-06, "loss": 2.5552, "step": 3765 }, { "epoch": 0.45, "learning_rate": 6.282455954011166e-06, "loss": 2.4145, "step": 3766 }, { "epoch": 0.45, "learning_rate": 6.280515349912866e-06, "loss": 2.4981, "step": 3767 }, { "epoch": 0.45, "learning_rate": 6.2785745393588815e-06, "loss": 2.6869, "step": 3768 }, { "epoch": 0.45, "learning_rate": 6.276633522662127e-06, "loss": 2.6129, "step": 3769 }, { "epoch": 0.45, "learning_rate": 6.27469230013555e-06, "loss": 2.7346, "step": 3770 }, { "epoch": 0.45, "learning_rate": 6.272750872092128e-06, "loss": 2.6123, "step": 3771 }, { "epoch": 0.45, "learning_rate": 6.270809238844881e-06, "loss": 2.7158, "step": 3772 }, { "epoch": 0.45, "learning_rate": 6.26886740070685e-06, "loss": 2.643, "step": 3773 }, { "epoch": 0.45, "learning_rate": 6.266925357991118e-06, "loss": 2.61, "step": 3774 }, { "epoch": 0.45, "learning_rate": 6.264983111010796e-06, "loss": 2.6215, "step": 3775 }, { "epoch": 0.45, "learning_rate": 6.263040660079031e-06, "loss": 2.4995, "step": 3776 }, { "epoch": 0.45, "learning_rate": 6.261098005509002e-06, "loss": 2.513, "step": 3777 }, { "epoch": 0.45, "learning_rate": 6.25915514761392e-06, "loss": 2.5109, "step": 3778 }, { "epoch": 0.45, "learning_rate": 6.2572120867070286e-06, "loss": 2.6455, "step": 3779 }, { "epoch": 0.45, "learning_rate": 6.255268823101604e-06, "loss": 2.3787, "step": 3780 }, { "epoch": 0.45, "learning_rate": 6.253325357110957e-06, "loss": 2.3545, "step": 3781 }, { "epoch": 0.45, "learning_rate": 6.25138168904843e-06, "loss": 2.5868, "step": 3782 }, { "epoch": 0.45, "learning_rate": 6.2494378192273995e-06, "loss": 2.4098, "step": 3783 }, { "epoch": 0.45, "learning_rate": 6.24749374796127e-06, "loss": 2.5499, "step": 3784 }, { "epoch": 0.45, "learning_rate": 6.2455494755634825e-06, "loss": 2.5285, "step": 3785 }, { "epoch": 0.45, "learning_rate": 6.243605002347508e-06, "loss": 2.5452, "step": 3786 }, { "epoch": 0.45, "learning_rate": 6.241660328626853e-06, "loss": 2.3822, "step": 3787 }, { "epoch": 0.46, "learning_rate": 6.239715454715054e-06, "loss": 2.6895, "step": 3788 }, { "epoch": 0.46, "learning_rate": 6.237770380925682e-06, "loss": 2.7445, "step": 3789 }, { "epoch": 0.46, "learning_rate": 6.235825107572335e-06, "loss": 2.518, "step": 3790 }, { "epoch": 0.46, "learning_rate": 6.233879634968649e-06, "loss": 2.6076, "step": 3791 }, { "epoch": 0.46, "learning_rate": 6.231933963428288e-06, "loss": 2.4786, "step": 3792 }, { "epoch": 0.46, "learning_rate": 6.2299880932649515e-06, "loss": 2.6228, "step": 3793 }, { "epoch": 0.46, "learning_rate": 6.22804202479237e-06, "loss": 2.5041, "step": 3794 }, { "epoch": 0.46, "learning_rate": 6.226095758324304e-06, "loss": 2.4939, "step": 3795 }, { "epoch": 0.46, "learning_rate": 6.224149294174549e-06, "loss": 2.4139, "step": 3796 }, { "epoch": 0.46, "learning_rate": 6.222202632656927e-06, "loss": 2.3342, "step": 3797 }, { "epoch": 0.46, "learning_rate": 6.220255774085297e-06, "loss": 2.4234, "step": 3798 }, { "epoch": 0.46, "learning_rate": 6.218308718773551e-06, "loss": 2.7604, "step": 3799 }, { "epoch": 0.46, "learning_rate": 6.216361467035608e-06, "loss": 2.5816, "step": 3800 }, { "epoch": 0.46, "learning_rate": 6.214414019185421e-06, "loss": 2.58, "step": 3801 }, { "epoch": 0.46, "learning_rate": 6.212466375536974e-06, "loss": 2.5587, "step": 3802 }, { "epoch": 0.46, "learning_rate": 6.210518536404282e-06, "loss": 2.4652, "step": 3803 }, { "epoch": 0.46, "learning_rate": 6.208570502101393e-06, "loss": 2.6887, "step": 3804 }, { "epoch": 0.46, "learning_rate": 6.206622272942386e-06, "loss": 2.5344, "step": 3805 }, { "epoch": 0.46, "learning_rate": 6.204673849241372e-06, "loss": 2.56, "step": 3806 }, { "epoch": 0.46, "learning_rate": 6.202725231312492e-06, "loss": 2.4485, "step": 3807 }, { "epoch": 0.46, "learning_rate": 6.200776419469918e-06, "loss": 2.675, "step": 3808 }, { "epoch": 0.46, "learning_rate": 6.198827414027856e-06, "loss": 2.5281, "step": 3809 }, { "epoch": 0.46, "learning_rate": 6.196878215300538e-06, "loss": 2.598, "step": 3810 }, { "epoch": 0.46, "learning_rate": 6.194928823602235e-06, "loss": 2.6079, "step": 3811 }, { "epoch": 0.46, "learning_rate": 6.192979239247243e-06, "loss": 2.6066, "step": 3812 }, { "epoch": 0.46, "learning_rate": 6.1910294625498904e-06, "loss": 2.5422, "step": 3813 }, { "epoch": 0.46, "learning_rate": 6.1890794938245355e-06, "loss": 2.7632, "step": 3814 }, { "epoch": 0.46, "learning_rate": 6.187129333385571e-06, "loss": 2.5497, "step": 3815 }, { "epoch": 0.46, "learning_rate": 6.1851789815474175e-06, "loss": 2.5933, "step": 3816 }, { "epoch": 0.46, "learning_rate": 6.183228438624528e-06, "loss": 2.3955, "step": 3817 }, { "epoch": 0.46, "learning_rate": 6.181277704931386e-06, "loss": 2.4543, "step": 3818 }, { "epoch": 0.46, "learning_rate": 6.1793267807825056e-06, "loss": 2.5337, "step": 3819 }, { "epoch": 0.46, "learning_rate": 6.177375666492431e-06, "loss": 2.5746, "step": 3820 }, { "epoch": 0.46, "learning_rate": 6.175424362375737e-06, "loss": 2.4997, "step": 3821 }, { "epoch": 0.46, "learning_rate": 6.17347286874703e-06, "loss": 2.551, "step": 3822 }, { "epoch": 0.46, "learning_rate": 6.171521185920948e-06, "loss": 2.5846, "step": 3823 }, { "epoch": 0.46, "learning_rate": 6.169569314212157e-06, "loss": 2.5286, "step": 3824 }, { "epoch": 0.46, "learning_rate": 6.1676172539353555e-06, "loss": 2.4873, "step": 3825 }, { "epoch": 0.46, "learning_rate": 6.165665005405268e-06, "loss": 2.6157, "step": 3826 }, { "epoch": 0.46, "learning_rate": 6.163712568936657e-06, "loss": 2.6965, "step": 3827 }, { "epoch": 0.46, "learning_rate": 6.161759944844308e-06, "loss": 2.6114, "step": 3828 }, { "epoch": 0.46, "learning_rate": 6.159807133443042e-06, "loss": 2.6759, "step": 3829 }, { "epoch": 0.46, "learning_rate": 6.1578541350477076e-06, "loss": 2.6991, "step": 3830 }, { "epoch": 0.46, "learning_rate": 6.155900949973184e-06, "loss": 2.5984, "step": 3831 }, { "epoch": 0.46, "learning_rate": 6.153947578534378e-06, "loss": 2.4548, "step": 3832 }, { "epoch": 0.46, "learning_rate": 6.151994021046233e-06, "loss": 2.7431, "step": 3833 }, { "epoch": 0.46, "learning_rate": 6.150040277823715e-06, "loss": 2.4875, "step": 3834 }, { "epoch": 0.46, "learning_rate": 6.148086349181824e-06, "loss": 2.5336, "step": 3835 }, { "epoch": 0.46, "learning_rate": 6.146132235435591e-06, "loss": 2.5493, "step": 3836 }, { "epoch": 0.46, "learning_rate": 6.144177936900073e-06, "loss": 2.4407, "step": 3837 }, { "epoch": 0.46, "learning_rate": 6.14222345389036e-06, "loss": 2.5409, "step": 3838 }, { "epoch": 0.46, "learning_rate": 6.140268786721571e-06, "loss": 2.6212, "step": 3839 }, { "epoch": 0.46, "learning_rate": 6.138313935708852e-06, "loss": 2.7249, "step": 3840 }, { "epoch": 0.46, "learning_rate": 6.1363589011673815e-06, "loss": 2.6356, "step": 3841 }, { "epoch": 0.46, "learning_rate": 6.1344036834123695e-06, "loss": 2.5843, "step": 3842 }, { "epoch": 0.46, "learning_rate": 6.1324482827590495e-06, "loss": 2.5712, "step": 3843 }, { "epoch": 0.46, "learning_rate": 6.1304926995226895e-06, "loss": 2.5164, "step": 3844 }, { "epoch": 0.46, "learning_rate": 6.128536934018587e-06, "loss": 2.6558, "step": 3845 }, { "epoch": 0.46, "learning_rate": 6.126580986562065e-06, "loss": 2.5482, "step": 3846 }, { "epoch": 0.46, "learning_rate": 6.12462485746848e-06, "loss": 2.4661, "step": 3847 }, { "epoch": 0.46, "learning_rate": 6.1226685470532125e-06, "loss": 2.4729, "step": 3848 }, { "epoch": 0.46, "learning_rate": 6.12071205563168e-06, "loss": 2.467, "step": 3849 }, { "epoch": 0.46, "learning_rate": 6.118755383519323e-06, "loss": 2.3403, "step": 3850 }, { "epoch": 0.46, "learning_rate": 6.116798531031612e-06, "loss": 2.4577, "step": 3851 }, { "epoch": 0.46, "learning_rate": 6.114841498484049e-06, "loss": 2.5683, "step": 3852 }, { "epoch": 0.46, "learning_rate": 6.112884286192163e-06, "loss": 2.5354, "step": 3853 }, { "epoch": 0.46, "learning_rate": 6.1109268944715125e-06, "loss": 2.4382, "step": 3854 }, { "epoch": 0.46, "learning_rate": 6.1089693236376854e-06, "loss": 2.3584, "step": 3855 }, { "epoch": 0.46, "learning_rate": 6.1070115740062985e-06, "loss": 2.6541, "step": 3856 }, { "epoch": 0.46, "learning_rate": 6.105053645892995e-06, "loss": 2.5337, "step": 3857 }, { "epoch": 0.46, "learning_rate": 6.103095539613452e-06, "loss": 2.692, "step": 3858 }, { "epoch": 0.46, "learning_rate": 6.1011372554833696e-06, "loss": 2.5418, "step": 3859 }, { "epoch": 0.46, "learning_rate": 6.099178793818479e-06, "loss": 2.7404, "step": 3860 }, { "epoch": 0.46, "learning_rate": 6.097220154934543e-06, "loss": 2.5488, "step": 3861 }, { "epoch": 0.46, "learning_rate": 6.095261339147347e-06, "loss": 2.5016, "step": 3862 }, { "epoch": 0.46, "learning_rate": 6.093302346772711e-06, "loss": 2.5127, "step": 3863 }, { "epoch": 0.46, "learning_rate": 6.091343178126478e-06, "loss": 2.6184, "step": 3864 }, { "epoch": 0.46, "learning_rate": 6.089383833524524e-06, "loss": 2.4993, "step": 3865 }, { "epoch": 0.46, "learning_rate": 6.0874243132827505e-06, "loss": 2.6617, "step": 3866 }, { "epoch": 0.46, "learning_rate": 6.085464617717088e-06, "loss": 2.4842, "step": 3867 }, { "epoch": 0.46, "learning_rate": 6.083504747143496e-06, "loss": 2.5359, "step": 3868 }, { "epoch": 0.46, "learning_rate": 6.08154470187796e-06, "loss": 2.6675, "step": 3869 }, { "epoch": 0.46, "learning_rate": 6.079584482236499e-06, "loss": 2.4625, "step": 3870 }, { "epoch": 0.47, "learning_rate": 6.077624088535152e-06, "loss": 2.4221, "step": 3871 }, { "epoch": 0.47, "learning_rate": 6.075663521089994e-06, "loss": 2.3978, "step": 3872 }, { "epoch": 0.47, "learning_rate": 6.073702780217124e-06, "loss": 2.5835, "step": 3873 }, { "epoch": 0.47, "learning_rate": 6.071741866232665e-06, "loss": 2.7314, "step": 3874 }, { "epoch": 0.47, "learning_rate": 6.069780779452779e-06, "loss": 2.6017, "step": 3875 }, { "epoch": 0.47, "learning_rate": 6.0678195201936455e-06, "loss": 2.6736, "step": 3876 }, { "epoch": 0.47, "learning_rate": 6.065858088771477e-06, "loss": 2.5366, "step": 3877 }, { "epoch": 0.47, "learning_rate": 6.06389648550251e-06, "loss": 2.7111, "step": 3878 }, { "epoch": 0.47, "learning_rate": 6.061934710703015e-06, "loss": 2.4499, "step": 3879 }, { "epoch": 0.47, "learning_rate": 6.059972764689283e-06, "loss": 2.4882, "step": 3880 }, { "epoch": 0.47, "learning_rate": 6.058010647777636e-06, "loss": 2.7229, "step": 3881 }, { "epoch": 0.47, "learning_rate": 6.056048360284424e-06, "loss": 2.467, "step": 3882 }, { "epoch": 0.47, "learning_rate": 6.0540859025260245e-06, "loss": 2.6057, "step": 3883 }, { "epoch": 0.47, "learning_rate": 6.0521232748188416e-06, "loss": 2.3461, "step": 3884 }, { "epoch": 0.47, "learning_rate": 6.050160477479305e-06, "loss": 2.6968, "step": 3885 }, { "epoch": 0.47, "learning_rate": 6.048197510823876e-06, "loss": 2.3131, "step": 3886 }, { "epoch": 0.47, "learning_rate": 6.046234375169041e-06, "loss": 2.4788, "step": 3887 }, { "epoch": 0.47, "learning_rate": 6.044271070831312e-06, "loss": 2.3937, "step": 3888 }, { "epoch": 0.47, "learning_rate": 6.0423075981272315e-06, "loss": 2.5292, "step": 3889 }, { "epoch": 0.47, "learning_rate": 6.040343957373367e-06, "loss": 2.5041, "step": 3890 }, { "epoch": 0.47, "learning_rate": 6.038380148886312e-06, "loss": 2.3524, "step": 3891 }, { "epoch": 0.47, "learning_rate": 6.0364161729826905e-06, "loss": 2.6107, "step": 3892 }, { "epoch": 0.47, "learning_rate": 6.03445202997915e-06, "loss": 2.5269, "step": 3893 }, { "epoch": 0.47, "learning_rate": 6.032487720192367e-06, "loss": 2.7897, "step": 3894 }, { "epoch": 0.47, "learning_rate": 6.030523243939046e-06, "loss": 2.6203, "step": 3895 }, { "epoch": 0.47, "learning_rate": 6.028558601535915e-06, "loss": 2.3367, "step": 3896 }, { "epoch": 0.47, "learning_rate": 6.02659379329973e-06, "loss": 2.6044, "step": 3897 }, { "epoch": 0.47, "learning_rate": 6.024628819547274e-06, "loss": 2.5391, "step": 3898 }, { "epoch": 0.47, "learning_rate": 6.022663680595361e-06, "loss": 2.527, "step": 3899 }, { "epoch": 0.47, "learning_rate": 6.020698376760824e-06, "loss": 2.6466, "step": 3900 }, { "epoch": 0.47, "learning_rate": 6.018732908360527e-06, "loss": 2.5457, "step": 3901 }, { "epoch": 0.47, "learning_rate": 6.016767275711359e-06, "loss": 2.4356, "step": 3902 }, { "epoch": 0.47, "learning_rate": 6.014801479130237e-06, "loss": 2.6068, "step": 3903 }, { "epoch": 0.47, "learning_rate": 6.012835518934102e-06, "loss": 2.3668, "step": 3904 }, { "epoch": 0.47, "learning_rate": 6.010869395439926e-06, "loss": 2.53, "step": 3905 }, { "epoch": 0.47, "learning_rate": 6.008903108964702e-06, "loss": 2.5431, "step": 3906 }, { "epoch": 0.47, "learning_rate": 6.006936659825453e-06, "loss": 2.5259, "step": 3907 }, { "epoch": 0.47, "learning_rate": 6.0049700483392256e-06, "loss": 2.4428, "step": 3908 }, { "epoch": 0.47, "learning_rate": 6.003003274823094e-06, "loss": 2.558, "step": 3909 }, { "epoch": 0.47, "learning_rate": 6.0010363395941585e-06, "loss": 2.5492, "step": 3910 }, { "epoch": 0.47, "learning_rate": 5.999069242969546e-06, "loss": 2.6465, "step": 3911 }, { "epoch": 0.47, "learning_rate": 5.997101985266408e-06, "loss": 2.5352, "step": 3912 }, { "epoch": 0.47, "learning_rate": 5.995134566801923e-06, "loss": 2.553, "step": 3913 }, { "epoch": 0.47, "learning_rate": 5.993166987893294e-06, "loss": 2.5015, "step": 3914 }, { "epoch": 0.47, "learning_rate": 5.991199248857752e-06, "loss": 2.5744, "step": 3915 }, { "epoch": 0.47, "learning_rate": 5.9892313500125545e-06, "loss": 2.5855, "step": 3916 }, { "epoch": 0.47, "learning_rate": 5.9872632916749796e-06, "loss": 2.5242, "step": 3917 }, { "epoch": 0.47, "learning_rate": 5.985295074162337e-06, "loss": 2.6281, "step": 3918 }, { "epoch": 0.47, "learning_rate": 5.983326697791959e-06, "loss": 2.4923, "step": 3919 }, { "epoch": 0.47, "learning_rate": 5.981358162881202e-06, "loss": 2.4754, "step": 3920 }, { "epoch": 0.47, "learning_rate": 5.979389469747453e-06, "loss": 2.5251, "step": 3921 }, { "epoch": 0.47, "learning_rate": 5.977420618708122e-06, "loss": 2.525, "step": 3922 }, { "epoch": 0.47, "learning_rate": 5.975451610080643e-06, "loss": 2.6192, "step": 3923 }, { "epoch": 0.47, "learning_rate": 5.9734824441824745e-06, "loss": 2.6711, "step": 3924 }, { "epoch": 0.47, "learning_rate": 5.971513121331105e-06, "loss": 2.5914, "step": 3925 }, { "epoch": 0.47, "learning_rate": 5.969543641844044e-06, "loss": 2.5018, "step": 3926 }, { "epoch": 0.47, "learning_rate": 5.967574006038829e-06, "loss": 2.4823, "step": 3927 }, { "epoch": 0.47, "learning_rate": 5.965604214233022e-06, "loss": 2.5358, "step": 3928 }, { "epoch": 0.47, "learning_rate": 5.9636342667442095e-06, "loss": 2.4957, "step": 3929 }, { "epoch": 0.47, "learning_rate": 5.961664163890002e-06, "loss": 2.5533, "step": 3930 }, { "epoch": 0.47, "learning_rate": 5.959693905988038e-06, "loss": 2.5552, "step": 3931 }, { "epoch": 0.47, "learning_rate": 5.957723493355977e-06, "loss": 2.5967, "step": 3932 }, { "epoch": 0.47, "learning_rate": 5.955752926311508e-06, "loss": 2.5695, "step": 3933 }, { "epoch": 0.47, "learning_rate": 5.953782205172343e-06, "loss": 2.5538, "step": 3934 }, { "epoch": 0.47, "learning_rate": 5.951811330256218e-06, "loss": 2.5676, "step": 3935 }, { "epoch": 0.47, "learning_rate": 5.949840301880894e-06, "loss": 2.74, "step": 3936 }, { "epoch": 0.47, "learning_rate": 5.947869120364157e-06, "loss": 2.5113, "step": 3937 }, { "epoch": 0.47, "learning_rate": 5.945897786023817e-06, "loss": 2.4869, "step": 3938 }, { "epoch": 0.47, "learning_rate": 5.943926299177713e-06, "loss": 2.6041, "step": 3939 }, { "epoch": 0.47, "learning_rate": 5.941954660143703e-06, "loss": 2.4952, "step": 3940 }, { "epoch": 0.47, "learning_rate": 5.93998286923967e-06, "loss": 2.5617, "step": 3941 }, { "epoch": 0.47, "learning_rate": 5.938010926783525e-06, "loss": 2.5811, "step": 3942 }, { "epoch": 0.47, "learning_rate": 5.936038833093199e-06, "loss": 2.5142, "step": 3943 }, { "epoch": 0.47, "learning_rate": 5.9340665884866535e-06, "loss": 2.4873, "step": 3944 }, { "epoch": 0.47, "learning_rate": 5.932094193281868e-06, "loss": 2.4744, "step": 3945 }, { "epoch": 0.47, "learning_rate": 5.930121647796852e-06, "loss": 2.5832, "step": 3946 }, { "epoch": 0.47, "learning_rate": 5.928148952349631e-06, "loss": 2.5365, "step": 3947 }, { "epoch": 0.47, "learning_rate": 5.926176107258265e-06, "loss": 2.7332, "step": 3948 }, { "epoch": 0.47, "learning_rate": 5.924203112840832e-06, "loss": 2.5406, "step": 3949 }, { "epoch": 0.47, "learning_rate": 5.922229969415432e-06, "loss": 2.5556, "step": 3950 }, { "epoch": 0.47, "learning_rate": 5.920256677300195e-06, "loss": 2.5723, "step": 3951 }, { "epoch": 0.47, "learning_rate": 5.918283236813272e-06, "loss": 2.5269, "step": 3952 }, { "epoch": 0.47, "learning_rate": 5.9163096482728385e-06, "loss": 2.6579, "step": 3953 }, { "epoch": 0.48, "learning_rate": 5.914335911997091e-06, "loss": 2.4878, "step": 3954 }, { "epoch": 0.48, "learning_rate": 5.912362028304254e-06, "loss": 2.5012, "step": 3955 }, { "epoch": 0.48, "learning_rate": 5.910387997512573e-06, "loss": 2.6394, "step": 3956 }, { "epoch": 0.48, "learning_rate": 5.9084138199403195e-06, "loss": 2.4923, "step": 3957 }, { "epoch": 0.48, "learning_rate": 5.906439495905787e-06, "loss": 2.5159, "step": 3958 }, { "epoch": 0.48, "learning_rate": 5.904465025727293e-06, "loss": 2.5627, "step": 3959 }, { "epoch": 0.48, "learning_rate": 5.9024904097231765e-06, "loss": 2.5482, "step": 3960 }, { "epoch": 0.48, "learning_rate": 5.9005156482118045e-06, "loss": 2.4057, "step": 3961 }, { "epoch": 0.48, "learning_rate": 5.898540741511564e-06, "loss": 2.3859, "step": 3962 }, { "epoch": 0.48, "learning_rate": 5.896565689940866e-06, "loss": 2.445, "step": 3963 }, { "epoch": 0.48, "learning_rate": 5.894590493818149e-06, "loss": 2.6075, "step": 3964 }, { "epoch": 0.48, "learning_rate": 5.8926151534618646e-06, "loss": 2.3935, "step": 3965 }, { "epoch": 0.48, "learning_rate": 5.890639669190499e-06, "loss": 2.5498, "step": 3966 }, { "epoch": 0.48, "learning_rate": 5.888664041322555e-06, "loss": 2.5568, "step": 3967 }, { "epoch": 0.48, "learning_rate": 5.8866882701765605e-06, "loss": 2.4742, "step": 3968 }, { "epoch": 0.48, "learning_rate": 5.884712356071067e-06, "loss": 2.6151, "step": 3969 }, { "epoch": 0.48, "learning_rate": 5.882736299324648e-06, "loss": 2.537, "step": 3970 }, { "epoch": 0.48, "learning_rate": 5.880760100255899e-06, "loss": 2.4412, "step": 3971 }, { "epoch": 0.48, "learning_rate": 5.8787837591834415e-06, "loss": 2.6351, "step": 3972 }, { "epoch": 0.48, "learning_rate": 5.876807276425918e-06, "loss": 2.4655, "step": 3973 }, { "epoch": 0.48, "learning_rate": 5.8748306523019925e-06, "loss": 2.7257, "step": 3974 }, { "epoch": 0.48, "learning_rate": 5.872853887130356e-06, "loss": 2.6065, "step": 3975 }, { "epoch": 0.48, "learning_rate": 5.870876981229716e-06, "loss": 2.6387, "step": 3976 }, { "epoch": 0.48, "learning_rate": 5.86889993491881e-06, "loss": 2.4923, "step": 3977 }, { "epoch": 0.48, "learning_rate": 5.866922748516392e-06, "loss": 2.6374, "step": 3978 }, { "epoch": 0.48, "learning_rate": 5.864945422341242e-06, "loss": 2.4061, "step": 3979 }, { "epoch": 0.48, "learning_rate": 5.86296795671216e-06, "loss": 2.4448, "step": 3980 }, { "epoch": 0.48, "learning_rate": 5.860990351947973e-06, "loss": 2.5263, "step": 3981 }, { "epoch": 0.48, "learning_rate": 5.859012608367523e-06, "loss": 2.4387, "step": 3982 }, { "epoch": 0.48, "learning_rate": 5.8570347262896835e-06, "loss": 2.5369, "step": 3983 }, { "epoch": 0.48, "learning_rate": 5.855056706033343e-06, "loss": 2.3639, "step": 3984 }, { "epoch": 0.48, "learning_rate": 5.853078547917415e-06, "loss": 2.5387, "step": 3985 }, { "epoch": 0.48, "learning_rate": 5.851100252260835e-06, "loss": 2.4705, "step": 3986 }, { "epoch": 0.48, "learning_rate": 5.849121819382562e-06, "loss": 2.4171, "step": 3987 }, { "epoch": 0.48, "learning_rate": 5.847143249601575e-06, "loss": 2.2717, "step": 3988 }, { "epoch": 0.48, "learning_rate": 5.845164543236876e-06, "loss": 2.5776, "step": 3989 }, { "epoch": 0.48, "learning_rate": 5.84318570060749e-06, "loss": 2.5797, "step": 3990 }, { "epoch": 0.48, "learning_rate": 5.841206722032463e-06, "loss": 2.5699, "step": 3991 }, { "epoch": 0.48, "learning_rate": 5.839227607830862e-06, "loss": 2.5221, "step": 3992 }, { "epoch": 0.48, "learning_rate": 5.837248358321775e-06, "loss": 2.3332, "step": 3993 }, { "epoch": 0.48, "learning_rate": 5.835268973824319e-06, "loss": 2.5413, "step": 3994 }, { "epoch": 0.48, "learning_rate": 5.833289454657623e-06, "loss": 2.6294, "step": 3995 }, { "epoch": 0.48, "learning_rate": 5.831309801140841e-06, "loss": 2.4566, "step": 3996 }, { "epoch": 0.48, "learning_rate": 5.829330013593154e-06, "loss": 2.6098, "step": 3997 }, { "epoch": 0.48, "learning_rate": 5.827350092333758e-06, "loss": 2.5004, "step": 3998 }, { "epoch": 0.48, "learning_rate": 5.825370037681872e-06, "loss": 2.6004, "step": 3999 }, { "epoch": 0.48, "learning_rate": 5.82338984995674e-06, "loss": 2.4355, "step": 4000 }, { "epoch": 0.48, "learning_rate": 5.821409529477624e-06, "loss": 2.4033, "step": 4001 }, { "epoch": 0.48, "learning_rate": 5.819429076563805e-06, "loss": 2.3989, "step": 4002 }, { "epoch": 0.48, "learning_rate": 5.817448491534594e-06, "loss": 2.5317, "step": 4003 }, { "epoch": 0.48, "learning_rate": 5.815467774709314e-06, "loss": 2.556, "step": 4004 }, { "epoch": 0.48, "learning_rate": 5.813486926407315e-06, "loss": 2.5343, "step": 4005 }, { "epoch": 0.48, "learning_rate": 5.811505946947967e-06, "loss": 2.5064, "step": 4006 }, { "epoch": 0.48, "learning_rate": 5.809524836650658e-06, "loss": 2.4374, "step": 4007 }, { "epoch": 0.48, "learning_rate": 5.807543595834799e-06, "loss": 2.5041, "step": 4008 }, { "epoch": 0.48, "learning_rate": 5.805562224819827e-06, "loss": 2.4426, "step": 4009 }, { "epoch": 0.48, "learning_rate": 5.803580723925193e-06, "loss": 2.459, "step": 4010 }, { "epoch": 0.48, "learning_rate": 5.801599093470372e-06, "loss": 2.5747, "step": 4011 }, { "epoch": 0.48, "learning_rate": 5.799617333774861e-06, "loss": 2.5783, "step": 4012 }, { "epoch": 0.48, "learning_rate": 5.7976354451581715e-06, "loss": 2.5484, "step": 4013 }, { "epoch": 0.48, "learning_rate": 5.795653427939846e-06, "loss": 2.4644, "step": 4014 }, { "epoch": 0.48, "learning_rate": 5.793671282439439e-06, "loss": 2.5731, "step": 4015 }, { "epoch": 0.48, "learning_rate": 5.791689008976531e-06, "loss": 2.4201, "step": 4016 }, { "epoch": 0.48, "learning_rate": 5.78970660787072e-06, "loss": 2.7292, "step": 4017 }, { "epoch": 0.48, "learning_rate": 5.787724079441626e-06, "loss": 2.5944, "step": 4018 }, { "epoch": 0.48, "learning_rate": 5.7857414240088895e-06, "loss": 2.5921, "step": 4019 }, { "epoch": 0.48, "learning_rate": 5.783758641892172e-06, "loss": 2.5541, "step": 4020 }, { "epoch": 0.48, "learning_rate": 5.7817757334111526e-06, "loss": 2.5021, "step": 4021 }, { "epoch": 0.48, "learning_rate": 5.779792698885534e-06, "loss": 2.6369, "step": 4022 }, { "epoch": 0.48, "learning_rate": 5.777809538635039e-06, "loss": 2.415, "step": 4023 }, { "epoch": 0.48, "learning_rate": 5.775826252979409e-06, "loss": 2.5949, "step": 4024 }, { "epoch": 0.48, "learning_rate": 5.773842842238404e-06, "loss": 2.5123, "step": 4025 }, { "epoch": 0.48, "learning_rate": 5.771859306731809e-06, "loss": 2.6106, "step": 4026 }, { "epoch": 0.48, "learning_rate": 5.769875646779428e-06, "loss": 2.4634, "step": 4027 }, { "epoch": 0.48, "learning_rate": 5.767891862701081e-06, "loss": 2.5433, "step": 4028 }, { "epoch": 0.48, "learning_rate": 5.765907954816612e-06, "loss": 2.5971, "step": 4029 }, { "epoch": 0.48, "learning_rate": 5.7639239234458846e-06, "loss": 2.5318, "step": 4030 }, { "epoch": 0.48, "learning_rate": 5.7619397689087775e-06, "loss": 2.6506, "step": 4031 }, { "epoch": 0.48, "learning_rate": 5.759955491525196e-06, "loss": 2.64, "step": 4032 }, { "epoch": 0.48, "learning_rate": 5.7579710916150645e-06, "loss": 2.5451, "step": 4033 }, { "epoch": 0.48, "learning_rate": 5.755986569498321e-06, "loss": 2.587, "step": 4034 }, { "epoch": 0.48, "learning_rate": 5.754001925494929e-06, "loss": 2.5761, "step": 4035 }, { "epoch": 0.48, "learning_rate": 5.7520171599248704e-06, "loss": 2.6311, "step": 4036 }, { "epoch": 0.48, "learning_rate": 5.750032273108145e-06, "loss": 2.4299, "step": 4037 }, { "epoch": 0.49, "learning_rate": 5.748047265364773e-06, "loss": 2.536, "step": 4038 }, { "epoch": 0.49, "learning_rate": 5.746062137014795e-06, "loss": 2.4225, "step": 4039 }, { "epoch": 0.49, "learning_rate": 5.744076888378272e-06, "loss": 2.557, "step": 4040 }, { "epoch": 0.49, "learning_rate": 5.7420915197752815e-06, "loss": 2.5416, "step": 4041 }, { "epoch": 0.49, "learning_rate": 5.740106031525919e-06, "loss": 2.4537, "step": 4042 }, { "epoch": 0.49, "learning_rate": 5.738120423950306e-06, "loss": 2.5181, "step": 4043 }, { "epoch": 0.49, "learning_rate": 5.73613469736858e-06, "loss": 2.635, "step": 4044 }, { "epoch": 0.49, "learning_rate": 5.734148852100892e-06, "loss": 2.4326, "step": 4045 }, { "epoch": 0.49, "learning_rate": 5.732162888467421e-06, "loss": 2.5944, "step": 4046 }, { "epoch": 0.49, "learning_rate": 5.73017680678836e-06, "loss": 2.463, "step": 4047 }, { "epoch": 0.49, "learning_rate": 5.728190607383921e-06, "loss": 2.5032, "step": 4048 }, { "epoch": 0.49, "learning_rate": 5.726204290574336e-06, "loss": 2.3934, "step": 4049 }, { "epoch": 0.49, "learning_rate": 5.724217856679859e-06, "loss": 2.5912, "step": 4050 }, { "epoch": 0.49, "learning_rate": 5.722231306020758e-06, "loss": 2.6152, "step": 4051 }, { "epoch": 0.49, "learning_rate": 5.7202446389173225e-06, "loss": 2.5514, "step": 4052 }, { "epoch": 0.49, "learning_rate": 5.718257855689859e-06, "loss": 2.5303, "step": 4053 }, { "epoch": 0.49, "learning_rate": 5.7162709566586925e-06, "loss": 2.496, "step": 4054 }, { "epoch": 0.49, "learning_rate": 5.71428394214417e-06, "loss": 2.6053, "step": 4055 }, { "epoch": 0.49, "learning_rate": 5.712296812466657e-06, "loss": 2.6862, "step": 4056 }, { "epoch": 0.49, "learning_rate": 5.710309567946531e-06, "loss": 2.4729, "step": 4057 }, { "epoch": 0.49, "learning_rate": 5.708322208904196e-06, "loss": 2.516, "step": 4058 }, { "epoch": 0.49, "learning_rate": 5.706334735660069e-06, "loss": 2.63, "step": 4059 }, { "epoch": 0.49, "learning_rate": 5.704347148534589e-06, "loss": 2.5354, "step": 4060 }, { "epoch": 0.49, "learning_rate": 5.702359447848212e-06, "loss": 2.4654, "step": 4061 }, { "epoch": 0.49, "learning_rate": 5.70037163392141e-06, "loss": 2.5069, "step": 4062 }, { "epoch": 0.49, "learning_rate": 5.6983837070746785e-06, "loss": 2.6844, "step": 4063 }, { "epoch": 0.49, "learning_rate": 5.696395667628526e-06, "loss": 2.5196, "step": 4064 }, { "epoch": 0.49, "learning_rate": 5.694407515903482e-06, "loss": 2.734, "step": 4065 }, { "epoch": 0.49, "learning_rate": 5.692419252220091e-06, "loss": 2.6266, "step": 4066 }, { "epoch": 0.49, "learning_rate": 5.690430876898923e-06, "loss": 2.5426, "step": 4067 }, { "epoch": 0.49, "learning_rate": 5.688442390260559e-06, "loss": 2.5827, "step": 4068 }, { "epoch": 0.49, "learning_rate": 5.686453792625598e-06, "loss": 2.4421, "step": 4069 }, { "epoch": 0.49, "learning_rate": 5.6844650843146595e-06, "loss": 2.6865, "step": 4070 }, { "epoch": 0.49, "learning_rate": 5.68247626564838e-06, "loss": 2.6414, "step": 4071 }, { "epoch": 0.49, "learning_rate": 5.6804873369474155e-06, "loss": 2.6358, "step": 4072 }, { "epoch": 0.49, "learning_rate": 5.678498298532437e-06, "loss": 2.6106, "step": 4073 }, { "epoch": 0.49, "learning_rate": 5.6765091507241345e-06, "loss": 2.5209, "step": 4074 }, { "epoch": 0.49, "learning_rate": 5.674519893843216e-06, "loss": 2.6547, "step": 4075 }, { "epoch": 0.49, "learning_rate": 5.672530528210405e-06, "loss": 2.5692, "step": 4076 }, { "epoch": 0.49, "learning_rate": 5.6705410541464455e-06, "loss": 2.5473, "step": 4077 }, { "epoch": 0.49, "learning_rate": 5.668551471972097e-06, "loss": 2.6338, "step": 4078 }, { "epoch": 0.49, "learning_rate": 5.666561782008137e-06, "loss": 2.5355, "step": 4079 }, { "epoch": 0.49, "learning_rate": 5.664571984575362e-06, "loss": 2.69, "step": 4080 }, { "epoch": 0.49, "learning_rate": 5.662582079994583e-06, "loss": 2.3956, "step": 4081 }, { "epoch": 0.49, "learning_rate": 5.660592068586629e-06, "loss": 2.4715, "step": 4082 }, { "epoch": 0.49, "learning_rate": 5.658601950672347e-06, "loss": 2.4634, "step": 4083 }, { "epoch": 0.49, "learning_rate": 5.656611726572601e-06, "loss": 2.4539, "step": 4084 }, { "epoch": 0.49, "learning_rate": 5.654621396608272e-06, "loss": 2.6542, "step": 4085 }, { "epoch": 0.49, "learning_rate": 5.65263096110026e-06, "loss": 2.5361, "step": 4086 }, { "epoch": 0.49, "learning_rate": 5.650640420369475e-06, "loss": 2.5117, "step": 4087 }, { "epoch": 0.49, "learning_rate": 5.648649774736855e-06, "loss": 2.4335, "step": 4088 }, { "epoch": 0.49, "learning_rate": 5.646659024523346e-06, "loss": 2.4316, "step": 4089 }, { "epoch": 0.49, "learning_rate": 5.644668170049913e-06, "loss": 2.6245, "step": 4090 }, { "epoch": 0.49, "learning_rate": 5.642677211637542e-06, "loss": 2.4428, "step": 4091 }, { "epoch": 0.49, "learning_rate": 5.640686149607228e-06, "loss": 2.6339, "step": 4092 }, { "epoch": 0.49, "learning_rate": 5.638694984279991e-06, "loss": 2.5714, "step": 4093 }, { "epoch": 0.49, "learning_rate": 5.6367037159768625e-06, "loss": 2.6661, "step": 4094 }, { "epoch": 0.49, "learning_rate": 5.63471234501889e-06, "loss": 2.5311, "step": 4095 }, { "epoch": 0.49, "learning_rate": 5.632720871727142e-06, "loss": 2.5472, "step": 4096 }, { "epoch": 0.49, "learning_rate": 5.630729296422701e-06, "loss": 2.5339, "step": 4097 }, { "epoch": 0.49, "learning_rate": 5.628737619426664e-06, "loss": 2.6301, "step": 4098 }, { "epoch": 0.49, "learning_rate": 5.626745841060146e-06, "loss": 2.4696, "step": 4099 }, { "epoch": 0.49, "learning_rate": 5.624753961644281e-06, "loss": 2.4119, "step": 4100 }, { "epoch": 0.49, "learning_rate": 5.622761981500215e-06, "loss": 2.4492, "step": 4101 }, { "epoch": 0.49, "learning_rate": 5.620769900949113e-06, "loss": 2.5032, "step": 4102 }, { "epoch": 0.49, "learning_rate": 5.618777720312156e-06, "loss": 2.7037, "step": 4103 }, { "epoch": 0.49, "learning_rate": 5.61678543991054e-06, "loss": 2.4918, "step": 4104 }, { "epoch": 0.49, "learning_rate": 5.6147930600654755e-06, "loss": 2.4369, "step": 4105 }, { "epoch": 0.49, "learning_rate": 5.612800581098193e-06, "loss": 2.4236, "step": 4106 }, { "epoch": 0.49, "learning_rate": 5.610808003329937e-06, "loss": 2.6601, "step": 4107 }, { "epoch": 0.49, "learning_rate": 5.608815327081969e-06, "loss": 2.5355, "step": 4108 }, { "epoch": 0.49, "learning_rate": 5.606822552675564e-06, "loss": 2.5028, "step": 4109 }, { "epoch": 0.49, "learning_rate": 5.604829680432012e-06, "loss": 2.3269, "step": 4110 }, { "epoch": 0.49, "learning_rate": 5.602836710672627e-06, "loss": 2.5745, "step": 4111 }, { "epoch": 0.49, "learning_rate": 5.600843643718728e-06, "loss": 2.4346, "step": 4112 }, { "epoch": 0.49, "learning_rate": 5.598850479891653e-06, "loss": 2.5822, "step": 4113 }, { "epoch": 0.49, "learning_rate": 5.596857219512762e-06, "loss": 2.4729, "step": 4114 }, { "epoch": 0.49, "learning_rate": 5.594863862903422e-06, "loss": 2.3652, "step": 4115 }, { "epoch": 0.49, "learning_rate": 5.592870410385021e-06, "loss": 2.4995, "step": 4116 }, { "epoch": 0.49, "learning_rate": 5.590876862278959e-06, "loss": 2.6704, "step": 4117 }, { "epoch": 0.49, "learning_rate": 5.588883218906653e-06, "loss": 2.5942, "step": 4118 }, { "epoch": 0.49, "learning_rate": 5.586889480589537e-06, "loss": 2.6051, "step": 4119 }, { "epoch": 0.49, "learning_rate": 5.584895647649058e-06, "loss": 2.6485, "step": 4120 }, { "epoch": 0.5, "learning_rate": 5.582901720406677e-06, "loss": 2.5641, "step": 4121 }, { "epoch": 0.5, "learning_rate": 5.580907699183875e-06, "loss": 2.4983, "step": 4122 }, { "epoch": 0.5, "learning_rate": 5.578913584302144e-06, "loss": 2.5445, "step": 4123 }, { "epoch": 0.5, "learning_rate": 5.57691937608299e-06, "loss": 2.5767, "step": 4124 }, { "epoch": 0.5, "learning_rate": 5.574925074847939e-06, "loss": 2.6114, "step": 4125 }, { "epoch": 0.5, "learning_rate": 5.572930680918529e-06, "loss": 2.4994, "step": 4126 }, { "epoch": 0.5, "learning_rate": 5.570936194616313e-06, "loss": 2.5801, "step": 4127 }, { "epoch": 0.5, "learning_rate": 5.568941616262861e-06, "loss": 2.5797, "step": 4128 }, { "epoch": 0.5, "learning_rate": 5.566946946179753e-06, "loss": 2.5963, "step": 4129 }, { "epoch": 0.5, "learning_rate": 5.564952184688588e-06, "loss": 2.5391, "step": 4130 }, { "epoch": 0.5, "learning_rate": 5.56295733211098e-06, "loss": 2.5562, "step": 4131 }, { "epoch": 0.5, "learning_rate": 5.560962388768554e-06, "loss": 2.4871, "step": 4132 }, { "epoch": 0.5, "learning_rate": 5.5589673549829525e-06, "loss": 2.4754, "step": 4133 }, { "epoch": 0.5, "learning_rate": 5.556972231075834e-06, "loss": 2.4606, "step": 4134 }, { "epoch": 0.5, "learning_rate": 5.554977017368868e-06, "loss": 2.5276, "step": 4135 }, { "epoch": 0.5, "learning_rate": 5.552981714183738e-06, "loss": 2.5456, "step": 4136 }, { "epoch": 0.5, "learning_rate": 5.550986321842147e-06, "loss": 2.46, "step": 4137 }, { "epoch": 0.5, "learning_rate": 5.548990840665809e-06, "loss": 2.5926, "step": 4138 }, { "epoch": 0.5, "learning_rate": 5.5469952709764515e-06, "loss": 2.5604, "step": 4139 }, { "epoch": 0.5, "learning_rate": 5.5449996130958185e-06, "loss": 2.5762, "step": 4140 }, { "epoch": 0.5, "learning_rate": 5.5430038673456655e-06, "loss": 2.4994, "step": 4141 }, { "epoch": 0.5, "learning_rate": 5.5410080340477634e-06, "loss": 2.4543, "step": 4142 }, { "epoch": 0.5, "learning_rate": 5.539012113523899e-06, "loss": 2.5115, "step": 4143 }, { "epoch": 0.5, "learning_rate": 5.5370161060958726e-06, "loss": 2.5635, "step": 4144 }, { "epoch": 0.5, "learning_rate": 5.535020012085497e-06, "loss": 2.7138, "step": 4145 }, { "epoch": 0.5, "learning_rate": 5.533023831814599e-06, "loss": 2.6107, "step": 4146 }, { "epoch": 0.5, "learning_rate": 5.5310275656050195e-06, "loss": 2.4846, "step": 4147 }, { "epoch": 0.5, "learning_rate": 5.529031213778615e-06, "loss": 2.6026, "step": 4148 }, { "epoch": 0.5, "learning_rate": 5.5270347766572515e-06, "loss": 2.645, "step": 4149 }, { "epoch": 0.5, "learning_rate": 5.525038254562817e-06, "loss": 2.5704, "step": 4150 }, { "epoch": 0.5, "learning_rate": 5.523041647817204e-06, "loss": 2.5021, "step": 4151 }, { "epoch": 0.5, "learning_rate": 5.521044956742324e-06, "loss": 2.5612, "step": 4152 }, { "epoch": 0.5, "learning_rate": 5.5190481816601e-06, "loss": 2.5784, "step": 4153 }, { "epoch": 0.5, "learning_rate": 5.517051322892468e-06, "loss": 2.5125, "step": 4154 }, { "epoch": 0.5, "learning_rate": 5.515054380761382e-06, "loss": 2.6093, "step": 4155 }, { "epoch": 0.5, "learning_rate": 5.513057355588804e-06, "loss": 2.4796, "step": 4156 }, { "epoch": 0.5, "learning_rate": 5.511060247696713e-06, "loss": 2.4179, "step": 4157 }, { "epoch": 0.5, "learning_rate": 5.509063057407098e-06, "loss": 2.6826, "step": 4158 }, { "epoch": 0.5, "learning_rate": 5.507065785041963e-06, "loss": 2.652, "step": 4159 }, { "epoch": 0.5, "learning_rate": 5.505068430923327e-06, "loss": 2.5544, "step": 4160 }, { "epoch": 0.5, "learning_rate": 5.503070995373221e-06, "loss": 2.4317, "step": 4161 }, { "epoch": 0.5, "learning_rate": 5.5010734787136865e-06, "loss": 2.5095, "step": 4162 }, { "epoch": 0.5, "learning_rate": 5.499075881266784e-06, "loss": 2.5806, "step": 4163 }, { "epoch": 0.5, "learning_rate": 5.497078203354577e-06, "loss": 2.6062, "step": 4164 }, { "epoch": 0.5, "learning_rate": 5.4950804452991545e-06, "loss": 2.5624, "step": 4165 }, { "epoch": 0.5, "learning_rate": 5.4930826074226085e-06, "loss": 2.6041, "step": 4166 }, { "epoch": 0.5, "learning_rate": 5.49108469004705e-06, "loss": 2.5914, "step": 4167 }, { "epoch": 0.5, "learning_rate": 5.4890866934946e-06, "loss": 2.7266, "step": 4168 }, { "epoch": 0.5, "learning_rate": 5.487088618087391e-06, "loss": 2.4253, "step": 4169 }, { "epoch": 0.5, "learning_rate": 5.485090464147571e-06, "loss": 2.5052, "step": 4170 }, { "epoch": 0.5, "learning_rate": 5.483092231997299e-06, "loss": 2.4201, "step": 4171 }, { "epoch": 0.5, "learning_rate": 5.481093921958749e-06, "loss": 2.5636, "step": 4172 }, { "epoch": 0.5, "learning_rate": 5.479095534354103e-06, "loss": 2.6252, "step": 4173 }, { "epoch": 0.5, "learning_rate": 5.47709706950556e-06, "loss": 2.4417, "step": 4174 }, { "epoch": 0.5, "learning_rate": 5.475098527735329e-06, "loss": 2.4963, "step": 4175 }, { "epoch": 0.5, "learning_rate": 5.473099909365633e-06, "loss": 2.5189, "step": 4176 }, { "epoch": 0.5, "learning_rate": 5.471101214718704e-06, "loss": 2.5357, "step": 4177 }, { "epoch": 0.5, "learning_rate": 5.469102444116791e-06, "loss": 2.698, "step": 4178 }, { "epoch": 0.5, "learning_rate": 5.467103597882154e-06, "loss": 2.5239, "step": 4179 }, { "epoch": 0.5, "learning_rate": 5.4651046763370615e-06, "loss": 2.3852, "step": 4180 }, { "epoch": 0.5, "learning_rate": 5.463105679803798e-06, "loss": 2.434, "step": 4181 }, { "epoch": 0.5, "learning_rate": 5.461106608604658e-06, "loss": 2.5047, "step": 4182 }, { "epoch": 0.5, "learning_rate": 5.459107463061949e-06, "loss": 2.5734, "step": 4183 }, { "epoch": 0.5, "learning_rate": 5.457108243497993e-06, "loss": 2.3627, "step": 4184 }, { "epoch": 0.5, "learning_rate": 5.455108950235119e-06, "loss": 2.5102, "step": 4185 }, { "epoch": 0.5, "learning_rate": 5.45310958359567e-06, "loss": 2.5064, "step": 4186 }, { "epoch": 0.5, "learning_rate": 5.4511101439020006e-06, "loss": 2.5779, "step": 4187 }, { "epoch": 0.5, "learning_rate": 5.449110631476481e-06, "loss": 2.6646, "step": 4188 }, { "epoch": 0.5, "learning_rate": 5.4471110466414855e-06, "loss": 2.3701, "step": 4189 }, { "epoch": 0.5, "learning_rate": 5.445111389719408e-06, "loss": 2.3831, "step": 4190 }, { "epoch": 0.5, "learning_rate": 5.443111661032648e-06, "loss": 2.5394, "step": 4191 }, { "epoch": 0.5, "learning_rate": 5.44111186090362e-06, "loss": 2.6391, "step": 4192 }, { "epoch": 0.5, "learning_rate": 5.439111989654748e-06, "loss": 2.6628, "step": 4193 }, { "epoch": 0.5, "learning_rate": 5.43711204760847e-06, "loss": 2.6402, "step": 4194 }, { "epoch": 0.5, "learning_rate": 5.435112035087232e-06, "loss": 2.441, "step": 4195 }, { "epoch": 0.5, "learning_rate": 5.433111952413496e-06, "loss": 2.5556, "step": 4196 }, { "epoch": 0.5, "learning_rate": 5.431111799909728e-06, "loss": 2.568, "step": 4197 }, { "epoch": 0.5, "learning_rate": 5.429111577898415e-06, "loss": 2.6705, "step": 4198 }, { "epoch": 0.5, "learning_rate": 5.427111286702044e-06, "loss": 2.5791, "step": 4199 }, { "epoch": 0.5, "learning_rate": 5.425110926643123e-06, "loss": 2.6414, "step": 4200 }, { "epoch": 0.5, "learning_rate": 5.42311049804417e-06, "loss": 2.5155, "step": 4201 }, { "epoch": 0.5, "learning_rate": 5.421110001227705e-06, "loss": 2.4702, "step": 4202 }, { "epoch": 0.5, "learning_rate": 5.41910943651627e-06, "loss": 2.3799, "step": 4203 }, { "epoch": 0.51, "learning_rate": 5.417108804232409e-06, "loss": 2.586, "step": 4204 }, { "epoch": 0.51, "learning_rate": 5.415108104698687e-06, "loss": 2.6274, "step": 4205 }, { "epoch": 0.51, "learning_rate": 5.413107338237667e-06, "loss": 2.672, "step": 4206 }, { "epoch": 0.51, "learning_rate": 5.411106505171936e-06, "loss": 2.4756, "step": 4207 }, { "epoch": 0.51, "learning_rate": 5.409105605824082e-06, "loss": 2.6223, "step": 4208 }, { "epoch": 0.51, "learning_rate": 5.40710464051671e-06, "loss": 2.4368, "step": 4209 }, { "epoch": 0.51, "learning_rate": 5.405103609572427e-06, "loss": 2.5212, "step": 4210 }, { "epoch": 0.51, "learning_rate": 5.403102513313862e-06, "loss": 2.3784, "step": 4211 }, { "epoch": 0.51, "learning_rate": 5.4011013520636466e-06, "loss": 2.521, "step": 4212 }, { "epoch": 0.51, "learning_rate": 5.399100126144426e-06, "loss": 2.3947, "step": 4213 }, { "epoch": 0.51, "learning_rate": 5.3970988358788565e-06, "loss": 2.5648, "step": 4214 }, { "epoch": 0.51, "learning_rate": 5.395097481589599e-06, "loss": 2.4612, "step": 4215 }, { "epoch": 0.51, "learning_rate": 5.393096063599333e-06, "loss": 2.5685, "step": 4216 }, { "epoch": 0.51, "learning_rate": 5.391094582230744e-06, "loss": 2.6409, "step": 4217 }, { "epoch": 0.51, "learning_rate": 5.389093037806524e-06, "loss": 2.3948, "step": 4218 }, { "epoch": 0.51, "learning_rate": 5.387091430649385e-06, "loss": 2.4082, "step": 4219 }, { "epoch": 0.51, "learning_rate": 5.385089761082039e-06, "loss": 2.4952, "step": 4220 }, { "epoch": 0.51, "learning_rate": 5.383088029427214e-06, "loss": 2.5713, "step": 4221 }, { "epoch": 0.51, "learning_rate": 5.381086236007647e-06, "loss": 2.4298, "step": 4222 }, { "epoch": 0.51, "learning_rate": 5.379084381146082e-06, "loss": 2.4903, "step": 4223 }, { "epoch": 0.51, "learning_rate": 5.377082465165277e-06, "loss": 2.6372, "step": 4224 }, { "epoch": 0.51, "learning_rate": 5.375080488387998e-06, "loss": 2.6019, "step": 4225 }, { "epoch": 0.51, "learning_rate": 5.3730784511370204e-06, "loss": 2.5179, "step": 4226 }, { "epoch": 0.51, "learning_rate": 5.371076353735132e-06, "loss": 2.6131, "step": 4227 }, { "epoch": 0.51, "learning_rate": 5.3690741965051255e-06, "loss": 2.516, "step": 4228 }, { "epoch": 0.51, "learning_rate": 5.367071979769805e-06, "loss": 2.6027, "step": 4229 }, { "epoch": 0.51, "learning_rate": 5.3650697038519885e-06, "loss": 2.4422, "step": 4230 }, { "epoch": 0.51, "learning_rate": 5.363067369074498e-06, "loss": 2.4694, "step": 4231 }, { "epoch": 0.51, "learning_rate": 5.361064975760166e-06, "loss": 2.6596, "step": 4232 }, { "epoch": 0.51, "learning_rate": 5.35906252423184e-06, "loss": 2.5504, "step": 4233 }, { "epoch": 0.51, "learning_rate": 5.357060014812367e-06, "loss": 2.5195, "step": 4234 }, { "epoch": 0.51, "learning_rate": 5.355057447824612e-06, "loss": 2.4864, "step": 4235 }, { "epoch": 0.51, "learning_rate": 5.353054823591446e-06, "loss": 2.5911, "step": 4236 }, { "epoch": 0.51, "learning_rate": 5.351052142435747e-06, "loss": 2.5579, "step": 4237 }, { "epoch": 0.51, "learning_rate": 5.349049404680407e-06, "loss": 2.5381, "step": 4238 }, { "epoch": 0.51, "learning_rate": 5.347046610648324e-06, "loss": 2.4927, "step": 4239 }, { "epoch": 0.51, "learning_rate": 5.345043760662406e-06, "loss": 2.5695, "step": 4240 }, { "epoch": 0.51, "learning_rate": 5.343040855045567e-06, "loss": 2.6301, "step": 4241 }, { "epoch": 0.51, "learning_rate": 5.341037894120737e-06, "loss": 2.5352, "step": 4242 }, { "epoch": 0.51, "learning_rate": 5.339034878210846e-06, "loss": 2.4195, "step": 4243 }, { "epoch": 0.51, "learning_rate": 5.3370318076388405e-06, "loss": 2.6437, "step": 4244 }, { "epoch": 0.51, "learning_rate": 5.335028682727672e-06, "loss": 2.734, "step": 4245 }, { "epoch": 0.51, "learning_rate": 5.333025503800301e-06, "loss": 2.4667, "step": 4246 }, { "epoch": 0.51, "learning_rate": 5.3310222711796975e-06, "loss": 2.4553, "step": 4247 }, { "epoch": 0.51, "learning_rate": 5.329018985188841e-06, "loss": 2.4828, "step": 4248 }, { "epoch": 0.51, "learning_rate": 5.327015646150716e-06, "loss": 2.4915, "step": 4249 }, { "epoch": 0.51, "learning_rate": 5.32501225438832e-06, "loss": 2.4959, "step": 4250 }, { "epoch": 0.51, "learning_rate": 5.323008810224657e-06, "loss": 2.4616, "step": 4251 }, { "epoch": 0.51, "learning_rate": 5.3210053139827374e-06, "loss": 2.3947, "step": 4252 }, { "epoch": 0.51, "learning_rate": 5.319001765985585e-06, "loss": 2.5313, "step": 4253 }, { "epoch": 0.51, "learning_rate": 5.3169981665562275e-06, "loss": 2.3548, "step": 4254 }, { "epoch": 0.51, "learning_rate": 5.314994516017703e-06, "loss": 2.7625, "step": 4255 }, { "epoch": 0.51, "learning_rate": 5.3129908146930565e-06, "loss": 2.6501, "step": 4256 }, { "epoch": 0.51, "learning_rate": 5.310987062905343e-06, "loss": 2.5438, "step": 4257 }, { "epoch": 0.51, "learning_rate": 5.308983260977622e-06, "loss": 2.5125, "step": 4258 }, { "epoch": 0.51, "learning_rate": 5.306979409232967e-06, "loss": 2.4539, "step": 4259 }, { "epoch": 0.51, "learning_rate": 5.304975507994453e-06, "loss": 2.6234, "step": 4260 }, { "epoch": 0.51, "learning_rate": 5.302971557585169e-06, "loss": 2.4804, "step": 4261 }, { "epoch": 0.51, "learning_rate": 5.300967558328208e-06, "loss": 2.6117, "step": 4262 }, { "epoch": 0.51, "learning_rate": 5.298963510546673e-06, "loss": 2.5833, "step": 4263 }, { "epoch": 0.51, "learning_rate": 5.296959414563671e-06, "loss": 2.5299, "step": 4264 }, { "epoch": 0.51, "learning_rate": 5.2949552707023215e-06, "loss": 2.5245, "step": 4265 }, { "epoch": 0.51, "learning_rate": 5.29295107928575e-06, "loss": 2.6001, "step": 4266 }, { "epoch": 0.51, "learning_rate": 5.290946840637089e-06, "loss": 2.4249, "step": 4267 }, { "epoch": 0.51, "learning_rate": 5.288942555079479e-06, "loss": 2.5154, "step": 4268 }, { "epoch": 0.51, "learning_rate": 5.286938222936069e-06, "loss": 2.4015, "step": 4269 }, { "epoch": 0.51, "learning_rate": 5.284933844530013e-06, "loss": 2.6337, "step": 4270 }, { "epoch": 0.51, "learning_rate": 5.282929420184474e-06, "loss": 2.6177, "step": 4271 }, { "epoch": 0.51, "learning_rate": 5.2809249502226255e-06, "loss": 2.5195, "step": 4272 }, { "epoch": 0.51, "learning_rate": 5.278920434967643e-06, "loss": 2.5401, "step": 4273 }, { "epoch": 0.51, "learning_rate": 5.2769158747427115e-06, "loss": 2.5632, "step": 4274 }, { "epoch": 0.51, "learning_rate": 5.274911269871024e-06, "loss": 2.5878, "step": 4275 }, { "epoch": 0.51, "learning_rate": 5.27290662067578e-06, "loss": 2.3144, "step": 4276 }, { "epoch": 0.51, "learning_rate": 5.270901927480186e-06, "loss": 2.4555, "step": 4277 }, { "epoch": 0.51, "learning_rate": 5.268897190607457e-06, "loss": 2.5036, "step": 4278 }, { "epoch": 0.51, "learning_rate": 5.266892410380814e-06, "loss": 2.3945, "step": 4279 }, { "epoch": 0.51, "learning_rate": 5.264887587123483e-06, "loss": 2.3634, "step": 4280 }, { "epoch": 0.51, "learning_rate": 5.262882721158699e-06, "loss": 2.5458, "step": 4281 }, { "epoch": 0.51, "learning_rate": 5.260877812809704e-06, "loss": 2.4633, "step": 4282 }, { "epoch": 0.51, "learning_rate": 5.2588728623997485e-06, "loss": 2.6636, "step": 4283 }, { "epoch": 0.51, "learning_rate": 5.256867870252087e-06, "loss": 2.5437, "step": 4284 }, { "epoch": 0.51, "learning_rate": 5.25486283668998e-06, "loss": 2.6446, "step": 4285 }, { "epoch": 0.51, "learning_rate": 5.2528577620366986e-06, "loss": 2.5654, "step": 4286 }, { "epoch": 0.52, "learning_rate": 5.250852646615514e-06, "loss": 2.5356, "step": 4287 }, { "epoch": 0.52, "learning_rate": 5.248847490749711e-06, "loss": 2.5357, "step": 4288 }, { "epoch": 0.52, "learning_rate": 5.246842294762581e-06, "loss": 2.5901, "step": 4289 }, { "epoch": 0.52, "learning_rate": 5.244837058977413e-06, "loss": 2.5917, "step": 4290 }, { "epoch": 0.52, "learning_rate": 5.242831783717514e-06, "loss": 2.5189, "step": 4291 }, { "epoch": 0.52, "learning_rate": 5.240826469306187e-06, "loss": 2.4242, "step": 4292 }, { "epoch": 0.52, "learning_rate": 5.2388211160667475e-06, "loss": 2.508, "step": 4293 }, { "epoch": 0.52, "learning_rate": 5.236815724322516e-06, "loss": 2.4792, "step": 4294 }, { "epoch": 0.52, "learning_rate": 5.23481029439682e-06, "loss": 2.725, "step": 4295 }, { "epoch": 0.52, "learning_rate": 5.232804826612993e-06, "loss": 2.4685, "step": 4296 }, { "epoch": 0.52, "learning_rate": 5.23079932129437e-06, "loss": 2.5457, "step": 4297 }, { "epoch": 0.52, "learning_rate": 5.228793778764297e-06, "loss": 2.5421, "step": 4298 }, { "epoch": 0.52, "learning_rate": 5.226788199346127e-06, "loss": 2.5129, "step": 4299 }, { "epoch": 0.52, "learning_rate": 5.224782583363215e-06, "loss": 2.5694, "step": 4300 }, { "epoch": 0.52, "learning_rate": 5.222776931138926e-06, "loss": 2.5762, "step": 4301 }, { "epoch": 0.52, "learning_rate": 5.220771242996624e-06, "loss": 2.5664, "step": 4302 }, { "epoch": 0.52, "learning_rate": 5.2187655192596875e-06, "loss": 2.4692, "step": 4303 }, { "epoch": 0.52, "learning_rate": 5.216759760251493e-06, "loss": 2.5931, "step": 4304 }, { "epoch": 0.52, "learning_rate": 5.214753966295429e-06, "loss": 2.5956, "step": 4305 }, { "epoch": 0.52, "learning_rate": 5.2127481377148845e-06, "loss": 2.4225, "step": 4306 }, { "epoch": 0.52, "learning_rate": 5.210742274833259e-06, "loss": 2.4239, "step": 4307 }, { "epoch": 0.52, "learning_rate": 5.208736377973954e-06, "loss": 2.3057, "step": 4308 }, { "epoch": 0.52, "learning_rate": 5.206730447460377e-06, "loss": 2.5247, "step": 4309 }, { "epoch": 0.52, "learning_rate": 5.204724483615941e-06, "loss": 2.3896, "step": 4310 }, { "epoch": 0.52, "learning_rate": 5.202718486764065e-06, "loss": 2.3684, "step": 4311 }, { "epoch": 0.52, "learning_rate": 5.200712457228173e-06, "loss": 2.5044, "step": 4312 }, { "epoch": 0.52, "learning_rate": 5.198706395331695e-06, "loss": 2.5967, "step": 4313 }, { "epoch": 0.52, "learning_rate": 5.1967003013980655e-06, "loss": 2.5187, "step": 4314 }, { "epoch": 0.52, "learning_rate": 5.194694175750723e-06, "loss": 2.6281, "step": 4315 }, { "epoch": 0.52, "learning_rate": 5.1926880187131134e-06, "loss": 2.3195, "step": 4316 }, { "epoch": 0.52, "learning_rate": 5.190681830608686e-06, "loss": 2.5504, "step": 4317 }, { "epoch": 0.52, "learning_rate": 5.188675611760896e-06, "loss": 2.3847, "step": 4318 }, { "epoch": 0.52, "learning_rate": 5.186669362493204e-06, "loss": 2.5551, "step": 4319 }, { "epoch": 0.52, "learning_rate": 5.184663083129073e-06, "loss": 2.5166, "step": 4320 }, { "epoch": 0.52, "learning_rate": 5.182656773991973e-06, "loss": 2.4939, "step": 4321 }, { "epoch": 0.52, "learning_rate": 5.18065043540538e-06, "loss": 2.5114, "step": 4322 }, { "epoch": 0.52, "learning_rate": 5.178644067692771e-06, "loss": 2.4324, "step": 4323 }, { "epoch": 0.52, "learning_rate": 5.176637671177631e-06, "loss": 2.5323, "step": 4324 }, { "epoch": 0.52, "learning_rate": 5.174631246183449e-06, "loss": 2.5382, "step": 4325 }, { "epoch": 0.52, "learning_rate": 5.172624793033717e-06, "loss": 2.5209, "step": 4326 }, { "epoch": 0.52, "learning_rate": 5.170618312051934e-06, "loss": 2.435, "step": 4327 }, { "epoch": 0.52, "learning_rate": 5.168611803561599e-06, "loss": 2.577, "step": 4328 }, { "epoch": 0.52, "learning_rate": 5.166605267886222e-06, "loss": 2.3858, "step": 4329 }, { "epoch": 0.52, "learning_rate": 5.164598705349313e-06, "loss": 2.429, "step": 4330 }, { "epoch": 0.52, "learning_rate": 5.162592116274386e-06, "loss": 2.5314, "step": 4331 }, { "epoch": 0.52, "learning_rate": 5.160585500984962e-06, "loss": 2.548, "step": 4332 }, { "epoch": 0.52, "learning_rate": 5.158578859804562e-06, "loss": 2.5639, "step": 4333 }, { "epoch": 0.52, "learning_rate": 5.156572193056718e-06, "loss": 2.6438, "step": 4334 }, { "epoch": 0.52, "learning_rate": 5.1545655010649605e-06, "loss": 2.5023, "step": 4335 }, { "epoch": 0.52, "learning_rate": 5.152558784152824e-06, "loss": 2.6907, "step": 4336 }, { "epoch": 0.52, "learning_rate": 5.150552042643851e-06, "loss": 2.496, "step": 4337 }, { "epoch": 0.52, "learning_rate": 5.148545276861583e-06, "loss": 2.7109, "step": 4338 }, { "epoch": 0.52, "learning_rate": 5.146538487129571e-06, "loss": 2.3729, "step": 4339 }, { "epoch": 0.52, "learning_rate": 5.144531673771364e-06, "loss": 2.55, "step": 4340 }, { "epoch": 0.52, "learning_rate": 5.14252483711052e-06, "loss": 2.4161, "step": 4341 }, { "epoch": 0.52, "learning_rate": 5.140517977470597e-06, "loss": 2.4703, "step": 4342 }, { "epoch": 0.52, "learning_rate": 5.138511095175158e-06, "loss": 2.5521, "step": 4343 }, { "epoch": 0.52, "learning_rate": 5.136504190547772e-06, "loss": 2.4457, "step": 4344 }, { "epoch": 0.52, "learning_rate": 5.134497263912007e-06, "loss": 2.6243, "step": 4345 }, { "epoch": 0.52, "learning_rate": 5.132490315591437e-06, "loss": 2.6425, "step": 4346 }, { "epoch": 0.52, "learning_rate": 5.130483345909642e-06, "loss": 2.5647, "step": 4347 }, { "epoch": 0.52, "learning_rate": 5.1284763551901995e-06, "loss": 2.499, "step": 4348 }, { "epoch": 0.52, "learning_rate": 5.126469343756695e-06, "loss": 2.6119, "step": 4349 }, { "epoch": 0.52, "learning_rate": 5.124462311932719e-06, "loss": 2.4121, "step": 4350 }, { "epoch": 0.52, "learning_rate": 5.1224552600418566e-06, "loss": 2.5365, "step": 4351 }, { "epoch": 0.52, "learning_rate": 5.1204481884077075e-06, "loss": 2.4647, "step": 4352 }, { "epoch": 0.52, "learning_rate": 5.118441097353867e-06, "loss": 2.6164, "step": 4353 }, { "epoch": 0.52, "learning_rate": 5.116433987203934e-06, "loss": 2.4972, "step": 4354 }, { "epoch": 0.52, "learning_rate": 5.114426858281515e-06, "loss": 2.5168, "step": 4355 }, { "epoch": 0.52, "learning_rate": 5.112419710910213e-06, "loss": 2.5557, "step": 4356 }, { "epoch": 0.52, "learning_rate": 5.110412545413641e-06, "loss": 2.5062, "step": 4357 }, { "epoch": 0.52, "learning_rate": 5.10840536211541e-06, "loss": 2.7639, "step": 4358 }, { "epoch": 0.52, "learning_rate": 5.106398161339135e-06, "loss": 2.5096, "step": 4359 }, { "epoch": 0.52, "learning_rate": 5.104390943408434e-06, "loss": 2.4705, "step": 4360 }, { "epoch": 0.52, "learning_rate": 5.102383708646929e-06, "loss": 2.6436, "step": 4361 }, { "epoch": 0.52, "learning_rate": 5.100376457378243e-06, "loss": 2.453, "step": 4362 }, { "epoch": 0.52, "learning_rate": 5.098369189926003e-06, "loss": 2.6943, "step": 4363 }, { "epoch": 0.52, "learning_rate": 5.096361906613836e-06, "loss": 2.3764, "step": 4364 }, { "epoch": 0.52, "learning_rate": 5.094354607765374e-06, "loss": 2.6486, "step": 4365 }, { "epoch": 0.52, "learning_rate": 5.092347293704253e-06, "loss": 2.6558, "step": 4366 }, { "epoch": 0.52, "learning_rate": 5.090339964754108e-06, "loss": 2.4995, "step": 4367 }, { "epoch": 0.52, "learning_rate": 5.0883326212385775e-06, "loss": 2.4483, "step": 4368 }, { "epoch": 0.52, "learning_rate": 5.086325263481303e-06, "loss": 2.6501, "step": 4369 }, { "epoch": 0.52, "learning_rate": 5.084317891805928e-06, "loss": 2.5364, "step": 4370 }, { "epoch": 0.53, "learning_rate": 5.0823105065360976e-06, "loss": 2.3887, "step": 4371 }, { "epoch": 0.53, "learning_rate": 5.080303107995461e-06, "loss": 2.6551, "step": 4372 }, { "epoch": 0.53, "learning_rate": 5.078295696507668e-06, "loss": 2.5312, "step": 4373 }, { "epoch": 0.53, "learning_rate": 5.076288272396369e-06, "loss": 2.6157, "step": 4374 }, { "epoch": 0.53, "learning_rate": 5.07428083598522e-06, "loss": 2.6937, "step": 4375 }, { "epoch": 0.53, "learning_rate": 5.072273387597877e-06, "loss": 2.6244, "step": 4376 }, { "epoch": 0.53, "learning_rate": 5.070265927557997e-06, "loss": 2.6403, "step": 4377 }, { "epoch": 0.53, "learning_rate": 5.068258456189241e-06, "loss": 2.5331, "step": 4378 }, { "epoch": 0.53, "learning_rate": 5.066250973815271e-06, "loss": 2.6135, "step": 4379 }, { "epoch": 0.53, "learning_rate": 5.064243480759749e-06, "loss": 2.5462, "step": 4380 }, { "epoch": 0.53, "learning_rate": 5.0622359773463416e-06, "loss": 2.407, "step": 4381 }, { "epoch": 0.53, "learning_rate": 5.0602284638987145e-06, "loss": 2.2708, "step": 4382 }, { "epoch": 0.53, "learning_rate": 5.058220940740537e-06, "loss": 2.505, "step": 4383 }, { "epoch": 0.53, "learning_rate": 5.05621340819548e-06, "loss": 2.5065, "step": 4384 }, { "epoch": 0.53, "learning_rate": 5.0542058665872155e-06, "loss": 2.3628, "step": 4385 }, { "epoch": 0.53, "learning_rate": 5.052198316239414e-06, "loss": 2.6275, "step": 4386 }, { "epoch": 0.53, "learning_rate": 5.050190757475751e-06, "loss": 2.6426, "step": 4387 }, { "epoch": 0.53, "learning_rate": 5.048183190619904e-06, "loss": 2.5916, "step": 4388 }, { "epoch": 0.53, "learning_rate": 5.04617561599555e-06, "loss": 2.6117, "step": 4389 }, { "epoch": 0.53, "learning_rate": 5.0441680339263655e-06, "loss": 2.5506, "step": 4390 }, { "epoch": 0.53, "learning_rate": 5.042160444736032e-06, "loss": 2.3557, "step": 4391 }, { "epoch": 0.53, "learning_rate": 5.040152848748228e-06, "loss": 2.4903, "step": 4392 }, { "epoch": 0.53, "learning_rate": 5.038145246286636e-06, "loss": 2.4843, "step": 4393 }, { "epoch": 0.53, "learning_rate": 5.036137637674943e-06, "loss": 2.6772, "step": 4394 }, { "epoch": 0.53, "learning_rate": 5.034130023236827e-06, "loss": 2.5635, "step": 4395 }, { "epoch": 0.53, "learning_rate": 5.032122403295977e-06, "loss": 2.6972, "step": 4396 }, { "epoch": 0.53, "learning_rate": 5.030114778176077e-06, "loss": 2.4733, "step": 4397 }, { "epoch": 0.53, "learning_rate": 5.028107148200812e-06, "loss": 2.4518, "step": 4398 }, { "epoch": 0.53, "learning_rate": 5.026099513693873e-06, "loss": 2.5072, "step": 4399 }, { "epoch": 0.53, "learning_rate": 5.0240918749789455e-06, "loss": 2.5627, "step": 4400 }, { "epoch": 0.53, "learning_rate": 5.022084232379719e-06, "loss": 2.6159, "step": 4401 }, { "epoch": 0.53, "learning_rate": 5.020076586219884e-06, "loss": 2.6684, "step": 4402 }, { "epoch": 0.53, "learning_rate": 5.018068936823127e-06, "loss": 2.4774, "step": 4403 }, { "epoch": 0.53, "learning_rate": 5.016061284513142e-06, "loss": 2.6553, "step": 4404 }, { "epoch": 0.53, "learning_rate": 5.014053629613619e-06, "loss": 2.5731, "step": 4405 }, { "epoch": 0.53, "learning_rate": 5.01204597244825e-06, "loss": 2.5659, "step": 4406 }, { "epoch": 0.53, "learning_rate": 5.010038313340725e-06, "loss": 2.3407, "step": 4407 }, { "epoch": 0.53, "learning_rate": 5.008030652614737e-06, "loss": 2.5823, "step": 4408 }, { "epoch": 0.53, "learning_rate": 5.006022990593977e-06, "loss": 2.6064, "step": 4409 }, { "epoch": 0.53, "learning_rate": 5.004015327602139e-06, "loss": 2.7604, "step": 4410 }, { "epoch": 0.53, "learning_rate": 5.0020076639629165e-06, "loss": 2.4973, "step": 4411 }, { "epoch": 0.53, "learning_rate": 5e-06, "loss": 2.5491, "step": 4412 }, { "epoch": 0.53, "learning_rate": 4.997992336037085e-06, "loss": 2.513, "step": 4413 }, { "epoch": 0.53, "learning_rate": 4.995984672397863e-06, "loss": 2.4393, "step": 4414 }, { "epoch": 0.53, "learning_rate": 4.993977009406024e-06, "loss": 2.6177, "step": 4415 }, { "epoch": 0.53, "learning_rate": 4.991969347385266e-06, "loss": 2.4957, "step": 4416 }, { "epoch": 0.53, "learning_rate": 4.989961686659278e-06, "loss": 2.3424, "step": 4417 }, { "epoch": 0.53, "learning_rate": 4.987954027551751e-06, "loss": 2.484, "step": 4418 }, { "epoch": 0.53, "learning_rate": 4.985946370386381e-06, "loss": 2.562, "step": 4419 }, { "epoch": 0.53, "learning_rate": 4.983938715486858e-06, "loss": 2.4753, "step": 4420 }, { "epoch": 0.53, "learning_rate": 4.9819310631768734e-06, "loss": 2.6078, "step": 4421 }, { "epoch": 0.53, "learning_rate": 4.979923413780117e-06, "loss": 2.3461, "step": 4422 }, { "epoch": 0.53, "learning_rate": 4.977915767620282e-06, "loss": 2.5036, "step": 4423 }, { "epoch": 0.53, "learning_rate": 4.975908125021055e-06, "loss": 2.3665, "step": 4424 }, { "epoch": 0.53, "learning_rate": 4.973900486306129e-06, "loss": 2.5325, "step": 4425 }, { "epoch": 0.53, "learning_rate": 4.9718928517991885e-06, "loss": 2.3529, "step": 4426 }, { "epoch": 0.53, "learning_rate": 4.969885221823925e-06, "loss": 2.6802, "step": 4427 }, { "epoch": 0.53, "learning_rate": 4.967877596704026e-06, "loss": 2.4688, "step": 4428 }, { "epoch": 0.53, "learning_rate": 4.965869976763173e-06, "loss": 2.6919, "step": 4429 }, { "epoch": 0.53, "learning_rate": 4.963862362325058e-06, "loss": 2.4719, "step": 4430 }, { "epoch": 0.53, "learning_rate": 4.961854753713364e-06, "loss": 2.4536, "step": 4431 }, { "epoch": 0.53, "learning_rate": 4.959847151251774e-06, "loss": 2.4291, "step": 4432 }, { "epoch": 0.53, "learning_rate": 4.95783955526397e-06, "loss": 2.6364, "step": 4433 }, { "epoch": 0.53, "learning_rate": 4.955831966073636e-06, "loss": 2.5107, "step": 4434 }, { "epoch": 0.53, "learning_rate": 4.953824384004451e-06, "loss": 2.5304, "step": 4435 }, { "epoch": 0.53, "learning_rate": 4.951816809380098e-06, "loss": 2.4195, "step": 4436 }, { "epoch": 0.53, "learning_rate": 4.949809242524251e-06, "loss": 2.4153, "step": 4437 }, { "epoch": 0.53, "learning_rate": 4.947801683760588e-06, "loss": 2.4473, "step": 4438 }, { "epoch": 0.53, "learning_rate": 4.945794133412787e-06, "loss": 2.4882, "step": 4439 }, { "epoch": 0.53, "learning_rate": 4.94378659180452e-06, "loss": 2.5923, "step": 4440 }, { "epoch": 0.53, "learning_rate": 4.9417790592594625e-06, "loss": 2.4903, "step": 4441 }, { "epoch": 0.53, "learning_rate": 4.939771536101286e-06, "loss": 2.5608, "step": 4442 }, { "epoch": 0.53, "learning_rate": 4.93776402265366e-06, "loss": 2.5445, "step": 4443 }, { "epoch": 0.53, "learning_rate": 4.935756519240253e-06, "loss": 2.4062, "step": 4444 }, { "epoch": 0.53, "learning_rate": 4.933749026184731e-06, "loss": 2.5928, "step": 4445 }, { "epoch": 0.53, "learning_rate": 4.93174154381076e-06, "loss": 2.6551, "step": 4446 }, { "epoch": 0.53, "learning_rate": 4.929734072442004e-06, "loss": 2.589, "step": 4447 }, { "epoch": 0.53, "learning_rate": 4.9277266124021245e-06, "loss": 2.4513, "step": 4448 }, { "epoch": 0.53, "learning_rate": 4.925719164014781e-06, "loss": 2.575, "step": 4449 }, { "epoch": 0.53, "learning_rate": 4.923711727603632e-06, "loss": 2.5154, "step": 4450 }, { "epoch": 0.53, "learning_rate": 4.9217043034923335e-06, "loss": 2.4726, "step": 4451 }, { "epoch": 0.53, "learning_rate": 4.919696892004539e-06, "loss": 2.4604, "step": 4452 }, { "epoch": 0.53, "learning_rate": 4.917689493463902e-06, "loss": 2.5113, "step": 4453 }, { "epoch": 0.54, "learning_rate": 4.915682108194073e-06, "loss": 2.5333, "step": 4454 }, { "epoch": 0.54, "learning_rate": 4.913674736518699e-06, "loss": 2.5274, "step": 4455 }, { "epoch": 0.54, "learning_rate": 4.911667378761423e-06, "loss": 2.5939, "step": 4456 }, { "epoch": 0.54, "learning_rate": 4.909660035245893e-06, "loss": 2.4214, "step": 4457 }, { "epoch": 0.54, "learning_rate": 4.907652706295748e-06, "loss": 2.449, "step": 4458 }, { "epoch": 0.54, "learning_rate": 4.905645392234628e-06, "loss": 2.6625, "step": 4459 }, { "epoch": 0.54, "learning_rate": 4.903638093386167e-06, "loss": 2.3883, "step": 4460 }, { "epoch": 0.54, "learning_rate": 4.901630810074e-06, "loss": 2.5502, "step": 4461 }, { "epoch": 0.54, "learning_rate": 4.899623542621759e-06, "loss": 2.4975, "step": 4462 }, { "epoch": 0.54, "learning_rate": 4.8976162913530715e-06, "loss": 2.5358, "step": 4463 }, { "epoch": 0.54, "learning_rate": 4.895609056591566e-06, "loss": 2.5447, "step": 4464 }, { "epoch": 0.54, "learning_rate": 4.893601838660866e-06, "loss": 2.4736, "step": 4465 }, { "epoch": 0.54, "learning_rate": 4.891594637884591e-06, "loss": 2.4252, "step": 4466 }, { "epoch": 0.54, "learning_rate": 4.8895874545863604e-06, "loss": 2.5349, "step": 4467 }, { "epoch": 0.54, "learning_rate": 4.887580289089788e-06, "loss": 2.3846, "step": 4468 }, { "epoch": 0.54, "learning_rate": 4.885573141718487e-06, "loss": 2.4806, "step": 4469 }, { "epoch": 0.54, "learning_rate": 4.883566012796068e-06, "loss": 2.6025, "step": 4470 }, { "epoch": 0.54, "learning_rate": 4.8815589026461356e-06, "loss": 2.7083, "step": 4471 }, { "epoch": 0.54, "learning_rate": 4.879551811592295e-06, "loss": 2.7444, "step": 4472 }, { "epoch": 0.54, "learning_rate": 4.877544739958145e-06, "loss": 2.467, "step": 4473 }, { "epoch": 0.54, "learning_rate": 4.875537688067284e-06, "loss": 2.3173, "step": 4474 }, { "epoch": 0.54, "learning_rate": 4.8735306562433045e-06, "loss": 2.4096, "step": 4475 }, { "epoch": 0.54, "learning_rate": 4.871523644809802e-06, "loss": 2.4586, "step": 4476 }, { "epoch": 0.54, "learning_rate": 4.869516654090361e-06, "loss": 2.4228, "step": 4477 }, { "epoch": 0.54, "learning_rate": 4.867509684408564e-06, "loss": 2.6349, "step": 4478 }, { "epoch": 0.54, "learning_rate": 4.865502736087995e-06, "loss": 2.3917, "step": 4479 }, { "epoch": 0.54, "learning_rate": 4.86349580945223e-06, "loss": 2.6994, "step": 4480 }, { "epoch": 0.54, "learning_rate": 4.861488904824843e-06, "loss": 2.6121, "step": 4481 }, { "epoch": 0.54, "learning_rate": 4.859482022529406e-06, "loss": 2.4559, "step": 4482 }, { "epoch": 0.54, "learning_rate": 4.857475162889483e-06, "loss": 2.4448, "step": 4483 }, { "epoch": 0.54, "learning_rate": 4.855468326228638e-06, "loss": 2.5122, "step": 4484 }, { "epoch": 0.54, "learning_rate": 4.85346151287043e-06, "loss": 2.5293, "step": 4485 }, { "epoch": 0.54, "learning_rate": 4.8514547231384164e-06, "loss": 2.6188, "step": 4486 }, { "epoch": 0.54, "learning_rate": 4.84944795735615e-06, "loss": 2.5477, "step": 4487 }, { "epoch": 0.54, "learning_rate": 4.847441215847177e-06, "loss": 2.5933, "step": 4488 }, { "epoch": 0.54, "learning_rate": 4.845434498935041e-06, "loss": 2.4475, "step": 4489 }, { "epoch": 0.54, "learning_rate": 4.843427806943283e-06, "loss": 2.3603, "step": 4490 }, { "epoch": 0.54, "learning_rate": 4.841421140195438e-06, "loss": 2.7032, "step": 4491 }, { "epoch": 0.54, "learning_rate": 4.839414499015041e-06, "loss": 2.4853, "step": 4492 }, { "epoch": 0.54, "learning_rate": 4.837407883725616e-06, "loss": 2.4529, "step": 4493 }, { "epoch": 0.54, "learning_rate": 4.83540129465069e-06, "loss": 2.4536, "step": 4494 }, { "epoch": 0.54, "learning_rate": 4.833394732113781e-06, "loss": 2.3853, "step": 4495 }, { "epoch": 0.54, "learning_rate": 4.831388196438402e-06, "loss": 2.5134, "step": 4496 }, { "epoch": 0.54, "learning_rate": 4.829381687948068e-06, "loss": 2.4522, "step": 4497 }, { "epoch": 0.54, "learning_rate": 4.827375206966284e-06, "loss": 2.5825, "step": 4498 }, { "epoch": 0.54, "learning_rate": 4.825368753816552e-06, "loss": 2.5482, "step": 4499 }, { "epoch": 0.54, "learning_rate": 4.82336232882237e-06, "loss": 2.4532, "step": 4500 }, { "epoch": 0.54, "learning_rate": 4.821355932307231e-06, "loss": 2.4695, "step": 4501 }, { "epoch": 0.54, "learning_rate": 4.819349564594622e-06, "loss": 2.5487, "step": 4502 }, { "epoch": 0.54, "learning_rate": 4.8173432260080285e-06, "loss": 2.6335, "step": 4503 }, { "epoch": 0.54, "learning_rate": 4.815336916870929e-06, "loss": 2.4739, "step": 4504 }, { "epoch": 0.54, "learning_rate": 4.813330637506799e-06, "loss": 2.572, "step": 4505 }, { "epoch": 0.54, "learning_rate": 4.811324388239106e-06, "loss": 2.6269, "step": 4506 }, { "epoch": 0.54, "learning_rate": 4.809318169391314e-06, "loss": 2.5877, "step": 4507 }, { "epoch": 0.54, "learning_rate": 4.807311981286888e-06, "loss": 2.622, "step": 4508 }, { "epoch": 0.54, "learning_rate": 4.805305824249277e-06, "loss": 2.4769, "step": 4509 }, { "epoch": 0.54, "learning_rate": 4.803299698601935e-06, "loss": 2.5003, "step": 4510 }, { "epoch": 0.54, "learning_rate": 4.801293604668306e-06, "loss": 2.4463, "step": 4511 }, { "epoch": 0.54, "learning_rate": 4.799287542771828e-06, "loss": 2.4727, "step": 4512 }, { "epoch": 0.54, "learning_rate": 4.797281513235937e-06, "loss": 2.6627, "step": 4513 }, { "epoch": 0.54, "learning_rate": 4.79527551638406e-06, "loss": 2.5732, "step": 4514 }, { "epoch": 0.54, "learning_rate": 4.793269552539625e-06, "loss": 2.4735, "step": 4515 }, { "epoch": 0.54, "learning_rate": 4.791263622026048e-06, "loss": 2.5869, "step": 4516 }, { "epoch": 0.54, "learning_rate": 4.7892577251667426e-06, "loss": 2.633, "step": 4517 }, { "epoch": 0.54, "learning_rate": 4.7872518622851155e-06, "loss": 2.612, "step": 4518 }, { "epoch": 0.54, "learning_rate": 4.785246033704572e-06, "loss": 2.6092, "step": 4519 }, { "epoch": 0.54, "learning_rate": 4.783240239748509e-06, "loss": 2.5165, "step": 4520 }, { "epoch": 0.54, "learning_rate": 4.781234480740314e-06, "loss": 2.6296, "step": 4521 }, { "epoch": 0.54, "learning_rate": 4.779228757003377e-06, "loss": 2.5957, "step": 4522 }, { "epoch": 0.54, "learning_rate": 4.777223068861077e-06, "loss": 2.4699, "step": 4523 }, { "epoch": 0.54, "learning_rate": 4.775217416636786e-06, "loss": 2.4819, "step": 4524 }, { "epoch": 0.54, "learning_rate": 4.773211800653875e-06, "loss": 2.5784, "step": 4525 }, { "epoch": 0.54, "learning_rate": 4.7712062212357045e-06, "loss": 2.3416, "step": 4526 }, { "epoch": 0.54, "learning_rate": 4.769200678705633e-06, "loss": 2.4512, "step": 4527 }, { "epoch": 0.54, "learning_rate": 4.76719517338701e-06, "loss": 2.3488, "step": 4528 }, { "epoch": 0.54, "learning_rate": 4.76518970560318e-06, "loss": 2.6528, "step": 4529 }, { "epoch": 0.54, "learning_rate": 4.763184275677484e-06, "loss": 2.7052, "step": 4530 }, { "epoch": 0.54, "learning_rate": 4.761178883933254e-06, "loss": 2.521, "step": 4531 }, { "epoch": 0.54, "learning_rate": 4.7591735306938144e-06, "loss": 2.5912, "step": 4532 }, { "epoch": 0.54, "learning_rate": 4.757168216282488e-06, "loss": 2.4897, "step": 4533 }, { "epoch": 0.54, "learning_rate": 4.755162941022588e-06, "loss": 2.4647, "step": 4534 }, { "epoch": 0.54, "learning_rate": 4.7531577052374215e-06, "loss": 2.4967, "step": 4535 }, { "epoch": 0.54, "learning_rate": 4.75115250925029e-06, "loss": 2.3062, "step": 4536 }, { "epoch": 0.55, "learning_rate": 4.749147353384487e-06, "loss": 2.4538, "step": 4537 }, { "epoch": 0.55, "learning_rate": 4.747142237963305e-06, "loss": 2.3927, "step": 4538 }, { "epoch": 0.55, "learning_rate": 4.7451371633100224e-06, "loss": 2.5665, "step": 4539 }, { "epoch": 0.55, "learning_rate": 4.7431321297479135e-06, "loss": 2.5967, "step": 4540 }, { "epoch": 0.55, "learning_rate": 4.7411271376002515e-06, "loss": 2.7084, "step": 4541 }, { "epoch": 0.55, "learning_rate": 4.739122187190296e-06, "loss": 2.5987, "step": 4542 }, { "epoch": 0.55, "learning_rate": 4.737117278841303e-06, "loss": 2.3484, "step": 4543 }, { "epoch": 0.55, "learning_rate": 4.7351124128765185e-06, "loss": 2.6684, "step": 4544 }, { "epoch": 0.55, "learning_rate": 4.733107589619188e-06, "loss": 2.4695, "step": 4545 }, { "epoch": 0.55, "learning_rate": 4.7311028093925445e-06, "loss": 2.6274, "step": 4546 }, { "epoch": 0.55, "learning_rate": 4.729098072519816e-06, "loss": 2.4477, "step": 4547 }, { "epoch": 0.55, "learning_rate": 4.727093379324222e-06, "loss": 2.4511, "step": 4548 }, { "epoch": 0.55, "learning_rate": 4.725088730128978e-06, "loss": 2.6093, "step": 4549 }, { "epoch": 0.55, "learning_rate": 4.723084125257291e-06, "loss": 2.5035, "step": 4550 }, { "epoch": 0.55, "learning_rate": 4.721079565032357e-06, "loss": 2.5606, "step": 4551 }, { "epoch": 0.55, "learning_rate": 4.719075049777375e-06, "loss": 2.5483, "step": 4552 }, { "epoch": 0.55, "learning_rate": 4.717070579815526e-06, "loss": 2.4872, "step": 4553 }, { "epoch": 0.55, "learning_rate": 4.715066155469989e-06, "loss": 2.4046, "step": 4554 }, { "epoch": 0.55, "learning_rate": 4.713061777063933e-06, "loss": 2.6931, "step": 4555 }, { "epoch": 0.55, "learning_rate": 4.711057444920522e-06, "loss": 2.5915, "step": 4556 }, { "epoch": 0.55, "learning_rate": 4.7090531593629125e-06, "loss": 2.6586, "step": 4557 }, { "epoch": 0.55, "learning_rate": 4.7070489207142525e-06, "loss": 2.4936, "step": 4558 }, { "epoch": 0.55, "learning_rate": 4.705044729297681e-06, "loss": 2.7177, "step": 4559 }, { "epoch": 0.55, "learning_rate": 4.703040585436331e-06, "loss": 2.488, "step": 4560 }, { "epoch": 0.55, "learning_rate": 4.7010364894533304e-06, "loss": 2.5838, "step": 4561 }, { "epoch": 0.55, "learning_rate": 4.699032441671794e-06, "loss": 2.5047, "step": 4562 }, { "epoch": 0.55, "learning_rate": 4.697028442414831e-06, "loss": 2.456, "step": 4563 }, { "epoch": 0.55, "learning_rate": 4.6950244920055475e-06, "loss": 2.3813, "step": 4564 }, { "epoch": 0.55, "learning_rate": 4.693020590767035e-06, "loss": 2.4847, "step": 4565 }, { "epoch": 0.55, "learning_rate": 4.69101673902238e-06, "loss": 2.7934, "step": 4566 }, { "epoch": 0.55, "learning_rate": 4.6890129370946595e-06, "loss": 2.5712, "step": 4567 }, { "epoch": 0.55, "learning_rate": 4.687009185306945e-06, "loss": 2.6099, "step": 4568 }, { "epoch": 0.55, "learning_rate": 4.685005483982299e-06, "loss": 2.573, "step": 4569 }, { "epoch": 0.55, "learning_rate": 4.683001833443774e-06, "loss": 2.4833, "step": 4570 }, { "epoch": 0.55, "learning_rate": 4.680998234014416e-06, "loss": 2.7227, "step": 4571 }, { "epoch": 0.55, "learning_rate": 4.678994686017263e-06, "loss": 2.6348, "step": 4572 }, { "epoch": 0.55, "learning_rate": 4.6769911897753456e-06, "loss": 2.3681, "step": 4573 }, { "epoch": 0.55, "learning_rate": 4.67498774561168e-06, "loss": 2.5644, "step": 4574 }, { "epoch": 0.55, "learning_rate": 4.672984353849285e-06, "loss": 2.604, "step": 4575 }, { "epoch": 0.55, "learning_rate": 4.670981014811161e-06, "loss": 2.5612, "step": 4576 }, { "epoch": 0.55, "learning_rate": 4.668977728820303e-06, "loss": 2.4682, "step": 4577 }, { "epoch": 0.55, "learning_rate": 4.666974496199701e-06, "loss": 2.5893, "step": 4578 }, { "epoch": 0.55, "learning_rate": 4.664971317272329e-06, "loss": 2.5033, "step": 4579 }, { "epoch": 0.55, "learning_rate": 4.662968192361161e-06, "loss": 2.5951, "step": 4580 }, { "epoch": 0.55, "learning_rate": 4.660965121789156e-06, "loss": 2.5869, "step": 4581 }, { "epoch": 0.55, "learning_rate": 4.658962105879266e-06, "loss": 2.6145, "step": 4582 }, { "epoch": 0.55, "learning_rate": 4.656959144954434e-06, "loss": 2.361, "step": 4583 }, { "epoch": 0.55, "learning_rate": 4.6549562393375965e-06, "loss": 2.4994, "step": 4584 }, { "epoch": 0.55, "learning_rate": 4.652953389351676e-06, "loss": 2.5968, "step": 4585 }, { "epoch": 0.55, "learning_rate": 4.650950595319593e-06, "loss": 2.4734, "step": 4586 }, { "epoch": 0.55, "learning_rate": 4.6489478575642535e-06, "loss": 2.493, "step": 4587 }, { "epoch": 0.55, "learning_rate": 4.646945176408555e-06, "loss": 2.5463, "step": 4588 }, { "epoch": 0.55, "learning_rate": 4.64494255217539e-06, "loss": 2.4834, "step": 4589 }, { "epoch": 0.55, "learning_rate": 4.642939985187634e-06, "loss": 2.5488, "step": 4590 }, { "epoch": 0.55, "learning_rate": 4.640937475768162e-06, "loss": 2.6648, "step": 4591 }, { "epoch": 0.55, "learning_rate": 4.6389350242398354e-06, "loss": 2.6388, "step": 4592 }, { "epoch": 0.55, "learning_rate": 4.636932630925505e-06, "loss": 2.5063, "step": 4593 }, { "epoch": 0.55, "learning_rate": 4.634930296148014e-06, "loss": 2.485, "step": 4594 }, { "epoch": 0.55, "learning_rate": 4.632928020230196e-06, "loss": 2.6323, "step": 4595 }, { "epoch": 0.55, "learning_rate": 4.630925803494877e-06, "loss": 2.5163, "step": 4596 }, { "epoch": 0.55, "learning_rate": 4.628923646264869e-06, "loss": 2.4747, "step": 4597 }, { "epoch": 0.55, "learning_rate": 4.6269215488629795e-06, "loss": 2.6745, "step": 4598 }, { "epoch": 0.55, "learning_rate": 4.624919511612003e-06, "loss": 2.5249, "step": 4599 }, { "epoch": 0.55, "learning_rate": 4.622917534834724e-06, "loss": 2.4862, "step": 4600 }, { "epoch": 0.55, "learning_rate": 4.62091561885392e-06, "loss": 2.4027, "step": 4601 }, { "epoch": 0.55, "learning_rate": 4.618913763992355e-06, "loss": 2.5152, "step": 4602 }, { "epoch": 0.55, "learning_rate": 4.616911970572788e-06, "loss": 2.4695, "step": 4603 }, { "epoch": 0.55, "learning_rate": 4.614910238917963e-06, "loss": 2.5852, "step": 4604 }, { "epoch": 0.55, "learning_rate": 4.612908569350618e-06, "loss": 2.566, "step": 4605 }, { "epoch": 0.55, "learning_rate": 4.6109069621934765e-06, "loss": 2.6288, "step": 4606 }, { "epoch": 0.55, "learning_rate": 4.608905417769258e-06, "loss": 2.5299, "step": 4607 }, { "epoch": 0.55, "learning_rate": 4.606903936400667e-06, "loss": 2.7037, "step": 4608 }, { "epoch": 0.55, "learning_rate": 4.604902518410402e-06, "loss": 2.6379, "step": 4609 }, { "epoch": 0.55, "learning_rate": 4.602901164121145e-06, "loss": 2.4958, "step": 4610 }, { "epoch": 0.55, "learning_rate": 4.6008998738555746e-06, "loss": 2.5981, "step": 4611 }, { "epoch": 0.55, "learning_rate": 4.598898647936354e-06, "loss": 2.3219, "step": 4612 }, { "epoch": 0.55, "learning_rate": 4.5968974866861394e-06, "loss": 2.5228, "step": 4613 }, { "epoch": 0.55, "learning_rate": 4.594896390427574e-06, "loss": 2.4718, "step": 4614 }, { "epoch": 0.55, "learning_rate": 4.592895359483294e-06, "loss": 2.459, "step": 4615 }, { "epoch": 0.55, "learning_rate": 4.59089439417592e-06, "loss": 2.4922, "step": 4616 }, { "epoch": 0.55, "learning_rate": 4.588893494828066e-06, "loss": 2.5695, "step": 4617 }, { "epoch": 0.55, "learning_rate": 4.586892661762333e-06, "loss": 2.5564, "step": 4618 }, { "epoch": 0.55, "learning_rate": 4.584891895301315e-06, "loss": 2.53, "step": 4619 }, { "epoch": 0.56, "learning_rate": 4.582891195767591e-06, "loss": 2.4467, "step": 4620 }, { "epoch": 0.56, "learning_rate": 4.5808905634837314e-06, "loss": 2.4923, "step": 4621 }, { "epoch": 0.56, "learning_rate": 4.578889998772296e-06, "loss": 2.511, "step": 4622 }, { "epoch": 0.56, "learning_rate": 4.576889501955833e-06, "loss": 2.5366, "step": 4623 }, { "epoch": 0.56, "learning_rate": 4.5748890733568775e-06, "loss": 2.6332, "step": 4624 }, { "epoch": 0.56, "learning_rate": 4.572888713297957e-06, "loss": 2.6805, "step": 4625 }, { "epoch": 0.56, "learning_rate": 4.570888422101588e-06, "loss": 2.6554, "step": 4626 }, { "epoch": 0.56, "learning_rate": 4.568888200090274e-06, "loss": 2.5627, "step": 4627 }, { "epoch": 0.56, "learning_rate": 4.5668880475865074e-06, "loss": 2.538, "step": 4628 }, { "epoch": 0.56, "learning_rate": 4.564887964912768e-06, "loss": 2.4616, "step": 4629 }, { "epoch": 0.56, "learning_rate": 4.562887952391531e-06, "loss": 2.5926, "step": 4630 }, { "epoch": 0.56, "learning_rate": 4.5608880103452525e-06, "loss": 2.4931, "step": 4631 }, { "epoch": 0.56, "learning_rate": 4.5588881390963804e-06, "loss": 2.3971, "step": 4632 }, { "epoch": 0.56, "learning_rate": 4.5568883389673525e-06, "loss": 2.5567, "step": 4633 }, { "epoch": 0.56, "learning_rate": 4.554888610280593e-06, "loss": 2.5392, "step": 4634 }, { "epoch": 0.56, "learning_rate": 4.552888953358515e-06, "loss": 2.505, "step": 4635 }, { "epoch": 0.56, "learning_rate": 4.55088936852352e-06, "loss": 2.4855, "step": 4636 }, { "epoch": 0.56, "learning_rate": 4.548889856098e-06, "loss": 2.4606, "step": 4637 }, { "epoch": 0.56, "learning_rate": 4.5468904164043324e-06, "loss": 2.5365, "step": 4638 }, { "epoch": 0.56, "learning_rate": 4.544891049764884e-06, "loss": 2.4926, "step": 4639 }, { "epoch": 0.56, "learning_rate": 4.542891756502008e-06, "loss": 2.5628, "step": 4640 }, { "epoch": 0.56, "learning_rate": 4.540892536938051e-06, "loss": 2.6502, "step": 4641 }, { "epoch": 0.56, "learning_rate": 4.5388933913953434e-06, "loss": 2.5149, "step": 4642 }, { "epoch": 0.56, "learning_rate": 4.536894320196203e-06, "loss": 2.6246, "step": 4643 }, { "epoch": 0.56, "learning_rate": 4.534895323662939e-06, "loss": 2.4287, "step": 4644 }, { "epoch": 0.56, "learning_rate": 4.532896402117847e-06, "loss": 2.5406, "step": 4645 }, { "epoch": 0.56, "learning_rate": 4.5308975558832095e-06, "loss": 2.6834, "step": 4646 }, { "epoch": 0.56, "learning_rate": 4.528898785281297e-06, "loss": 2.6195, "step": 4647 }, { "epoch": 0.56, "learning_rate": 4.526900090634368e-06, "loss": 2.514, "step": 4648 }, { "epoch": 0.56, "learning_rate": 4.524901472264672e-06, "loss": 2.5704, "step": 4649 }, { "epoch": 0.56, "learning_rate": 4.522902930494442e-06, "loss": 2.4946, "step": 4650 }, { "epoch": 0.56, "learning_rate": 4.520904465645897e-06, "loss": 2.613, "step": 4651 }, { "epoch": 0.56, "learning_rate": 4.518906078041252e-06, "loss": 2.5978, "step": 4652 }, { "epoch": 0.56, "learning_rate": 4.516907768002701e-06, "loss": 2.4853, "step": 4653 }, { "epoch": 0.56, "learning_rate": 4.51490953585243e-06, "loss": 2.4376, "step": 4654 }, { "epoch": 0.56, "learning_rate": 4.5129113819126095e-06, "loss": 2.5481, "step": 4655 }, { "epoch": 0.56, "learning_rate": 4.510913306505401e-06, "loss": 2.4397, "step": 4656 }, { "epoch": 0.56, "learning_rate": 4.508915309952951e-06, "loss": 2.6523, "step": 4657 }, { "epoch": 0.56, "learning_rate": 4.506917392577393e-06, "loss": 2.4729, "step": 4658 }, { "epoch": 0.56, "learning_rate": 4.504919554700846e-06, "loss": 2.4852, "step": 4659 }, { "epoch": 0.56, "learning_rate": 4.502921796645424e-06, "loss": 2.4196, "step": 4660 }, { "epoch": 0.56, "learning_rate": 4.50092411873322e-06, "loss": 2.5954, "step": 4661 }, { "epoch": 0.56, "learning_rate": 4.498926521286315e-06, "loss": 2.4166, "step": 4662 }, { "epoch": 0.56, "learning_rate": 4.49692900462678e-06, "loss": 2.6521, "step": 4663 }, { "epoch": 0.56, "learning_rate": 4.494931569076674e-06, "loss": 2.6387, "step": 4664 }, { "epoch": 0.56, "learning_rate": 4.492934214958038e-06, "loss": 2.3802, "step": 4665 }, { "epoch": 0.56, "learning_rate": 4.490936942592904e-06, "loss": 2.516, "step": 4666 }, { "epoch": 0.56, "learning_rate": 4.488939752303288e-06, "loss": 2.5003, "step": 4667 }, { "epoch": 0.56, "learning_rate": 4.486942644411197e-06, "loss": 2.5952, "step": 4668 }, { "epoch": 0.56, "learning_rate": 4.484945619238619e-06, "loss": 2.4896, "step": 4669 }, { "epoch": 0.56, "learning_rate": 4.482948677107533e-06, "loss": 2.5625, "step": 4670 }, { "epoch": 0.56, "learning_rate": 4.480951818339902e-06, "loss": 2.7392, "step": 4671 }, { "epoch": 0.56, "learning_rate": 4.478955043257679e-06, "loss": 2.4575, "step": 4672 }, { "epoch": 0.56, "learning_rate": 4.476958352182798e-06, "loss": 2.4935, "step": 4673 }, { "epoch": 0.56, "learning_rate": 4.474961745437183e-06, "loss": 2.6235, "step": 4674 }, { "epoch": 0.56, "learning_rate": 4.472965223342748e-06, "loss": 2.46, "step": 4675 }, { "epoch": 0.56, "learning_rate": 4.4709687862213866e-06, "loss": 2.5234, "step": 4676 }, { "epoch": 0.56, "learning_rate": 4.468972434394982e-06, "loss": 2.5119, "step": 4677 }, { "epoch": 0.56, "learning_rate": 4.4669761681854025e-06, "loss": 2.6826, "step": 4678 }, { "epoch": 0.56, "learning_rate": 4.464979987914504e-06, "loss": 2.5457, "step": 4679 }, { "epoch": 0.56, "learning_rate": 4.462983893904128e-06, "loss": 2.628, "step": 4680 }, { "epoch": 0.56, "learning_rate": 4.4609878864761024e-06, "loss": 2.4302, "step": 4681 }, { "epoch": 0.56, "learning_rate": 4.458991965952238e-06, "loss": 2.5833, "step": 4682 }, { "epoch": 0.56, "learning_rate": 4.456996132654337e-06, "loss": 2.6866, "step": 4683 }, { "epoch": 0.56, "learning_rate": 4.455000386904185e-06, "loss": 2.4904, "step": 4684 }, { "epoch": 0.56, "learning_rate": 4.4530047290235484e-06, "loss": 2.6688, "step": 4685 }, { "epoch": 0.56, "learning_rate": 4.451009159334191e-06, "loss": 2.5853, "step": 4686 }, { "epoch": 0.56, "learning_rate": 4.449013678157853e-06, "loss": 2.4731, "step": 4687 }, { "epoch": 0.56, "learning_rate": 4.447018285816263e-06, "loss": 2.3941, "step": 4688 }, { "epoch": 0.56, "learning_rate": 4.445022982631134e-06, "loss": 2.5579, "step": 4689 }, { "epoch": 0.56, "learning_rate": 4.443027768924168e-06, "loss": 2.2959, "step": 4690 }, { "epoch": 0.56, "learning_rate": 4.441032645017048e-06, "loss": 2.4759, "step": 4691 }, { "epoch": 0.56, "learning_rate": 4.439037611231448e-06, "loss": 2.5521, "step": 4692 }, { "epoch": 0.56, "learning_rate": 4.437042667889024e-06, "loss": 2.4141, "step": 4693 }, { "epoch": 0.56, "learning_rate": 4.435047815311414e-06, "loss": 2.422, "step": 4694 }, { "epoch": 0.56, "learning_rate": 4.4330530538202496e-06, "loss": 2.3777, "step": 4695 }, { "epoch": 0.56, "learning_rate": 4.43105838373714e-06, "loss": 2.4974, "step": 4696 }, { "epoch": 0.56, "learning_rate": 4.429063805383687e-06, "loss": 2.5579, "step": 4697 }, { "epoch": 0.56, "learning_rate": 4.4270693190814716e-06, "loss": 2.5238, "step": 4698 }, { "epoch": 0.56, "learning_rate": 4.4250749251520625e-06, "loss": 2.5379, "step": 4699 }, { "epoch": 0.56, "learning_rate": 4.423080623917012e-06, "loss": 2.3751, "step": 4700 }, { "epoch": 0.56, "learning_rate": 4.421086415697858e-06, "loss": 2.463, "step": 4701 }, { "epoch": 0.56, "learning_rate": 4.419092300816127e-06, "loss": 2.5634, "step": 4702 }, { "epoch": 0.56, "learning_rate": 4.417098279593324e-06, "loss": 2.6424, "step": 4703 }, { "epoch": 0.57, "learning_rate": 4.415104352350944e-06, "loss": 2.6202, "step": 4704 }, { "epoch": 0.57, "learning_rate": 4.413110519410465e-06, "loss": 2.6464, "step": 4705 }, { "epoch": 0.57, "learning_rate": 4.411116781093348e-06, "loss": 2.4334, "step": 4706 }, { "epoch": 0.57, "learning_rate": 4.409123137721042e-06, "loss": 2.707, "step": 4707 }, { "epoch": 0.57, "learning_rate": 4.40712958961498e-06, "loss": 2.5717, "step": 4708 }, { "epoch": 0.57, "learning_rate": 4.405136137096579e-06, "loss": 2.6126, "step": 4709 }, { "epoch": 0.57, "learning_rate": 4.40314278048724e-06, "loss": 2.4792, "step": 4710 }, { "epoch": 0.57, "learning_rate": 4.401149520108348e-06, "loss": 2.493, "step": 4711 }, { "epoch": 0.57, "learning_rate": 4.399156356281274e-06, "loss": 2.4694, "step": 4712 }, { "epoch": 0.57, "learning_rate": 4.397163289327375e-06, "loss": 2.5274, "step": 4713 }, { "epoch": 0.57, "learning_rate": 4.395170319567988e-06, "loss": 2.2966, "step": 4714 }, { "epoch": 0.57, "learning_rate": 4.393177447324439e-06, "loss": 2.4796, "step": 4715 }, { "epoch": 0.57, "learning_rate": 4.391184672918034e-06, "loss": 2.5127, "step": 4716 }, { "epoch": 0.57, "learning_rate": 4.3891919966700645e-06, "loss": 2.6744, "step": 4717 }, { "epoch": 0.57, "learning_rate": 4.3871994189018075e-06, "loss": 2.5703, "step": 4718 }, { "epoch": 0.57, "learning_rate": 4.3852069399345245e-06, "loss": 2.6238, "step": 4719 }, { "epoch": 0.57, "learning_rate": 4.383214560089461e-06, "loss": 2.4545, "step": 4720 }, { "epoch": 0.57, "learning_rate": 4.381222279687845e-06, "loss": 2.6328, "step": 4721 }, { "epoch": 0.57, "learning_rate": 4.379230099050888e-06, "loss": 2.5598, "step": 4722 }, { "epoch": 0.57, "learning_rate": 4.377238018499786e-06, "loss": 2.4774, "step": 4723 }, { "epoch": 0.57, "learning_rate": 4.3752460383557195e-06, "loss": 2.579, "step": 4724 }, { "epoch": 0.57, "learning_rate": 4.373254158939855e-06, "loss": 2.6955, "step": 4725 }, { "epoch": 0.57, "learning_rate": 4.371262380573338e-06, "loss": 2.4979, "step": 4726 }, { "epoch": 0.57, "learning_rate": 4.369270703577302e-06, "loss": 2.5012, "step": 4727 }, { "epoch": 0.57, "learning_rate": 4.36727912827286e-06, "loss": 2.4457, "step": 4728 }, { "epoch": 0.57, "learning_rate": 4.3652876549811105e-06, "loss": 2.4972, "step": 4729 }, { "epoch": 0.57, "learning_rate": 4.363296284023139e-06, "loss": 2.6137, "step": 4730 }, { "epoch": 0.57, "learning_rate": 4.3613050157200095e-06, "loss": 2.5875, "step": 4731 }, { "epoch": 0.57, "learning_rate": 4.3593138503927725e-06, "loss": 2.3217, "step": 4732 }, { "epoch": 0.57, "learning_rate": 4.3573227883624605e-06, "loss": 2.4437, "step": 4733 }, { "epoch": 0.57, "learning_rate": 4.355331829950088e-06, "loss": 2.3815, "step": 4734 }, { "epoch": 0.57, "learning_rate": 4.3533409754766555e-06, "loss": 2.6557, "step": 4735 }, { "epoch": 0.57, "learning_rate": 4.351350225263147e-06, "loss": 2.4646, "step": 4736 }, { "epoch": 0.57, "learning_rate": 4.349359579630526e-06, "loss": 2.4214, "step": 4737 }, { "epoch": 0.57, "learning_rate": 4.347369038899744e-06, "loss": 2.4911, "step": 4738 }, { "epoch": 0.57, "learning_rate": 4.34537860339173e-06, "loss": 2.4061, "step": 4739 }, { "epoch": 0.57, "learning_rate": 4.3433882734274e-06, "loss": 2.6639, "step": 4740 }, { "epoch": 0.57, "learning_rate": 4.341398049327654e-06, "loss": 2.5669, "step": 4741 }, { "epoch": 0.57, "learning_rate": 4.339407931413372e-06, "loss": 2.4022, "step": 4742 }, { "epoch": 0.57, "learning_rate": 4.337417920005418e-06, "loss": 2.532, "step": 4743 }, { "epoch": 0.57, "learning_rate": 4.3354280154246385e-06, "loss": 2.5382, "step": 4744 }, { "epoch": 0.57, "learning_rate": 4.333438217991864e-06, "loss": 2.7162, "step": 4745 }, { "epoch": 0.57, "learning_rate": 4.331448528027905e-06, "loss": 2.4285, "step": 4746 }, { "epoch": 0.57, "learning_rate": 4.329458945853555e-06, "loss": 2.4565, "step": 4747 }, { "epoch": 0.57, "learning_rate": 4.327469471789597e-06, "loss": 2.4436, "step": 4748 }, { "epoch": 0.57, "learning_rate": 4.325480106156787e-06, "loss": 2.5075, "step": 4749 }, { "epoch": 0.57, "learning_rate": 4.323490849275868e-06, "loss": 2.415, "step": 4750 }, { "epoch": 0.57, "learning_rate": 4.321501701467564e-06, "loss": 2.2453, "step": 4751 }, { "epoch": 0.57, "learning_rate": 4.319512663052585e-06, "loss": 2.4952, "step": 4752 }, { "epoch": 0.57, "learning_rate": 4.317523734351621e-06, "loss": 2.5837, "step": 4753 }, { "epoch": 0.57, "learning_rate": 4.315534915685341e-06, "loss": 2.5487, "step": 4754 }, { "epoch": 0.57, "learning_rate": 4.313546207374404e-06, "loss": 2.4302, "step": 4755 }, { "epoch": 0.57, "learning_rate": 4.311557609739442e-06, "loss": 2.4719, "step": 4756 }, { "epoch": 0.57, "learning_rate": 4.309569123101077e-06, "loss": 2.6649, "step": 4757 }, { "epoch": 0.57, "learning_rate": 4.30758074777991e-06, "loss": 2.4569, "step": 4758 }, { "epoch": 0.57, "learning_rate": 4.3055924840965204e-06, "loss": 2.5502, "step": 4759 }, { "epoch": 0.57, "learning_rate": 4.303604332371476e-06, "loss": 2.3928, "step": 4760 }, { "epoch": 0.57, "learning_rate": 4.301616292925324e-06, "loss": 2.3291, "step": 4761 }, { "epoch": 0.57, "learning_rate": 4.299628366078592e-06, "loss": 2.4832, "step": 4762 }, { "epoch": 0.57, "learning_rate": 4.297640552151789e-06, "loss": 2.5048, "step": 4763 }, { "epoch": 0.57, "learning_rate": 4.295652851465412e-06, "loss": 2.462, "step": 4764 }, { "epoch": 0.57, "learning_rate": 4.2936652643399315e-06, "loss": 2.5956, "step": 4765 }, { "epoch": 0.57, "learning_rate": 4.291677791095805e-06, "loss": 2.5795, "step": 4766 }, { "epoch": 0.57, "learning_rate": 4.2896904320534704e-06, "loss": 2.6372, "step": 4767 }, { "epoch": 0.57, "learning_rate": 4.287703187533346e-06, "loss": 2.5446, "step": 4768 }, { "epoch": 0.57, "learning_rate": 4.285716057855831e-06, "loss": 2.5414, "step": 4769 }, { "epoch": 0.57, "learning_rate": 4.283729043341308e-06, "loss": 2.3886, "step": 4770 }, { "epoch": 0.57, "learning_rate": 4.281742144310144e-06, "loss": 2.4189, "step": 4771 }, { "epoch": 0.57, "learning_rate": 4.27975536108268e-06, "loss": 2.3943, "step": 4772 }, { "epoch": 0.57, "learning_rate": 4.277768693979244e-06, "loss": 2.5218, "step": 4773 }, { "epoch": 0.57, "learning_rate": 4.275782143320141e-06, "loss": 2.5302, "step": 4774 }, { "epoch": 0.57, "learning_rate": 4.273795709425664e-06, "loss": 2.5052, "step": 4775 }, { "epoch": 0.57, "learning_rate": 4.271809392616081e-06, "loss": 2.6473, "step": 4776 }, { "epoch": 0.57, "learning_rate": 4.269823193211641e-06, "loss": 2.5813, "step": 4777 }, { "epoch": 0.57, "learning_rate": 4.26783711153258e-06, "loss": 2.5097, "step": 4778 }, { "epoch": 0.57, "learning_rate": 4.265851147899109e-06, "loss": 2.4427, "step": 4779 }, { "epoch": 0.57, "learning_rate": 4.263865302631423e-06, "loss": 2.5225, "step": 4780 }, { "epoch": 0.57, "learning_rate": 4.261879576049695e-06, "loss": 2.5665, "step": 4781 }, { "epoch": 0.57, "learning_rate": 4.259893968474082e-06, "loss": 2.5526, "step": 4782 }, { "epoch": 0.57, "learning_rate": 4.257908480224722e-06, "loss": 2.5995, "step": 4783 }, { "epoch": 0.57, "learning_rate": 4.2559231116217305e-06, "loss": 2.4624, "step": 4784 }, { "epoch": 0.57, "learning_rate": 4.253937862985205e-06, "loss": 2.5096, "step": 4785 }, { "epoch": 0.57, "learning_rate": 4.251952734635228e-06, "loss": 2.5136, "step": 4786 }, { "epoch": 0.58, "learning_rate": 4.249967726891857e-06, "loss": 2.3949, "step": 4787 }, { "epoch": 0.58, "learning_rate": 4.24798284007513e-06, "loss": 2.6419, "step": 4788 }, { "epoch": 0.58, "learning_rate": 4.245998074505072e-06, "loss": 2.4746, "step": 4789 }, { "epoch": 0.58, "learning_rate": 4.244013430501681e-06, "loss": 2.5046, "step": 4790 }, { "epoch": 0.58, "learning_rate": 4.242028908384937e-06, "loss": 2.5395, "step": 4791 }, { "epoch": 0.58, "learning_rate": 4.240044508474805e-06, "loss": 2.5844, "step": 4792 }, { "epoch": 0.58, "learning_rate": 4.238060231091224e-06, "loss": 2.4795, "step": 4793 }, { "epoch": 0.58, "learning_rate": 4.236076076554119e-06, "loss": 2.5622, "step": 4794 }, { "epoch": 0.58, "learning_rate": 4.23409204518339e-06, "loss": 2.6337, "step": 4795 }, { "epoch": 0.58, "learning_rate": 4.2321081372989195e-06, "loss": 2.5716, "step": 4796 }, { "epoch": 0.58, "learning_rate": 4.2301243532205726e-06, "loss": 2.4417, "step": 4797 }, { "epoch": 0.58, "learning_rate": 4.228140693268191e-06, "loss": 2.47, "step": 4798 }, { "epoch": 0.58, "learning_rate": 4.226157157761598e-06, "loss": 2.5784, "step": 4799 }, { "epoch": 0.58, "learning_rate": 4.224173747020593e-06, "loss": 2.5336, "step": 4800 }, { "epoch": 0.58, "learning_rate": 4.222190461364963e-06, "loss": 2.3404, "step": 4801 }, { "epoch": 0.58, "learning_rate": 4.220207301114467e-06, "loss": 2.5454, "step": 4802 }, { "epoch": 0.58, "learning_rate": 4.21822426658885e-06, "loss": 2.7036, "step": 4803 }, { "epoch": 0.58, "learning_rate": 4.216241358107831e-06, "loss": 2.5493, "step": 4804 }, { "epoch": 0.58, "learning_rate": 4.214258575991111e-06, "loss": 2.4355, "step": 4805 }, { "epoch": 0.58, "learning_rate": 4.212275920558375e-06, "loss": 2.6433, "step": 4806 }, { "epoch": 0.58, "learning_rate": 4.21029339212928e-06, "loss": 2.4853, "step": 4807 }, { "epoch": 0.58, "learning_rate": 4.208310991023469e-06, "loss": 2.7157, "step": 4808 }, { "epoch": 0.58, "learning_rate": 4.206328717560562e-06, "loss": 2.6732, "step": 4809 }, { "epoch": 0.58, "learning_rate": 4.204346572060156e-06, "loss": 2.4377, "step": 4810 }, { "epoch": 0.58, "learning_rate": 4.20236455484183e-06, "loss": 2.6815, "step": 4811 }, { "epoch": 0.58, "learning_rate": 4.200382666225141e-06, "loss": 2.5664, "step": 4812 }, { "epoch": 0.58, "learning_rate": 4.1984009065296285e-06, "loss": 2.7265, "step": 4813 }, { "epoch": 0.58, "learning_rate": 4.1964192760748085e-06, "loss": 2.5134, "step": 4814 }, { "epoch": 0.58, "learning_rate": 4.1944377751801744e-06, "loss": 2.3888, "step": 4815 }, { "epoch": 0.58, "learning_rate": 4.192456404165202e-06, "loss": 2.5797, "step": 4816 }, { "epoch": 0.58, "learning_rate": 4.190475163349345e-06, "loss": 2.5108, "step": 4817 }, { "epoch": 0.58, "learning_rate": 4.188494053052034e-06, "loss": 2.4257, "step": 4818 }, { "epoch": 0.58, "learning_rate": 4.186513073592686e-06, "loss": 2.5396, "step": 4819 }, { "epoch": 0.58, "learning_rate": 4.184532225290687e-06, "loss": 2.446, "step": 4820 }, { "epoch": 0.58, "learning_rate": 4.182551508465408e-06, "loss": 2.5204, "step": 4821 }, { "epoch": 0.58, "learning_rate": 4.180570923436196e-06, "loss": 2.4695, "step": 4822 }, { "epoch": 0.58, "learning_rate": 4.1785904705223776e-06, "loss": 2.4724, "step": 4823 }, { "epoch": 0.58, "learning_rate": 4.176610150043261e-06, "loss": 2.4487, "step": 4824 }, { "epoch": 0.58, "learning_rate": 4.174629962318129e-06, "loss": 2.3325, "step": 4825 }, { "epoch": 0.58, "learning_rate": 4.172649907666244e-06, "loss": 2.4992, "step": 4826 }, { "epoch": 0.58, "learning_rate": 4.1706699864068485e-06, "loss": 2.6275, "step": 4827 }, { "epoch": 0.58, "learning_rate": 4.16869019885916e-06, "loss": 2.4178, "step": 4828 }, { "epoch": 0.58, "learning_rate": 4.166710545342379e-06, "loss": 2.618, "step": 4829 }, { "epoch": 0.58, "learning_rate": 4.164731026175682e-06, "loss": 2.587, "step": 4830 }, { "epoch": 0.58, "learning_rate": 4.162751641678224e-06, "loss": 2.4629, "step": 4831 }, { "epoch": 0.58, "learning_rate": 4.16077239216914e-06, "loss": 2.7639, "step": 4832 }, { "epoch": 0.58, "learning_rate": 4.158793277967539e-06, "loss": 2.5509, "step": 4833 }, { "epoch": 0.58, "learning_rate": 4.156814299392512e-06, "loss": 2.559, "step": 4834 }, { "epoch": 0.58, "learning_rate": 4.1548354567631245e-06, "loss": 2.502, "step": 4835 }, { "epoch": 0.58, "learning_rate": 4.152856750398426e-06, "loss": 2.6424, "step": 4836 }, { "epoch": 0.58, "learning_rate": 4.15087818061744e-06, "loss": 2.5216, "step": 4837 }, { "epoch": 0.58, "learning_rate": 4.148899747739168e-06, "loss": 2.5336, "step": 4838 }, { "epoch": 0.58, "learning_rate": 4.146921452082587e-06, "loss": 2.5291, "step": 4839 }, { "epoch": 0.58, "learning_rate": 4.144943293966659e-06, "loss": 2.5277, "step": 4840 }, { "epoch": 0.58, "learning_rate": 4.142965273710317e-06, "loss": 2.4815, "step": 4841 }, { "epoch": 0.58, "learning_rate": 4.140987391632477e-06, "loss": 2.4966, "step": 4842 }, { "epoch": 0.58, "learning_rate": 4.139009648052029e-06, "loss": 2.3893, "step": 4843 }, { "epoch": 0.58, "learning_rate": 4.137032043287841e-06, "loss": 2.6514, "step": 4844 }, { "epoch": 0.58, "learning_rate": 4.135054577658761e-06, "loss": 2.4987, "step": 4845 }, { "epoch": 0.58, "learning_rate": 4.133077251483609e-06, "loss": 2.6475, "step": 4846 }, { "epoch": 0.58, "learning_rate": 4.131100065081191e-06, "loss": 2.4836, "step": 4847 }, { "epoch": 0.58, "learning_rate": 4.129123018770285e-06, "loss": 2.3492, "step": 4848 }, { "epoch": 0.58, "learning_rate": 4.1271461128696464e-06, "loss": 2.5578, "step": 4849 }, { "epoch": 0.58, "learning_rate": 4.125169347698009e-06, "loss": 2.5241, "step": 4850 }, { "epoch": 0.58, "learning_rate": 4.123192723574083e-06, "loss": 2.7434, "step": 4851 }, { "epoch": 0.58, "learning_rate": 4.121216240816559e-06, "loss": 2.5684, "step": 4852 }, { "epoch": 0.58, "learning_rate": 4.119239899744101e-06, "loss": 2.4261, "step": 4853 }, { "epoch": 0.58, "learning_rate": 4.117263700675353e-06, "loss": 2.6018, "step": 4854 }, { "epoch": 0.58, "learning_rate": 4.115287643928934e-06, "loss": 2.529, "step": 4855 }, { "epoch": 0.58, "learning_rate": 4.11331172982344e-06, "loss": 2.4285, "step": 4856 }, { "epoch": 0.58, "learning_rate": 4.111335958677447e-06, "loss": 2.5076, "step": 4857 }, { "epoch": 0.58, "learning_rate": 4.1093603308095025e-06, "loss": 2.6507, "step": 4858 }, { "epoch": 0.58, "learning_rate": 4.107384846538137e-06, "loss": 2.6842, "step": 4859 }, { "epoch": 0.58, "learning_rate": 4.105409506181855e-06, "loss": 2.3477, "step": 4860 }, { "epoch": 0.58, "learning_rate": 4.103434310059135e-06, "loss": 2.5301, "step": 4861 }, { "epoch": 0.58, "learning_rate": 4.101459258488438e-06, "loss": 2.5024, "step": 4862 }, { "epoch": 0.58, "learning_rate": 4.099484351788197e-06, "loss": 2.5225, "step": 4863 }, { "epoch": 0.58, "learning_rate": 4.097509590276824e-06, "loss": 2.5166, "step": 4864 }, { "epoch": 0.58, "learning_rate": 4.095534974272709e-06, "loss": 2.4833, "step": 4865 }, { "epoch": 0.58, "learning_rate": 4.093560504094215e-06, "loss": 2.4851, "step": 4866 }, { "epoch": 0.58, "learning_rate": 4.091586180059682e-06, "loss": 2.4024, "step": 4867 }, { "epoch": 0.58, "learning_rate": 4.089612002487428e-06, "loss": 2.4603, "step": 4868 }, { "epoch": 0.58, "learning_rate": 4.087637971695747e-06, "loss": 2.4883, "step": 4869 }, { "epoch": 0.59, "learning_rate": 4.085664088002911e-06, "loss": 2.6685, "step": 4870 }, { "epoch": 0.59, "learning_rate": 4.083690351727164e-06, "loss": 2.5464, "step": 4871 }, { "epoch": 0.59, "learning_rate": 4.0817167631867294e-06, "loss": 2.5826, "step": 4872 }, { "epoch": 0.59, "learning_rate": 4.079743322699807e-06, "loss": 2.4273, "step": 4873 }, { "epoch": 0.59, "learning_rate": 4.077770030584569e-06, "loss": 2.3708, "step": 4874 }, { "epoch": 0.59, "learning_rate": 4.0757968871591705e-06, "loss": 2.5209, "step": 4875 }, { "epoch": 0.59, "learning_rate": 4.0738238927417354e-06, "loss": 2.4891, "step": 4876 }, { "epoch": 0.59, "learning_rate": 4.07185104765037e-06, "loss": 2.3561, "step": 4877 }, { "epoch": 0.59, "learning_rate": 4.069878352203151e-06, "loss": 2.479, "step": 4878 }, { "epoch": 0.59, "learning_rate": 4.067905806718133e-06, "loss": 2.5887, "step": 4879 }, { "epoch": 0.59, "learning_rate": 4.065933411513349e-06, "loss": 2.4512, "step": 4880 }, { "epoch": 0.59, "learning_rate": 4.0639611669068025e-06, "loss": 2.4799, "step": 4881 }, { "epoch": 0.59, "learning_rate": 4.061989073216478e-06, "loss": 2.562, "step": 4882 }, { "epoch": 0.59, "learning_rate": 4.0600171307603325e-06, "loss": 2.6175, "step": 4883 }, { "epoch": 0.59, "learning_rate": 4.0580453398563005e-06, "loss": 2.7528, "step": 4884 }, { "epoch": 0.59, "learning_rate": 4.056073700822288e-06, "loss": 2.5791, "step": 4885 }, { "epoch": 0.59, "learning_rate": 4.054102213976184e-06, "loss": 2.5083, "step": 4886 }, { "epoch": 0.59, "learning_rate": 4.052130879635845e-06, "loss": 2.5872, "step": 4887 }, { "epoch": 0.59, "learning_rate": 4.050159698119107e-06, "loss": 2.5085, "step": 4888 }, { "epoch": 0.59, "learning_rate": 4.048188669743783e-06, "loss": 2.6802, "step": 4889 }, { "epoch": 0.59, "learning_rate": 4.046217794827659e-06, "loss": 2.6018, "step": 4890 }, { "epoch": 0.59, "learning_rate": 4.044247073688494e-06, "loss": 2.5118, "step": 4891 }, { "epoch": 0.59, "learning_rate": 4.042276506644024e-06, "loss": 2.4972, "step": 4892 }, { "epoch": 0.59, "learning_rate": 4.040306094011965e-06, "loss": 2.3447, "step": 4893 }, { "epoch": 0.59, "learning_rate": 4.038335836110001e-06, "loss": 2.6201, "step": 4894 }, { "epoch": 0.59, "learning_rate": 4.036365733255794e-06, "loss": 2.5011, "step": 4895 }, { "epoch": 0.59, "learning_rate": 4.034395785766978e-06, "loss": 2.6591, "step": 4896 }, { "epoch": 0.59, "learning_rate": 4.032425993961171e-06, "loss": 2.523, "step": 4897 }, { "epoch": 0.59, "learning_rate": 4.030456358155957e-06, "loss": 2.6904, "step": 4898 }, { "epoch": 0.59, "learning_rate": 4.028486878668896e-06, "loss": 2.4741, "step": 4899 }, { "epoch": 0.59, "learning_rate": 4.026517555817527e-06, "loss": 2.6222, "step": 4900 }, { "epoch": 0.59, "learning_rate": 4.02454838991936e-06, "loss": 2.6375, "step": 4901 }, { "epoch": 0.59, "learning_rate": 4.02257938129188e-06, "loss": 2.4083, "step": 4902 }, { "epoch": 0.59, "learning_rate": 4.020610530252548e-06, "loss": 2.5175, "step": 4903 }, { "epoch": 0.59, "learning_rate": 4.018641837118799e-06, "loss": 2.4851, "step": 4904 }, { "epoch": 0.59, "learning_rate": 4.016673302208044e-06, "loss": 2.4044, "step": 4905 }, { "epoch": 0.59, "learning_rate": 4.0147049258376654e-06, "loss": 2.4443, "step": 4906 }, { "epoch": 0.59, "learning_rate": 4.01273670832502e-06, "loss": 2.6252, "step": 4907 }, { "epoch": 0.59, "learning_rate": 4.010768649987446e-06, "loss": 2.3682, "step": 4908 }, { "epoch": 0.59, "learning_rate": 4.0088007511422485e-06, "loss": 2.3978, "step": 4909 }, { "epoch": 0.59, "learning_rate": 4.006833012106707e-06, "loss": 2.5544, "step": 4910 }, { "epoch": 0.59, "learning_rate": 4.004865433198078e-06, "loss": 2.5584, "step": 4911 }, { "epoch": 0.59, "learning_rate": 4.002898014733593e-06, "loss": 2.4182, "step": 4912 }, { "epoch": 0.59, "learning_rate": 4.000930757030456e-06, "loss": 2.3943, "step": 4913 }, { "epoch": 0.59, "learning_rate": 3.998963660405843e-06, "loss": 2.6366, "step": 4914 }, { "epoch": 0.59, "learning_rate": 3.996996725176908e-06, "loss": 2.6088, "step": 4915 }, { "epoch": 0.59, "learning_rate": 3.995029951660777e-06, "loss": 2.5193, "step": 4916 }, { "epoch": 0.59, "learning_rate": 3.993063340174549e-06, "loss": 2.5376, "step": 4917 }, { "epoch": 0.59, "learning_rate": 3.991096891035298e-06, "loss": 2.595, "step": 4918 }, { "epoch": 0.59, "learning_rate": 3.989130604560074e-06, "loss": 2.7174, "step": 4919 }, { "epoch": 0.59, "learning_rate": 3.987164481065899e-06, "loss": 2.5327, "step": 4920 }, { "epoch": 0.59, "learning_rate": 3.985198520869765e-06, "loss": 2.4284, "step": 4921 }, { "epoch": 0.59, "learning_rate": 3.983232724288642e-06, "loss": 2.6153, "step": 4922 }, { "epoch": 0.59, "learning_rate": 3.981267091639475e-06, "loss": 2.531, "step": 4923 }, { "epoch": 0.59, "learning_rate": 3.979301623239177e-06, "loss": 2.6541, "step": 4924 }, { "epoch": 0.59, "learning_rate": 3.9773363194046405e-06, "loss": 2.4796, "step": 4925 }, { "epoch": 0.59, "learning_rate": 3.9753711804527266e-06, "loss": 2.5867, "step": 4926 }, { "epoch": 0.59, "learning_rate": 3.9734062067002716e-06, "loss": 2.467, "step": 4927 }, { "epoch": 0.59, "learning_rate": 3.971441398464088e-06, "loss": 2.438, "step": 4928 }, { "epoch": 0.59, "learning_rate": 3.969476756060954e-06, "loss": 2.6418, "step": 4929 }, { "epoch": 0.59, "learning_rate": 3.967512279807633e-06, "loss": 2.4639, "step": 4930 }, { "epoch": 0.59, "learning_rate": 3.965547970020851e-06, "loss": 2.6308, "step": 4931 }, { "epoch": 0.59, "learning_rate": 3.963583827017311e-06, "loss": 2.6424, "step": 4932 }, { "epoch": 0.59, "learning_rate": 3.961619851113689e-06, "loss": 2.6717, "step": 4933 }, { "epoch": 0.59, "learning_rate": 3.959656042626634e-06, "loss": 2.6414, "step": 4934 }, { "epoch": 0.59, "learning_rate": 3.957692401872769e-06, "loss": 2.5456, "step": 4935 }, { "epoch": 0.59, "learning_rate": 3.955728929168689e-06, "loss": 2.5684, "step": 4936 }, { "epoch": 0.59, "learning_rate": 3.9537656248309605e-06, "loss": 2.4174, "step": 4937 }, { "epoch": 0.59, "learning_rate": 3.951802489176126e-06, "loss": 2.5022, "step": 4938 }, { "epoch": 0.59, "learning_rate": 3.9498395225206964e-06, "loss": 2.5, "step": 4939 }, { "epoch": 0.59, "learning_rate": 3.94787672518116e-06, "loss": 2.6546, "step": 4940 }, { "epoch": 0.59, "learning_rate": 3.9459140974739755e-06, "loss": 2.5153, "step": 4941 }, { "epoch": 0.59, "learning_rate": 3.943951639715576e-06, "loss": 2.5803, "step": 4942 }, { "epoch": 0.59, "learning_rate": 3.941989352222366e-06, "loss": 2.5764, "step": 4943 }, { "epoch": 0.59, "learning_rate": 3.940027235310719e-06, "loss": 2.4846, "step": 4944 }, { "epoch": 0.59, "learning_rate": 3.938065289296986e-06, "loss": 2.4249, "step": 4945 }, { "epoch": 0.59, "learning_rate": 3.9361035144974905e-06, "loss": 2.4133, "step": 4946 }, { "epoch": 0.59, "learning_rate": 3.934141911228525e-06, "loss": 2.543, "step": 4947 }, { "epoch": 0.59, "learning_rate": 3.932180479806357e-06, "loss": 2.6736, "step": 4948 }, { "epoch": 0.59, "learning_rate": 3.930219220547223e-06, "loss": 2.4867, "step": 4949 }, { "epoch": 0.59, "learning_rate": 3.928258133767336e-06, "loss": 2.4432, "step": 4950 }, { "epoch": 0.59, "learning_rate": 3.92629721978288e-06, "loss": 2.3723, "step": 4951 }, { "epoch": 0.59, "learning_rate": 3.924336478910007e-06, "loss": 2.6019, "step": 4952 }, { "epoch": 0.6, "learning_rate": 3.922375911464849e-06, "loss": 2.5161, "step": 4953 }, { "epoch": 0.6, "learning_rate": 3.920415517763503e-06, "loss": 2.5733, "step": 4954 }, { "epoch": 0.6, "learning_rate": 3.918455298122041e-06, "loss": 2.4679, "step": 4955 }, { "epoch": 0.6, "learning_rate": 3.916495252856506e-06, "loss": 2.4922, "step": 4956 }, { "epoch": 0.6, "learning_rate": 3.914535382282913e-06, "loss": 2.4435, "step": 4957 }, { "epoch": 0.6, "learning_rate": 3.912575686717251e-06, "loss": 2.4271, "step": 4958 }, { "epoch": 0.6, "learning_rate": 3.910616166475477e-06, "loss": 2.5095, "step": 4959 }, { "epoch": 0.6, "learning_rate": 3.908656821873523e-06, "loss": 2.5107, "step": 4960 }, { "epoch": 0.6, "learning_rate": 3.906697653227291e-06, "loss": 2.4476, "step": 4961 }, { "epoch": 0.6, "learning_rate": 3.904738660852654e-06, "loss": 2.4865, "step": 4962 }, { "epoch": 0.6, "learning_rate": 3.9027798450654585e-06, "loss": 2.5297, "step": 4963 }, { "epoch": 0.6, "learning_rate": 3.900821206181521e-06, "loss": 2.674, "step": 4964 }, { "epoch": 0.6, "learning_rate": 3.898862744516631e-06, "loss": 2.5417, "step": 4965 }, { "epoch": 0.6, "learning_rate": 3.89690446038655e-06, "loss": 2.4093, "step": 4966 }, { "epoch": 0.6, "learning_rate": 3.8949463541070065e-06, "loss": 2.4897, "step": 4967 }, { "epoch": 0.6, "learning_rate": 3.892988425993703e-06, "loss": 2.525, "step": 4968 }, { "epoch": 0.6, "learning_rate": 3.891030676362315e-06, "loss": 2.3902, "step": 4969 }, { "epoch": 0.6, "learning_rate": 3.889073105528489e-06, "loss": 2.5884, "step": 4970 }, { "epoch": 0.6, "learning_rate": 3.887115713807839e-06, "loss": 2.3973, "step": 4971 }, { "epoch": 0.6, "learning_rate": 3.885158501515954e-06, "loss": 2.3552, "step": 4972 }, { "epoch": 0.6, "learning_rate": 3.88320146896839e-06, "loss": 2.4136, "step": 4973 }, { "epoch": 0.6, "learning_rate": 3.881244616480679e-06, "loss": 2.47, "step": 4974 }, { "epoch": 0.6, "learning_rate": 3.879287944368321e-06, "loss": 2.5461, "step": 4975 }, { "epoch": 0.6, "learning_rate": 3.8773314529467875e-06, "loss": 2.6127, "step": 4976 }, { "epoch": 0.6, "learning_rate": 3.8753751425315225e-06, "loss": 2.6071, "step": 4977 }, { "epoch": 0.6, "learning_rate": 3.873419013437937e-06, "loss": 2.618, "step": 4978 }, { "epoch": 0.6, "learning_rate": 3.871463065981415e-06, "loss": 2.496, "step": 4979 }, { "epoch": 0.6, "learning_rate": 3.869507300477311e-06, "loss": 2.4832, "step": 4980 }, { "epoch": 0.6, "learning_rate": 3.867551717240952e-06, "loss": 2.545, "step": 4981 }, { "epoch": 0.6, "learning_rate": 3.865596316587633e-06, "loss": 2.593, "step": 4982 }, { "epoch": 0.6, "learning_rate": 3.86364109883262e-06, "loss": 2.4829, "step": 4983 }, { "epoch": 0.6, "learning_rate": 3.8616860642911516e-06, "loss": 2.5589, "step": 4984 }, { "epoch": 0.6, "learning_rate": 3.85973121327843e-06, "loss": 2.5866, "step": 4985 }, { "epoch": 0.6, "learning_rate": 3.857776546109641e-06, "loss": 2.4887, "step": 4986 }, { "epoch": 0.6, "learning_rate": 3.855822063099927e-06, "loss": 2.4433, "step": 4987 }, { "epoch": 0.6, "learning_rate": 3.853867764564409e-06, "loss": 2.6315, "step": 4988 }, { "epoch": 0.6, "learning_rate": 3.851913650818177e-06, "loss": 2.5939, "step": 4989 }, { "epoch": 0.6, "learning_rate": 3.849959722176287e-06, "loss": 2.4589, "step": 4990 }, { "epoch": 0.6, "learning_rate": 3.848005978953769e-06, "loss": 2.6314, "step": 4991 }, { "epoch": 0.6, "learning_rate": 3.846052421465623e-06, "loss": 2.5799, "step": 4992 }, { "epoch": 0.6, "learning_rate": 3.844099050026819e-06, "loss": 2.5222, "step": 4993 }, { "epoch": 0.6, "learning_rate": 3.842145864952295e-06, "loss": 2.4196, "step": 4994 }, { "epoch": 0.6, "learning_rate": 3.84019286655696e-06, "loss": 2.413, "step": 4995 }, { "epoch": 0.6, "learning_rate": 3.838240055155692e-06, "loss": 2.595, "step": 4996 }, { "epoch": 0.6, "learning_rate": 3.836287431063344e-06, "loss": 2.5207, "step": 4997 }, { "epoch": 0.6, "learning_rate": 3.834334994594733e-06, "loss": 2.5144, "step": 4998 }, { "epoch": 0.6, "learning_rate": 3.832382746064647e-06, "loss": 2.3374, "step": 4999 }, { "epoch": 0.6, "learning_rate": 3.830430685787844e-06, "loss": 2.577, "step": 5000 }, { "epoch": 0.6, "learning_rate": 3.828478814079054e-06, "loss": 2.7151, "step": 5001 }, { "epoch": 0.6, "learning_rate": 3.8265271312529714e-06, "loss": 2.5266, "step": 5002 }, { "epoch": 0.6, "learning_rate": 3.824575637624265e-06, "loss": 2.5121, "step": 5003 }, { "epoch": 0.6, "learning_rate": 3.8226243335075715e-06, "loss": 2.4622, "step": 5004 }, { "epoch": 0.6, "learning_rate": 3.820673219217497e-06, "loss": 2.4387, "step": 5005 }, { "epoch": 0.6, "learning_rate": 3.818722295068616e-06, "loss": 2.5886, "step": 5006 }, { "epoch": 0.6, "learning_rate": 3.816771561375473e-06, "loss": 2.5406, "step": 5007 }, { "epoch": 0.6, "learning_rate": 3.814821018452583e-06, "loss": 2.592, "step": 5008 }, { "epoch": 0.6, "learning_rate": 3.812870666614431e-06, "loss": 2.5259, "step": 5009 }, { "epoch": 0.6, "learning_rate": 3.8109205061754657e-06, "loss": 2.3736, "step": 5010 }, { "epoch": 0.6, "learning_rate": 3.8089705374501116e-06, "loss": 2.462, "step": 5011 }, { "epoch": 0.6, "learning_rate": 3.8070207607527587e-06, "loss": 2.5273, "step": 5012 }, { "epoch": 0.6, "learning_rate": 3.805071176397766e-06, "loss": 2.4739, "step": 5013 }, { "epoch": 0.6, "learning_rate": 3.8031217846994628e-06, "loss": 2.6388, "step": 5014 }, { "epoch": 0.6, "learning_rate": 3.801172585972146e-06, "loss": 2.6525, "step": 5015 }, { "epoch": 0.6, "learning_rate": 3.7992235805300838e-06, "loss": 2.4216, "step": 5016 }, { "epoch": 0.6, "learning_rate": 3.7972747686875104e-06, "loss": 2.4764, "step": 5017 }, { "epoch": 0.6, "learning_rate": 3.7953261507586282e-06, "loss": 2.6501, "step": 5018 }, { "epoch": 0.6, "learning_rate": 3.7933777270576145e-06, "loss": 2.5571, "step": 5019 }, { "epoch": 0.6, "learning_rate": 3.7914294978986083e-06, "loss": 2.5942, "step": 5020 }, { "epoch": 0.6, "learning_rate": 3.7894814635957188e-06, "loss": 2.4701, "step": 5021 }, { "epoch": 0.6, "learning_rate": 3.7875336244630278e-06, "loss": 2.4182, "step": 5022 }, { "epoch": 0.6, "learning_rate": 3.7855859808145808e-06, "loss": 2.3399, "step": 5023 }, { "epoch": 0.6, "learning_rate": 3.7836385329643933e-06, "loss": 2.3826, "step": 5024 }, { "epoch": 0.6, "learning_rate": 3.7816912812264506e-06, "loss": 2.5337, "step": 5025 }, { "epoch": 0.6, "learning_rate": 3.779744225914703e-06, "loss": 2.4479, "step": 5026 }, { "epoch": 0.6, "learning_rate": 3.777797367343076e-06, "loss": 2.4938, "step": 5027 }, { "epoch": 0.6, "learning_rate": 3.7758507058254547e-06, "loss": 2.5076, "step": 5028 }, { "epoch": 0.6, "learning_rate": 3.773904241675696e-06, "loss": 2.5482, "step": 5029 }, { "epoch": 0.6, "learning_rate": 3.77195797520763e-06, "loss": 2.4423, "step": 5030 }, { "epoch": 0.6, "learning_rate": 3.770011906735049e-06, "loss": 2.4936, "step": 5031 }, { "epoch": 0.6, "learning_rate": 3.768066036571713e-06, "loss": 2.5321, "step": 5032 }, { "epoch": 0.6, "learning_rate": 3.766120365031352e-06, "loss": 2.5735, "step": 5033 }, { "epoch": 0.6, "learning_rate": 3.764174892427666e-06, "loss": 2.5805, "step": 5034 }, { "epoch": 0.6, "learning_rate": 3.76222961907432e-06, "loss": 2.4771, "step": 5035 }, { "epoch": 0.6, "learning_rate": 3.760284545284947e-06, "loss": 2.4682, "step": 5036 }, { "epoch": 0.61, "learning_rate": 3.7583396713731486e-06, "loss": 2.456, "step": 5037 }, { "epoch": 0.61, "learning_rate": 3.7563949976524933e-06, "loss": 2.6913, "step": 5038 }, { "epoch": 0.61, "learning_rate": 3.7544505244365204e-06, "loss": 2.5072, "step": 5039 }, { "epoch": 0.61, "learning_rate": 3.7525062520387305e-06, "loss": 2.4621, "step": 5040 }, { "epoch": 0.61, "learning_rate": 3.750562180772601e-06, "loss": 2.4993, "step": 5041 }, { "epoch": 0.61, "learning_rate": 3.7486183109515696e-06, "loss": 2.4674, "step": 5042 }, { "epoch": 0.61, "learning_rate": 3.7466746428890434e-06, "loss": 2.5972, "step": 5043 }, { "epoch": 0.61, "learning_rate": 3.744731176898396e-06, "loss": 2.5712, "step": 5044 }, { "epoch": 0.61, "learning_rate": 3.7427879132929735e-06, "loss": 2.5569, "step": 5045 }, { "epoch": 0.61, "learning_rate": 3.7408448523860817e-06, "loss": 2.515, "step": 5046 }, { "epoch": 0.61, "learning_rate": 3.738901994490999e-06, "loss": 2.5363, "step": 5047 }, { "epoch": 0.61, "learning_rate": 3.7369593399209704e-06, "loss": 2.4126, "step": 5048 }, { "epoch": 0.61, "learning_rate": 3.7350168889892046e-06, "loss": 2.5044, "step": 5049 }, { "epoch": 0.61, "learning_rate": 3.7330746420088837e-06, "loss": 2.354, "step": 5050 }, { "epoch": 0.61, "learning_rate": 3.7311325992931517e-06, "loss": 2.3892, "step": 5051 }, { "epoch": 0.61, "learning_rate": 3.7291907611551197e-06, "loss": 2.5166, "step": 5052 }, { "epoch": 0.61, "learning_rate": 3.7272491279078716e-06, "loss": 2.7588, "step": 5053 }, { "epoch": 0.61, "learning_rate": 3.725307699864452e-06, "loss": 2.5537, "step": 5054 }, { "epoch": 0.61, "learning_rate": 3.723366477337875e-06, "loss": 2.5741, "step": 5055 }, { "epoch": 0.61, "learning_rate": 3.7214254606411193e-06, "loss": 2.5606, "step": 5056 }, { "epoch": 0.61, "learning_rate": 3.7194846500871353e-06, "loss": 2.5653, "step": 5057 }, { "epoch": 0.61, "learning_rate": 3.717544045988835e-06, "loss": 2.4784, "step": 5058 }, { "epoch": 0.61, "learning_rate": 3.7156036486591006e-06, "loss": 2.5439, "step": 5059 }, { "epoch": 0.61, "learning_rate": 3.7136634584107787e-06, "loss": 2.461, "step": 5060 }, { "epoch": 0.61, "learning_rate": 3.711723475556682e-06, "loss": 2.5265, "step": 5061 }, { "epoch": 0.61, "learning_rate": 3.709783700409595e-06, "loss": 2.5148, "step": 5062 }, { "epoch": 0.61, "learning_rate": 3.70784413328226e-06, "loss": 2.5461, "step": 5063 }, { "epoch": 0.61, "learning_rate": 3.705904774487396e-06, "loss": 2.7058, "step": 5064 }, { "epoch": 0.61, "learning_rate": 3.703965624337681e-06, "loss": 2.5522, "step": 5065 }, { "epoch": 0.61, "learning_rate": 3.7020266831457598e-06, "loss": 2.562, "step": 5066 }, { "epoch": 0.61, "learning_rate": 3.7000879512242473e-06, "loss": 2.6152, "step": 5067 }, { "epoch": 0.61, "learning_rate": 3.69814942888572e-06, "loss": 2.5508, "step": 5068 }, { "epoch": 0.61, "learning_rate": 3.6962111164427263e-06, "loss": 2.5404, "step": 5069 }, { "epoch": 0.61, "learning_rate": 3.6942730142077756e-06, "loss": 2.3514, "step": 5070 }, { "epoch": 0.61, "learning_rate": 3.692335122493346e-06, "loss": 2.5645, "step": 5071 }, { "epoch": 0.61, "learning_rate": 3.6903974416118786e-06, "loss": 2.6065, "step": 5072 }, { "epoch": 0.61, "learning_rate": 3.6884599718757873e-06, "loss": 2.5013, "step": 5073 }, { "epoch": 0.61, "learning_rate": 3.6865227135974436e-06, "loss": 2.4169, "step": 5074 }, { "epoch": 0.61, "learning_rate": 3.684585667089192e-06, "loss": 2.4233, "step": 5075 }, { "epoch": 0.61, "learning_rate": 3.6826488326633393e-06, "loss": 2.7467, "step": 5076 }, { "epoch": 0.61, "learning_rate": 3.680712210632158e-06, "loss": 2.4093, "step": 5077 }, { "epoch": 0.61, "learning_rate": 3.6787758013078863e-06, "loss": 2.4178, "step": 5078 }, { "epoch": 0.61, "learning_rate": 3.6768396050027284e-06, "loss": 2.6067, "step": 5079 }, { "epoch": 0.61, "learning_rate": 3.6749036220288563e-06, "loss": 2.5035, "step": 5080 }, { "epoch": 0.61, "learning_rate": 3.6729678526984046e-06, "loss": 2.4545, "step": 5081 }, { "epoch": 0.61, "learning_rate": 3.6710322973234758e-06, "loss": 2.5253, "step": 5082 }, { "epoch": 0.61, "learning_rate": 3.669096956216135e-06, "loss": 2.5167, "step": 5083 }, { "epoch": 0.61, "learning_rate": 3.6671618296884147e-06, "loss": 2.6043, "step": 5084 }, { "epoch": 0.61, "learning_rate": 3.6652269180523137e-06, "loss": 2.6464, "step": 5085 }, { "epoch": 0.61, "learning_rate": 3.663292221619794e-06, "loss": 2.5744, "step": 5086 }, { "epoch": 0.61, "learning_rate": 3.661357740702787e-06, "loss": 2.5735, "step": 5087 }, { "epoch": 0.61, "learning_rate": 3.6594234756131826e-06, "loss": 2.5746, "step": 5088 }, { "epoch": 0.61, "learning_rate": 3.6574894266628415e-06, "loss": 2.4488, "step": 5089 }, { "epoch": 0.61, "learning_rate": 3.655555594163587e-06, "loss": 2.7364, "step": 5090 }, { "epoch": 0.61, "learning_rate": 3.6536219784272074e-06, "loss": 2.5308, "step": 5091 }, { "epoch": 0.61, "learning_rate": 3.6516885797654593e-06, "loss": 2.5674, "step": 5092 }, { "epoch": 0.61, "learning_rate": 3.64975539849006e-06, "loss": 2.3874, "step": 5093 }, { "epoch": 0.61, "learning_rate": 3.6478224349126944e-06, "loss": 2.4535, "step": 5094 }, { "epoch": 0.61, "learning_rate": 3.6458896893450104e-06, "loss": 2.4008, "step": 5095 }, { "epoch": 0.61, "learning_rate": 3.6439571620986213e-06, "loss": 2.622, "step": 5096 }, { "epoch": 0.61, "learning_rate": 3.6420248534851075e-06, "loss": 2.5958, "step": 5097 }, { "epoch": 0.61, "learning_rate": 3.640092763816013e-06, "loss": 2.5485, "step": 5098 }, { "epoch": 0.61, "learning_rate": 3.6381608934028447e-06, "loss": 2.5861, "step": 5099 }, { "epoch": 0.61, "learning_rate": 3.6362292425570754e-06, "loss": 2.4628, "step": 5100 }, { "epoch": 0.61, "learning_rate": 3.634297811590143e-06, "loss": 2.5686, "step": 5101 }, { "epoch": 0.61, "learning_rate": 3.6323666008134465e-06, "loss": 2.4375, "step": 5102 }, { "epoch": 0.61, "learning_rate": 3.6304356105383566e-06, "loss": 2.3743, "step": 5103 }, { "epoch": 0.61, "learning_rate": 3.6285048410762018e-06, "loss": 2.5021, "step": 5104 }, { "epoch": 0.61, "learning_rate": 3.6265742927382778e-06, "loss": 2.4798, "step": 5105 }, { "epoch": 0.61, "learning_rate": 3.6246439658358446e-06, "loss": 2.5, "step": 5106 }, { "epoch": 0.61, "learning_rate": 3.6227138606801225e-06, "loss": 2.4777, "step": 5107 }, { "epoch": 0.61, "learning_rate": 3.620783977582305e-06, "loss": 2.5858, "step": 5108 }, { "epoch": 0.61, "learning_rate": 3.6188543168535416e-06, "loss": 2.6944, "step": 5109 }, { "epoch": 0.61, "learning_rate": 3.61692487880495e-06, "loss": 2.479, "step": 5110 }, { "epoch": 0.61, "learning_rate": 3.61499566374761e-06, "loss": 2.2808, "step": 5111 }, { "epoch": 0.61, "learning_rate": 3.613066671992567e-06, "loss": 2.7281, "step": 5112 }, { "epoch": 0.61, "learning_rate": 3.6111379038508276e-06, "loss": 2.4341, "step": 5113 }, { "epoch": 0.61, "learning_rate": 3.6092093596333654e-06, "loss": 2.4488, "step": 5114 }, { "epoch": 0.61, "learning_rate": 3.6072810396511186e-06, "loss": 2.2915, "step": 5115 }, { "epoch": 0.61, "learning_rate": 3.605352944214986e-06, "loss": 2.3949, "step": 5116 }, { "epoch": 0.61, "learning_rate": 3.603425073635831e-06, "loss": 2.525, "step": 5117 }, { "epoch": 0.61, "learning_rate": 3.601497428224481e-06, "loss": 2.3545, "step": 5118 }, { "epoch": 0.61, "learning_rate": 3.5995700082917307e-06, "loss": 2.5431, "step": 5119 }, { "epoch": 0.62, "learning_rate": 3.5976428141483326e-06, "loss": 2.4549, "step": 5120 }, { "epoch": 0.62, "learning_rate": 3.5957158461050056e-06, "loss": 2.4153, "step": 5121 }, { "epoch": 0.62, "learning_rate": 3.5937891044724344e-06, "loss": 2.5595, "step": 5122 }, { "epoch": 0.62, "learning_rate": 3.5918625895612622e-06, "loss": 2.4526, "step": 5123 }, { "epoch": 0.62, "learning_rate": 3.5899363016821e-06, "loss": 2.5859, "step": 5124 }, { "epoch": 0.62, "learning_rate": 3.5880102411455185e-06, "loss": 2.5839, "step": 5125 }, { "epoch": 0.62, "learning_rate": 3.586084408262056e-06, "loss": 2.568, "step": 5126 }, { "epoch": 0.62, "learning_rate": 3.5841588033422103e-06, "loss": 2.5326, "step": 5127 }, { "epoch": 0.62, "learning_rate": 3.5822334266964454e-06, "loss": 2.4828, "step": 5128 }, { "epoch": 0.62, "learning_rate": 3.580308278635183e-06, "loss": 2.4173, "step": 5129 }, { "epoch": 0.62, "learning_rate": 3.5783833594688177e-06, "loss": 2.5672, "step": 5130 }, { "epoch": 0.62, "learning_rate": 3.5764586695076987e-06, "loss": 2.4434, "step": 5131 }, { "epoch": 0.62, "learning_rate": 3.5745342090621406e-06, "loss": 2.7237, "step": 5132 }, { "epoch": 0.62, "learning_rate": 3.572609978442423e-06, "loss": 2.5052, "step": 5133 }, { "epoch": 0.62, "learning_rate": 3.5706859779587856e-06, "loss": 2.6683, "step": 5134 }, { "epoch": 0.62, "learning_rate": 3.5687622079214328e-06, "loss": 2.3648, "step": 5135 }, { "epoch": 0.62, "learning_rate": 3.566838668640531e-06, "loss": 2.4437, "step": 5136 }, { "epoch": 0.62, "learning_rate": 3.5649153604262094e-06, "loss": 2.5803, "step": 5137 }, { "epoch": 0.62, "learning_rate": 3.5629922835885618e-06, "loss": 2.5502, "step": 5138 }, { "epoch": 0.62, "learning_rate": 3.561069438437642e-06, "loss": 2.5065, "step": 5139 }, { "epoch": 0.62, "learning_rate": 3.5591468252834654e-06, "loss": 2.5241, "step": 5140 }, { "epoch": 0.62, "learning_rate": 3.557224444436017e-06, "loss": 2.3322, "step": 5141 }, { "epoch": 0.62, "learning_rate": 3.555302296205237e-06, "loss": 2.4034, "step": 5142 }, { "epoch": 0.62, "learning_rate": 3.553380380901031e-06, "loss": 2.4135, "step": 5143 }, { "epoch": 0.62, "learning_rate": 3.551458698833265e-06, "loss": 2.525, "step": 5144 }, { "epoch": 0.62, "learning_rate": 3.549537250311772e-06, "loss": 2.4441, "step": 5145 }, { "epoch": 0.62, "learning_rate": 3.547616035646343e-06, "loss": 2.5917, "step": 5146 }, { "epoch": 0.62, "learning_rate": 3.545695055146733e-06, "loss": 2.5828, "step": 5147 }, { "epoch": 0.62, "learning_rate": 3.543774309122657e-06, "loss": 2.5627, "step": 5148 }, { "epoch": 0.62, "learning_rate": 3.541853797883797e-06, "loss": 2.6128, "step": 5149 }, { "epoch": 0.62, "learning_rate": 3.5399335217397936e-06, "loss": 2.6368, "step": 5150 }, { "epoch": 0.62, "learning_rate": 3.53801348100025e-06, "loss": 2.6401, "step": 5151 }, { "epoch": 0.62, "learning_rate": 3.536093675974729e-06, "loss": 2.4807, "step": 5152 }, { "epoch": 0.62, "learning_rate": 3.534174106972762e-06, "loss": 2.5955, "step": 5153 }, { "epoch": 0.62, "learning_rate": 3.532254774303838e-06, "loss": 2.4661, "step": 5154 }, { "epoch": 0.62, "learning_rate": 3.5303356782774058e-06, "loss": 2.6481, "step": 5155 }, { "epoch": 0.62, "learning_rate": 3.528416819202881e-06, "loss": 2.6402, "step": 5156 }, { "epoch": 0.62, "learning_rate": 3.5264981973896374e-06, "loss": 2.4807, "step": 5157 }, { "epoch": 0.62, "learning_rate": 3.5245798131470123e-06, "loss": 2.4342, "step": 5158 }, { "epoch": 0.62, "learning_rate": 3.522661666784303e-06, "loss": 2.5033, "step": 5159 }, { "epoch": 0.62, "learning_rate": 3.5207437586107698e-06, "loss": 2.5971, "step": 5160 }, { "epoch": 0.62, "learning_rate": 3.518826088935635e-06, "loss": 2.6164, "step": 5161 }, { "epoch": 0.62, "learning_rate": 3.5169086580680824e-06, "loss": 2.7458, "step": 5162 }, { "epoch": 0.62, "learning_rate": 3.5149914663172524e-06, "loss": 2.6041, "step": 5163 }, { "epoch": 0.62, "learning_rate": 3.5130745139922572e-06, "loss": 2.5145, "step": 5164 }, { "epoch": 0.62, "learning_rate": 3.511157801402162e-06, "loss": 2.6434, "step": 5165 }, { "epoch": 0.62, "learning_rate": 3.5092413288559948e-06, "loss": 2.4729, "step": 5166 }, { "epoch": 0.62, "learning_rate": 3.5073250966627447e-06, "loss": 2.5423, "step": 5167 }, { "epoch": 0.62, "learning_rate": 3.5054091051313666e-06, "loss": 2.3933, "step": 5168 }, { "epoch": 0.62, "learning_rate": 3.5034933545707704e-06, "loss": 2.5371, "step": 5169 }, { "epoch": 0.62, "learning_rate": 3.5015778452898306e-06, "loss": 2.6622, "step": 5170 }, { "epoch": 0.62, "learning_rate": 3.4996625775973812e-06, "loss": 2.5032, "step": 5171 }, { "epoch": 0.62, "learning_rate": 3.497747551802221e-06, "loss": 2.492, "step": 5172 }, { "epoch": 0.62, "learning_rate": 3.4958327682131032e-06, "loss": 2.5095, "step": 5173 }, { "epoch": 0.62, "learning_rate": 3.493918227138746e-06, "loss": 2.4737, "step": 5174 }, { "epoch": 0.62, "learning_rate": 3.4920039288878316e-06, "loss": 2.5062, "step": 5175 }, { "epoch": 0.62, "learning_rate": 3.4900898737689973e-06, "loss": 2.4692, "step": 5176 }, { "epoch": 0.62, "learning_rate": 3.4881760620908444e-06, "loss": 2.3774, "step": 5177 }, { "epoch": 0.62, "learning_rate": 3.4862624941619316e-06, "loss": 2.6447, "step": 5178 }, { "epoch": 0.62, "learning_rate": 3.484349170290784e-06, "loss": 2.3787, "step": 5179 }, { "epoch": 0.62, "learning_rate": 3.4824360907858824e-06, "loss": 2.3746, "step": 5180 }, { "epoch": 0.62, "learning_rate": 3.48052325595567e-06, "loss": 2.4904, "step": 5181 }, { "epoch": 0.62, "learning_rate": 3.4786106661085506e-06, "loss": 2.4811, "step": 5182 }, { "epoch": 0.62, "learning_rate": 3.4766983215528875e-06, "loss": 2.404, "step": 5183 }, { "epoch": 0.62, "learning_rate": 3.4747862225970074e-06, "loss": 2.4135, "step": 5184 }, { "epoch": 0.62, "learning_rate": 3.472874369549192e-06, "loss": 2.4078, "step": 5185 }, { "epoch": 0.62, "learning_rate": 3.47096276271769e-06, "loss": 2.4307, "step": 5186 }, { "epoch": 0.62, "learning_rate": 3.469051402410707e-06, "loss": 2.5864, "step": 5187 }, { "epoch": 0.62, "learning_rate": 3.467140288936407e-06, "loss": 2.5506, "step": 5188 }, { "epoch": 0.62, "learning_rate": 3.4652294226029177e-06, "loss": 2.4612, "step": 5189 }, { "epoch": 0.62, "learning_rate": 3.463318803718323e-06, "loss": 2.555, "step": 5190 }, { "epoch": 0.62, "learning_rate": 3.4614084325906718e-06, "loss": 2.5685, "step": 5191 }, { "epoch": 0.62, "learning_rate": 3.45949830952797e-06, "loss": 2.5255, "step": 5192 }, { "epoch": 0.62, "learning_rate": 3.457588434838184e-06, "loss": 2.3345, "step": 5193 }, { "epoch": 0.62, "learning_rate": 3.4556788088292393e-06, "loss": 2.5304, "step": 5194 }, { "epoch": 0.62, "learning_rate": 3.4537694318090215e-06, "loss": 2.549, "step": 5195 }, { "epoch": 0.62, "learning_rate": 3.4518603040853783e-06, "loss": 2.5154, "step": 5196 }, { "epoch": 0.62, "learning_rate": 3.449951425966116e-06, "loss": 2.4802, "step": 5197 }, { "epoch": 0.62, "learning_rate": 3.4480427977590004e-06, "loss": 2.501, "step": 5198 }, { "epoch": 0.62, "learning_rate": 3.4461344197717562e-06, "loss": 2.6123, "step": 5199 }, { "epoch": 0.62, "learning_rate": 3.444226292312068e-06, "loss": 2.5901, "step": 5200 }, { "epoch": 0.62, "learning_rate": 3.442318415687581e-06, "loss": 2.5017, "step": 5201 }, { "epoch": 0.62, "learning_rate": 3.4404107902059003e-06, "loss": 2.6913, "step": 5202 }, { "epoch": 0.63, "learning_rate": 3.438503416174589e-06, "loss": 2.4979, "step": 5203 }, { "epoch": 0.63, "learning_rate": 3.43659629390117e-06, "loss": 2.5792, "step": 5204 }, { "epoch": 0.63, "learning_rate": 3.434689423693126e-06, "loss": 2.3556, "step": 5205 }, { "epoch": 0.63, "learning_rate": 3.4327828058578984e-06, "loss": 2.5302, "step": 5206 }, { "epoch": 0.63, "learning_rate": 3.430876440702889e-06, "loss": 2.4373, "step": 5207 }, { "epoch": 0.63, "learning_rate": 3.4289703285354587e-06, "loss": 2.3931, "step": 5208 }, { "epoch": 0.63, "learning_rate": 3.4270644696629286e-06, "loss": 2.4269, "step": 5209 }, { "epoch": 0.63, "learning_rate": 3.4251588643925757e-06, "loss": 2.4641, "step": 5210 }, { "epoch": 0.63, "learning_rate": 3.423253513031639e-06, "loss": 2.6967, "step": 5211 }, { "epoch": 0.63, "learning_rate": 3.421348415887315e-06, "loss": 2.5224, "step": 5212 }, { "epoch": 0.63, "learning_rate": 3.4194435732667593e-06, "loss": 2.4448, "step": 5213 }, { "epoch": 0.63, "learning_rate": 3.4175389854770885e-06, "loss": 2.351, "step": 5214 }, { "epoch": 0.63, "learning_rate": 3.415634652825376e-06, "loss": 2.4423, "step": 5215 }, { "epoch": 0.63, "learning_rate": 3.4137305756186543e-06, "loss": 2.3759, "step": 5216 }, { "epoch": 0.63, "learning_rate": 3.411826754163915e-06, "loss": 2.3932, "step": 5217 }, { "epoch": 0.63, "learning_rate": 3.4099231887681073e-06, "loss": 2.6536, "step": 5218 }, { "epoch": 0.63, "learning_rate": 3.4080198797381435e-06, "loss": 2.5059, "step": 5219 }, { "epoch": 0.63, "learning_rate": 3.4061168273808896e-06, "loss": 2.8095, "step": 5220 }, { "epoch": 0.63, "learning_rate": 3.4042140320031726e-06, "loss": 2.4908, "step": 5221 }, { "epoch": 0.63, "learning_rate": 3.4023114939117773e-06, "loss": 2.5286, "step": 5222 }, { "epoch": 0.63, "learning_rate": 3.4004092134134477e-06, "loss": 2.4125, "step": 5223 }, { "epoch": 0.63, "learning_rate": 3.3985071908148836e-06, "loss": 2.5578, "step": 5224 }, { "epoch": 0.63, "learning_rate": 3.3966054264227476e-06, "loss": 2.5223, "step": 5225 }, { "epoch": 0.63, "learning_rate": 3.3947039205436593e-06, "loss": 2.523, "step": 5226 }, { "epoch": 0.63, "learning_rate": 3.3928026734841935e-06, "loss": 2.3373, "step": 5227 }, { "epoch": 0.63, "learning_rate": 3.390901685550887e-06, "loss": 2.3591, "step": 5228 }, { "epoch": 0.63, "learning_rate": 3.3890009570502304e-06, "loss": 2.3541, "step": 5229 }, { "epoch": 0.63, "learning_rate": 3.3871004882886805e-06, "loss": 2.6044, "step": 5230 }, { "epoch": 0.63, "learning_rate": 3.385200279572643e-06, "loss": 2.4239, "step": 5231 }, { "epoch": 0.63, "learning_rate": 3.383300331208489e-06, "loss": 2.5854, "step": 5232 }, { "epoch": 0.63, "learning_rate": 3.3814006435025436e-06, "loss": 2.5308, "step": 5233 }, { "epoch": 0.63, "learning_rate": 3.3795012167610898e-06, "loss": 2.3812, "step": 5234 }, { "epoch": 0.63, "learning_rate": 3.3776020512903697e-06, "loss": 2.5382, "step": 5235 }, { "epoch": 0.63, "learning_rate": 3.3757031473965827e-06, "loss": 2.6031, "step": 5236 }, { "epoch": 0.63, "learning_rate": 3.3738045053858882e-06, "loss": 2.4826, "step": 5237 }, { "epoch": 0.63, "learning_rate": 3.3719061255643996e-06, "loss": 2.7035, "step": 5238 }, { "epoch": 0.63, "learning_rate": 3.3700080082381913e-06, "loss": 2.4976, "step": 5239 }, { "epoch": 0.63, "learning_rate": 3.3681101537132914e-06, "loss": 2.5154, "step": 5240 }, { "epoch": 0.63, "learning_rate": 3.366212562295693e-06, "loss": 2.5132, "step": 5241 }, { "epoch": 0.63, "learning_rate": 3.364315234291339e-06, "loss": 2.6111, "step": 5242 }, { "epoch": 0.63, "learning_rate": 3.3624181700061328e-06, "loss": 2.5742, "step": 5243 }, { "epoch": 0.63, "learning_rate": 3.360521369745937e-06, "loss": 2.6058, "step": 5244 }, { "epoch": 0.63, "learning_rate": 3.358624833816569e-06, "loss": 2.4172, "step": 5245 }, { "epoch": 0.63, "learning_rate": 3.356728562523805e-06, "loss": 2.564, "step": 5246 }, { "epoch": 0.63, "learning_rate": 3.3548325561733775e-06, "loss": 2.5143, "step": 5247 }, { "epoch": 0.63, "learning_rate": 3.3529368150709762e-06, "loss": 2.5733, "step": 5248 }, { "epoch": 0.63, "learning_rate": 3.351041339522252e-06, "loss": 2.7168, "step": 5249 }, { "epoch": 0.63, "learning_rate": 3.3491461298328064e-06, "loss": 2.656, "step": 5250 }, { "epoch": 0.63, "learning_rate": 3.3472511863082034e-06, "loss": 2.5923, "step": 5251 }, { "epoch": 0.63, "learning_rate": 3.3453565092539586e-06, "loss": 2.5038, "step": 5252 }, { "epoch": 0.63, "learning_rate": 3.343462098975553e-06, "loss": 2.4233, "step": 5253 }, { "epoch": 0.63, "learning_rate": 3.3415679557784163e-06, "loss": 2.5002, "step": 5254 }, { "epoch": 0.63, "learning_rate": 3.339674079967942e-06, "loss": 2.5497, "step": 5255 }, { "epoch": 0.63, "learning_rate": 3.3377804718494733e-06, "loss": 2.5611, "step": 5256 }, { "epoch": 0.63, "learning_rate": 3.335887131728316e-06, "loss": 2.5799, "step": 5257 }, { "epoch": 0.63, "learning_rate": 3.33399405990973e-06, "loss": 2.3542, "step": 5258 }, { "epoch": 0.63, "learning_rate": 3.332101256698932e-06, "loss": 2.6261, "step": 5259 }, { "epoch": 0.63, "learning_rate": 3.330208722401097e-06, "loss": 2.5567, "step": 5260 }, { "epoch": 0.63, "learning_rate": 3.3283164573213557e-06, "loss": 2.5271, "step": 5261 }, { "epoch": 0.63, "learning_rate": 3.326424461764795e-06, "loss": 2.4679, "step": 5262 }, { "epoch": 0.63, "learning_rate": 3.3245327360364566e-06, "loss": 2.4132, "step": 5263 }, { "epoch": 0.63, "learning_rate": 3.3226412804413444e-06, "loss": 2.4701, "step": 5264 }, { "epoch": 0.63, "learning_rate": 3.320750095284414e-06, "loss": 2.5796, "step": 5265 }, { "epoch": 0.63, "learning_rate": 3.3188591808705773e-06, "loss": 2.511, "step": 5266 }, { "epoch": 0.63, "learning_rate": 3.3169685375047044e-06, "loss": 2.297, "step": 5267 }, { "epoch": 0.63, "learning_rate": 3.315078165491622e-06, "loss": 2.5519, "step": 5268 }, { "epoch": 0.63, "learning_rate": 3.3131880651361115e-06, "loss": 2.4593, "step": 5269 }, { "epoch": 0.63, "learning_rate": 3.3112982367429105e-06, "loss": 2.5366, "step": 5270 }, { "epoch": 0.63, "learning_rate": 3.3094086806167126e-06, "loss": 2.4915, "step": 5271 }, { "epoch": 0.63, "learning_rate": 3.3075193970621706e-06, "loss": 2.321, "step": 5272 }, { "epoch": 0.63, "learning_rate": 3.3056303863838902e-06, "loss": 2.4296, "step": 5273 }, { "epoch": 0.63, "learning_rate": 3.3037416488864303e-06, "loss": 2.4635, "step": 5274 }, { "epoch": 0.63, "learning_rate": 3.3018531848743164e-06, "loss": 2.6559, "step": 5275 }, { "epoch": 0.63, "learning_rate": 3.299964994652017e-06, "loss": 2.3666, "step": 5276 }, { "epoch": 0.63, "learning_rate": 3.2980770785239656e-06, "loss": 2.591, "step": 5277 }, { "epoch": 0.63, "learning_rate": 3.2961894367945467e-06, "loss": 2.3876, "step": 5278 }, { "epoch": 0.63, "learning_rate": 3.294302069768104e-06, "loss": 2.5892, "step": 5279 }, { "epoch": 0.63, "learning_rate": 3.292414977748932e-06, "loss": 2.5619, "step": 5280 }, { "epoch": 0.63, "learning_rate": 3.2905281610412866e-06, "loss": 2.5996, "step": 5281 }, { "epoch": 0.63, "learning_rate": 3.288641619949374e-06, "loss": 2.5966, "step": 5282 }, { "epoch": 0.63, "learning_rate": 3.286755354777361e-06, "loss": 2.345, "step": 5283 }, { "epoch": 0.63, "learning_rate": 3.2848693658293675e-06, "loss": 2.5066, "step": 5284 }, { "epoch": 0.63, "learning_rate": 3.2829836534094642e-06, "loss": 2.6319, "step": 5285 }, { "epoch": 0.64, "learning_rate": 3.281098217821689e-06, "loss": 2.5479, "step": 5286 }, { "epoch": 0.64, "learning_rate": 3.2792130593700233e-06, "loss": 2.5742, "step": 5287 }, { "epoch": 0.64, "learning_rate": 3.2773281783584104e-06, "loss": 2.4955, "step": 5288 }, { "epoch": 0.64, "learning_rate": 3.2754435750907454e-06, "loss": 2.6172, "step": 5289 }, { "epoch": 0.64, "learning_rate": 3.2735592498708818e-06, "loss": 2.4367, "step": 5290 }, { "epoch": 0.64, "learning_rate": 3.2716752030026265e-06, "loss": 2.4898, "step": 5291 }, { "epoch": 0.64, "learning_rate": 3.269791434789741e-06, "loss": 2.6084, "step": 5292 }, { "epoch": 0.64, "learning_rate": 3.267907945535943e-06, "loss": 2.4735, "step": 5293 }, { "epoch": 0.64, "learning_rate": 3.2660247355449037e-06, "loss": 2.6067, "step": 5294 }, { "epoch": 0.64, "learning_rate": 3.264141805120253e-06, "loss": 2.5848, "step": 5295 }, { "epoch": 0.64, "learning_rate": 3.262259154565569e-06, "loss": 2.498, "step": 5296 }, { "epoch": 0.64, "learning_rate": 3.260376784184393e-06, "loss": 2.5366, "step": 5297 }, { "epoch": 0.64, "learning_rate": 3.2584946942802153e-06, "loss": 2.4881, "step": 5298 }, { "epoch": 0.64, "learning_rate": 3.2566128851564833e-06, "loss": 2.5459, "step": 5299 }, { "epoch": 0.64, "learning_rate": 3.254731357116597e-06, "loss": 2.3718, "step": 5300 }, { "epoch": 0.64, "learning_rate": 3.2528501104639126e-06, "loss": 2.5318, "step": 5301 }, { "epoch": 0.64, "learning_rate": 3.250969145501742e-06, "loss": 2.4096, "step": 5302 }, { "epoch": 0.64, "learning_rate": 3.2490884625333506e-06, "loss": 2.4562, "step": 5303 }, { "epoch": 0.64, "learning_rate": 3.247208061861957e-06, "loss": 2.6356, "step": 5304 }, { "epoch": 0.64, "learning_rate": 3.245327943790736e-06, "loss": 2.4381, "step": 5305 }, { "epoch": 0.64, "learning_rate": 3.2434481086228163e-06, "loss": 2.3019, "step": 5306 }, { "epoch": 0.64, "learning_rate": 3.24156855666128e-06, "loss": 2.3692, "step": 5307 }, { "epoch": 0.64, "learning_rate": 3.2396892882091678e-06, "loss": 2.6403, "step": 5308 }, { "epoch": 0.64, "learning_rate": 3.2378103035694708e-06, "loss": 2.4894, "step": 5309 }, { "epoch": 0.64, "learning_rate": 3.2359316030451327e-06, "loss": 2.4567, "step": 5310 }, { "epoch": 0.64, "learning_rate": 3.234053186939055e-06, "loss": 2.554, "step": 5311 }, { "epoch": 0.64, "learning_rate": 3.232175055554091e-06, "loss": 2.5812, "step": 5312 }, { "epoch": 0.64, "learning_rate": 3.2302972091930517e-06, "loss": 2.6583, "step": 5313 }, { "epoch": 0.64, "learning_rate": 3.2284196481586984e-06, "loss": 2.4835, "step": 5314 }, { "epoch": 0.64, "learning_rate": 3.2265423727537457e-06, "loss": 2.7434, "step": 5315 }, { "epoch": 0.64, "learning_rate": 3.2246653832808674e-06, "loss": 2.5405, "step": 5316 }, { "epoch": 0.64, "learning_rate": 3.2227886800426844e-06, "loss": 2.5325, "step": 5317 }, { "epoch": 0.64, "learning_rate": 3.2209122633417766e-06, "loss": 2.376, "step": 5318 }, { "epoch": 0.64, "learning_rate": 3.2190361334806765e-06, "loss": 2.6829, "step": 5319 }, { "epoch": 0.64, "learning_rate": 3.2171602907618706e-06, "loss": 2.6358, "step": 5320 }, { "epoch": 0.64, "learning_rate": 3.2152847354877963e-06, "loss": 2.4313, "step": 5321 }, { "epoch": 0.64, "learning_rate": 3.2134094679608485e-06, "loss": 2.5283, "step": 5322 }, { "epoch": 0.64, "learning_rate": 3.211534488483373e-06, "loss": 2.5206, "step": 5323 }, { "epoch": 0.64, "learning_rate": 3.209659797357669e-06, "loss": 2.3794, "step": 5324 }, { "epoch": 0.64, "learning_rate": 3.207785394885993e-06, "loss": 2.4439, "step": 5325 }, { "epoch": 0.64, "learning_rate": 3.2059112813705505e-06, "loss": 2.4697, "step": 5326 }, { "epoch": 0.64, "learning_rate": 3.2040374571135024e-06, "loss": 2.5367, "step": 5327 }, { "epoch": 0.64, "learning_rate": 3.2021639224169615e-06, "loss": 2.3017, "step": 5328 }, { "epoch": 0.64, "learning_rate": 3.2002906775829967e-06, "loss": 2.5431, "step": 5329 }, { "epoch": 0.64, "learning_rate": 3.1984177229136287e-06, "loss": 2.6122, "step": 5330 }, { "epoch": 0.64, "learning_rate": 3.1965450587108317e-06, "loss": 2.6673, "step": 5331 }, { "epoch": 0.64, "learning_rate": 3.1946726852765325e-06, "loss": 2.3926, "step": 5332 }, { "epoch": 0.64, "learning_rate": 3.1928006029126103e-06, "loss": 2.6189, "step": 5333 }, { "epoch": 0.64, "learning_rate": 3.190928811920899e-06, "loss": 2.6169, "step": 5334 }, { "epoch": 0.64, "learning_rate": 3.189057312603183e-06, "loss": 2.5706, "step": 5335 }, { "epoch": 0.64, "learning_rate": 3.187186105261205e-06, "loss": 2.4661, "step": 5336 }, { "epoch": 0.64, "learning_rate": 3.185315190196655e-06, "loss": 2.3463, "step": 5337 }, { "epoch": 0.64, "learning_rate": 3.183444567711178e-06, "loss": 2.4356, "step": 5338 }, { "epoch": 0.64, "learning_rate": 3.1815742381063718e-06, "loss": 2.6496, "step": 5339 }, { "epoch": 0.64, "learning_rate": 3.179704201683786e-06, "loss": 2.4783, "step": 5340 }, { "epoch": 0.64, "learning_rate": 3.1778344587449267e-06, "loss": 2.4083, "step": 5341 }, { "epoch": 0.64, "learning_rate": 3.1759650095912474e-06, "loss": 2.4495, "step": 5342 }, { "epoch": 0.64, "learning_rate": 3.1740958545241586e-06, "loss": 2.5192, "step": 5343 }, { "epoch": 0.64, "learning_rate": 3.172226993845021e-06, "loss": 2.5789, "step": 5344 }, { "epoch": 0.64, "learning_rate": 3.170358427855148e-06, "loss": 2.5553, "step": 5345 }, { "epoch": 0.64, "learning_rate": 3.1684901568558058e-06, "loss": 2.5553, "step": 5346 }, { "epoch": 0.64, "learning_rate": 3.1666221811482123e-06, "loss": 2.5861, "step": 5347 }, { "epoch": 0.64, "learning_rate": 3.16475450103354e-06, "loss": 2.3913, "step": 5348 }, { "epoch": 0.64, "learning_rate": 3.162887116812913e-06, "loss": 2.6615, "step": 5349 }, { "epoch": 0.64, "learning_rate": 3.161020028787405e-06, "loss": 2.5928, "step": 5350 }, { "epoch": 0.64, "learning_rate": 3.1591532372580438e-06, "loss": 2.5309, "step": 5351 }, { "epoch": 0.64, "learning_rate": 3.1572867425258107e-06, "loss": 2.456, "step": 5352 }, { "epoch": 0.64, "learning_rate": 3.155420544891638e-06, "loss": 2.5193, "step": 5353 }, { "epoch": 0.64, "learning_rate": 3.1535546446564107e-06, "loss": 2.5478, "step": 5354 }, { "epoch": 0.64, "learning_rate": 3.151689042120965e-06, "loss": 2.5612, "step": 5355 }, { "epoch": 0.64, "learning_rate": 3.149823737586089e-06, "loss": 2.475, "step": 5356 }, { "epoch": 0.64, "learning_rate": 3.147958731352523e-06, "loss": 2.5624, "step": 5357 }, { "epoch": 0.64, "learning_rate": 3.146094023720958e-06, "loss": 2.5248, "step": 5358 }, { "epoch": 0.64, "learning_rate": 3.1442296149920416e-06, "loss": 2.5248, "step": 5359 }, { "epoch": 0.64, "learning_rate": 3.1423655054663665e-06, "loss": 2.6186, "step": 5360 }, { "epoch": 0.64, "learning_rate": 3.1405016954444824e-06, "loss": 2.2934, "step": 5361 }, { "epoch": 0.64, "learning_rate": 3.1386381852268878e-06, "loss": 2.5569, "step": 5362 }, { "epoch": 0.64, "learning_rate": 3.1367749751140324e-06, "loss": 2.4768, "step": 5363 }, { "epoch": 0.64, "learning_rate": 3.1349120654063224e-06, "loss": 2.5852, "step": 5364 }, { "epoch": 0.64, "learning_rate": 3.13304945640411e-06, "loss": 2.486, "step": 5365 }, { "epoch": 0.64, "learning_rate": 3.1311871484077017e-06, "loss": 2.6075, "step": 5366 }, { "epoch": 0.64, "learning_rate": 3.129325141717354e-06, "loss": 2.5423, "step": 5367 }, { "epoch": 0.64, "learning_rate": 3.1274634366332775e-06, "loss": 2.6243, "step": 5368 }, { "epoch": 0.65, "learning_rate": 3.12560203345563e-06, "loss": 2.4344, "step": 5369 }, { "epoch": 0.65, "learning_rate": 3.1237409324845224e-06, "loss": 2.5058, "step": 5370 }, { "epoch": 0.65, "learning_rate": 3.1218801340200207e-06, "loss": 2.5332, "step": 5371 }, { "epoch": 0.65, "learning_rate": 3.1200196383621363e-06, "loss": 2.6755, "step": 5372 }, { "epoch": 0.65, "learning_rate": 3.118159445810835e-06, "loss": 2.5484, "step": 5373 }, { "epoch": 0.65, "learning_rate": 3.1162995566660307e-06, "loss": 2.4251, "step": 5374 }, { "epoch": 0.65, "learning_rate": 3.1144399712275952e-06, "loss": 2.4665, "step": 5375 }, { "epoch": 0.65, "learning_rate": 3.1125806897953447e-06, "loss": 2.3831, "step": 5376 }, { "epoch": 0.65, "learning_rate": 3.110721712669047e-06, "loss": 2.5155, "step": 5377 }, { "epoch": 0.65, "learning_rate": 3.1088630401484245e-06, "loss": 2.5082, "step": 5378 }, { "epoch": 0.65, "learning_rate": 3.107004672533148e-06, "loss": 2.5048, "step": 5379 }, { "epoch": 0.65, "learning_rate": 3.105146610122839e-06, "loss": 2.495, "step": 5380 }, { "epoch": 0.65, "learning_rate": 3.1032888532170693e-06, "loss": 2.4757, "step": 5381 }, { "epoch": 0.65, "learning_rate": 3.101431402115364e-06, "loss": 2.3197, "step": 5382 }, { "epoch": 0.65, "learning_rate": 3.0995742571171972e-06, "loss": 2.5489, "step": 5383 }, { "epoch": 0.65, "learning_rate": 3.0977174185219937e-06, "loss": 2.5335, "step": 5384 }, { "epoch": 0.65, "learning_rate": 3.095860886629126e-06, "loss": 2.4862, "step": 5385 }, { "epoch": 0.65, "learning_rate": 3.0940046617379247e-06, "loss": 2.4774, "step": 5386 }, { "epoch": 0.65, "learning_rate": 3.092148744147665e-06, "loss": 2.5163, "step": 5387 }, { "epoch": 0.65, "learning_rate": 3.090293134157572e-06, "loss": 2.493, "step": 5388 }, { "epoch": 0.65, "learning_rate": 3.088437832066825e-06, "loss": 2.4894, "step": 5389 }, { "epoch": 0.65, "learning_rate": 3.0865828381745515e-06, "loss": 2.3907, "step": 5390 }, { "epoch": 0.65, "learning_rate": 3.084728152779829e-06, "loss": 2.4862, "step": 5391 }, { "epoch": 0.65, "learning_rate": 3.0828737761816864e-06, "loss": 2.5417, "step": 5392 }, { "epoch": 0.65, "learning_rate": 3.0810197086791e-06, "loss": 2.5239, "step": 5393 }, { "epoch": 0.65, "learning_rate": 3.0791659505710015e-06, "loss": 2.4243, "step": 5394 }, { "epoch": 0.65, "learning_rate": 3.0773125021562683e-06, "loss": 2.577, "step": 5395 }, { "epoch": 0.65, "learning_rate": 3.0754593637337276e-06, "loss": 2.4012, "step": 5396 }, { "epoch": 0.65, "learning_rate": 3.0736065356021623e-06, "loss": 2.4704, "step": 5397 }, { "epoch": 0.65, "learning_rate": 3.071754018060299e-06, "loss": 2.478, "step": 5398 }, { "epoch": 0.65, "learning_rate": 3.0699018114068163e-06, "loss": 2.5369, "step": 5399 }, { "epoch": 0.65, "learning_rate": 3.068049915940342e-06, "loss": 2.5155, "step": 5400 }, { "epoch": 0.65, "learning_rate": 3.0661983319594566e-06, "loss": 2.5737, "step": 5401 }, { "epoch": 0.65, "learning_rate": 3.0643470597626885e-06, "loss": 2.5264, "step": 5402 }, { "epoch": 0.65, "learning_rate": 3.062496099648514e-06, "loss": 2.5013, "step": 5403 }, { "epoch": 0.65, "learning_rate": 3.0606454519153608e-06, "loss": 2.6456, "step": 5404 }, { "epoch": 0.65, "learning_rate": 3.058795116861608e-06, "loss": 2.5562, "step": 5405 }, { "epoch": 0.65, "learning_rate": 3.056945094785581e-06, "loss": 2.3531, "step": 5406 }, { "epoch": 0.65, "learning_rate": 3.055095385985555e-06, "loss": 2.5611, "step": 5407 }, { "epoch": 0.65, "learning_rate": 3.05324599075976e-06, "loss": 2.4521, "step": 5408 }, { "epoch": 0.65, "learning_rate": 3.0513969094063685e-06, "loss": 2.5203, "step": 5409 }, { "epoch": 0.65, "learning_rate": 3.049548142223506e-06, "loss": 2.4905, "step": 5410 }, { "epoch": 0.65, "learning_rate": 3.0476996895092448e-06, "loss": 2.3758, "step": 5411 }, { "epoch": 0.65, "learning_rate": 3.0458515515616117e-06, "loss": 2.5921, "step": 5412 }, { "epoch": 0.65, "learning_rate": 3.044003728678577e-06, "loss": 2.3541, "step": 5413 }, { "epoch": 0.65, "learning_rate": 3.042156221158064e-06, "loss": 2.6618, "step": 5414 }, { "epoch": 0.65, "learning_rate": 3.0403090292979425e-06, "loss": 2.4225, "step": 5415 }, { "epoch": 0.65, "learning_rate": 3.0384621533960324e-06, "loss": 2.3838, "step": 5416 }, { "epoch": 0.65, "learning_rate": 3.036615593750104e-06, "loss": 2.6415, "step": 5417 }, { "epoch": 0.65, "learning_rate": 3.0347693506578737e-06, "loss": 2.7798, "step": 5418 }, { "epoch": 0.65, "learning_rate": 3.0329234244170113e-06, "loss": 2.579, "step": 5419 }, { "epoch": 0.65, "learning_rate": 3.0310778153251325e-06, "loss": 2.5691, "step": 5420 }, { "epoch": 0.65, "learning_rate": 3.0292325236798008e-06, "loss": 2.5401, "step": 5421 }, { "epoch": 0.65, "learning_rate": 3.027387549778531e-06, "loss": 2.6773, "step": 5422 }, { "epoch": 0.65, "learning_rate": 3.0255428939187836e-06, "loss": 2.4552, "step": 5423 }, { "epoch": 0.65, "learning_rate": 3.0236985563979727e-06, "loss": 2.5276, "step": 5424 }, { "epoch": 0.65, "learning_rate": 3.0218545375134574e-06, "loss": 2.47, "step": 5425 }, { "epoch": 0.65, "learning_rate": 3.020010837562546e-06, "loss": 2.6771, "step": 5426 }, { "epoch": 0.65, "learning_rate": 3.0181674568424944e-06, "loss": 2.7199, "step": 5427 }, { "epoch": 0.65, "learning_rate": 3.0163243956505093e-06, "loss": 2.5584, "step": 5428 }, { "epoch": 0.65, "learning_rate": 3.0144816542837444e-06, "loss": 2.3753, "step": 5429 }, { "epoch": 0.65, "learning_rate": 3.0126392330393033e-06, "loss": 2.3524, "step": 5430 }, { "epoch": 0.65, "learning_rate": 3.0107971322142377e-06, "loss": 2.5185, "step": 5431 }, { "epoch": 0.65, "learning_rate": 3.0089553521055455e-06, "loss": 2.5123, "step": 5432 }, { "epoch": 0.65, "learning_rate": 3.007113893010174e-06, "loss": 2.3808, "step": 5433 }, { "epoch": 0.65, "learning_rate": 3.005272755225019e-06, "loss": 2.5056, "step": 5434 }, { "epoch": 0.65, "learning_rate": 3.0034319390469263e-06, "loss": 2.6498, "step": 5435 }, { "epoch": 0.65, "learning_rate": 3.001591444772687e-06, "loss": 2.687, "step": 5436 }, { "epoch": 0.65, "learning_rate": 2.999751272699041e-06, "loss": 2.4794, "step": 5437 }, { "epoch": 0.65, "learning_rate": 2.9979114231226776e-06, "loss": 2.5409, "step": 5438 }, { "epoch": 0.65, "learning_rate": 2.996071896340231e-06, "loss": 2.5666, "step": 5439 }, { "epoch": 0.65, "learning_rate": 2.9942326926482877e-06, "loss": 2.4712, "step": 5440 }, { "epoch": 0.65, "learning_rate": 2.992393812343378e-06, "loss": 2.3693, "step": 5441 }, { "epoch": 0.65, "learning_rate": 2.9905552557219853e-06, "loss": 2.6952, "step": 5442 }, { "epoch": 0.65, "learning_rate": 2.988717023080535e-06, "loss": 2.5596, "step": 5443 }, { "epoch": 0.65, "learning_rate": 2.986879114715403e-06, "loss": 2.5059, "step": 5444 }, { "epoch": 0.65, "learning_rate": 2.985041530922913e-06, "loss": 2.5392, "step": 5445 }, { "epoch": 0.65, "learning_rate": 2.9832042719993354e-06, "loss": 2.5685, "step": 5446 }, { "epoch": 0.65, "learning_rate": 2.9813673382408905e-06, "loss": 2.5261, "step": 5447 }, { "epoch": 0.65, "learning_rate": 2.9795307299437425e-06, "loss": 2.4393, "step": 5448 }, { "epoch": 0.65, "learning_rate": 2.977694447404007e-06, "loss": 2.5145, "step": 5449 }, { "epoch": 0.65, "learning_rate": 2.9758584909177434e-06, "loss": 2.5438, "step": 5450 }, { "epoch": 0.65, "learning_rate": 2.9740228607809607e-06, "loss": 2.4859, "step": 5451 }, { "epoch": 0.65, "learning_rate": 2.972187557289616e-06, "loss": 2.6954, "step": 5452 }, { "epoch": 0.66, "learning_rate": 2.9703525807396117e-06, "loss": 2.4924, "step": 5453 }, { "epoch": 0.66, "learning_rate": 2.9685179314268004e-06, "loss": 2.6191, "step": 5454 }, { "epoch": 0.66, "learning_rate": 2.9666836096469786e-06, "loss": 2.6432, "step": 5455 }, { "epoch": 0.66, "learning_rate": 2.964849615695892e-06, "loss": 2.626, "step": 5456 }, { "epoch": 0.66, "learning_rate": 2.9630159498692303e-06, "loss": 2.6534, "step": 5457 }, { "epoch": 0.66, "learning_rate": 2.9611826124626364e-06, "loss": 2.4933, "step": 5458 }, { "epoch": 0.66, "learning_rate": 2.959349603771695e-06, "loss": 2.562, "step": 5459 }, { "epoch": 0.66, "learning_rate": 2.95751692409194e-06, "loss": 2.5579, "step": 5460 }, { "epoch": 0.66, "learning_rate": 2.9556845737188512e-06, "loss": 2.6642, "step": 5461 }, { "epoch": 0.66, "learning_rate": 2.9538525529478557e-06, "loss": 2.6059, "step": 5462 }, { "epoch": 0.66, "learning_rate": 2.9520208620743275e-06, "loss": 2.5386, "step": 5463 }, { "epoch": 0.66, "learning_rate": 2.950189501393588e-06, "loss": 2.4603, "step": 5464 }, { "epoch": 0.66, "learning_rate": 2.9483584712009063e-06, "loss": 2.5256, "step": 5465 }, { "epoch": 0.66, "learning_rate": 2.9465277717914952e-06, "loss": 2.4229, "step": 5466 }, { "epoch": 0.66, "learning_rate": 2.9446974034605165e-06, "loss": 2.4973, "step": 5467 }, { "epoch": 0.66, "learning_rate": 2.9428673665030772e-06, "loss": 2.6098, "step": 5468 }, { "epoch": 0.66, "learning_rate": 2.941037661214231e-06, "loss": 2.5266, "step": 5469 }, { "epoch": 0.66, "learning_rate": 2.9392082878889804e-06, "loss": 2.5528, "step": 5470 }, { "epoch": 0.66, "learning_rate": 2.9373792468222716e-06, "loss": 2.6064, "step": 5471 }, { "epoch": 0.66, "learning_rate": 2.935550538309e-06, "loss": 2.5225, "step": 5472 }, { "epoch": 0.66, "learning_rate": 2.9337221626440026e-06, "loss": 2.6076, "step": 5473 }, { "epoch": 0.66, "learning_rate": 2.9318941201220664e-06, "loss": 2.5912, "step": 5474 }, { "epoch": 0.66, "learning_rate": 2.9300664110379275e-06, "loss": 2.6216, "step": 5475 }, { "epoch": 0.66, "learning_rate": 2.9282390356862606e-06, "loss": 2.6873, "step": 5476 }, { "epoch": 0.66, "learning_rate": 2.9264119943616942e-06, "loss": 2.4719, "step": 5477 }, { "epoch": 0.66, "learning_rate": 2.924585287358799e-06, "loss": 2.2681, "step": 5478 }, { "epoch": 0.66, "learning_rate": 2.92275891497209e-06, "loss": 2.4833, "step": 5479 }, { "epoch": 0.66, "learning_rate": 2.9209328774960327e-06, "loss": 2.647, "step": 5480 }, { "epoch": 0.66, "learning_rate": 2.9191071752250376e-06, "loss": 2.5384, "step": 5481 }, { "epoch": 0.66, "learning_rate": 2.917281808453457e-06, "loss": 2.5378, "step": 5482 }, { "epoch": 0.66, "learning_rate": 2.915456777475593e-06, "loss": 2.3832, "step": 5483 }, { "epoch": 0.66, "learning_rate": 2.9136320825856967e-06, "loss": 2.5508, "step": 5484 }, { "epoch": 0.66, "learning_rate": 2.911807724077953e-06, "loss": 2.6266, "step": 5485 }, { "epoch": 0.66, "learning_rate": 2.90998370224651e-06, "loss": 2.4925, "step": 5486 }, { "epoch": 0.66, "learning_rate": 2.908160017385446e-06, "loss": 2.4648, "step": 5487 }, { "epoch": 0.66, "learning_rate": 2.9063366697887947e-06, "loss": 2.5367, "step": 5488 }, { "epoch": 0.66, "learning_rate": 2.904513659750528e-06, "loss": 2.7161, "step": 5489 }, { "epoch": 0.66, "learning_rate": 2.9026909875645693e-06, "loss": 2.3945, "step": 5490 }, { "epoch": 0.66, "learning_rate": 2.9008686535247875e-06, "loss": 2.4406, "step": 5491 }, { "epoch": 0.66, "learning_rate": 2.899046657924992e-06, "loss": 2.6448, "step": 5492 }, { "epoch": 0.66, "learning_rate": 2.897225001058942e-06, "loss": 2.587, "step": 5493 }, { "epoch": 0.66, "learning_rate": 2.8954036832203393e-06, "loss": 2.6713, "step": 5494 }, { "epoch": 0.66, "learning_rate": 2.8935827047028333e-06, "loss": 2.5569, "step": 5495 }, { "epoch": 0.66, "learning_rate": 2.8917620658000166e-06, "loss": 2.3651, "step": 5496 }, { "epoch": 0.66, "learning_rate": 2.8899417668054307e-06, "loss": 2.5694, "step": 5497 }, { "epoch": 0.66, "learning_rate": 2.8881218080125605e-06, "loss": 2.5571, "step": 5498 }, { "epoch": 0.66, "learning_rate": 2.8863021897148306e-06, "loss": 2.5118, "step": 5499 }, { "epoch": 0.66, "learning_rate": 2.884482912205621e-06, "loss": 2.5589, "step": 5500 }, { "epoch": 0.66, "learning_rate": 2.882663975778247e-06, "loss": 2.6359, "step": 5501 }, { "epoch": 0.66, "learning_rate": 2.880845380725974e-06, "loss": 2.4155, "step": 5502 }, { "epoch": 0.66, "learning_rate": 2.8790271273420147e-06, "loss": 2.4688, "step": 5503 }, { "epoch": 0.66, "learning_rate": 2.8772092159195193e-06, "loss": 2.4699, "step": 5504 }, { "epoch": 0.66, "learning_rate": 2.875391646751591e-06, "loss": 2.5513, "step": 5505 }, { "epoch": 0.66, "learning_rate": 2.8735744201312688e-06, "loss": 2.5953, "step": 5506 }, { "epoch": 0.66, "learning_rate": 2.871757536351546e-06, "loss": 2.5137, "step": 5507 }, { "epoch": 0.66, "learning_rate": 2.8699409957053535e-06, "loss": 2.5473, "step": 5508 }, { "epoch": 0.66, "learning_rate": 2.868124798485572e-06, "loss": 2.5241, "step": 5509 }, { "epoch": 0.66, "learning_rate": 2.8663089449850246e-06, "loss": 2.576, "step": 5510 }, { "epoch": 0.66, "learning_rate": 2.864493435496476e-06, "loss": 2.7372, "step": 5511 }, { "epoch": 0.66, "learning_rate": 2.8626782703126423e-06, "loss": 2.5764, "step": 5512 }, { "epoch": 0.66, "learning_rate": 2.8608634497261743e-06, "loss": 2.6119, "step": 5513 }, { "epoch": 0.66, "learning_rate": 2.8590489740296767e-06, "loss": 2.4251, "step": 5514 }, { "epoch": 0.66, "learning_rate": 2.857234843515696e-06, "loss": 2.6492, "step": 5515 }, { "epoch": 0.66, "learning_rate": 2.8554210584767188e-06, "loss": 2.506, "step": 5516 }, { "epoch": 0.66, "learning_rate": 2.853607619205182e-06, "loss": 2.3984, "step": 5517 }, { "epoch": 0.66, "learning_rate": 2.8517945259934586e-06, "loss": 2.3663, "step": 5518 }, { "epoch": 0.66, "learning_rate": 2.849981779133879e-06, "loss": 2.5027, "step": 5519 }, { "epoch": 0.66, "learning_rate": 2.8481693789187036e-06, "loss": 2.3971, "step": 5520 }, { "epoch": 0.66, "learning_rate": 2.8463573256401456e-06, "loss": 2.5667, "step": 5521 }, { "epoch": 0.66, "learning_rate": 2.844545619590361e-06, "loss": 2.2879, "step": 5522 }, { "epoch": 0.66, "learning_rate": 2.8427342610614446e-06, "loss": 2.6009, "step": 5523 }, { "epoch": 0.66, "learning_rate": 2.840923250345442e-06, "loss": 2.7398, "step": 5524 }, { "epoch": 0.66, "learning_rate": 2.8391125877343412e-06, "loss": 2.4725, "step": 5525 }, { "epoch": 0.66, "learning_rate": 2.8373022735200694e-06, "loss": 2.521, "step": 5526 }, { "epoch": 0.66, "learning_rate": 2.835492307994504e-06, "loss": 2.4121, "step": 5527 }, { "epoch": 0.66, "learning_rate": 2.8336826914494607e-06, "loss": 2.5251, "step": 5528 }, { "epoch": 0.66, "learning_rate": 2.831873424176702e-06, "loss": 2.4974, "step": 5529 }, { "epoch": 0.66, "learning_rate": 2.8300645064679345e-06, "loss": 2.4901, "step": 5530 }, { "epoch": 0.66, "learning_rate": 2.828255938614807e-06, "loss": 2.6349, "step": 5531 }, { "epoch": 0.66, "learning_rate": 2.8264477209089147e-06, "loss": 2.3902, "step": 5532 }, { "epoch": 0.66, "learning_rate": 2.8246398536417897e-06, "loss": 2.4349, "step": 5533 }, { "epoch": 0.66, "learning_rate": 2.822832337104915e-06, "loss": 2.5474, "step": 5534 }, { "epoch": 0.66, "learning_rate": 2.8210251715897112e-06, "loss": 2.5008, "step": 5535 }, { "epoch": 0.67, "learning_rate": 2.819218357387547e-06, "loss": 2.4588, "step": 5536 }, { "epoch": 0.67, "learning_rate": 2.8174118947897338e-06, "loss": 2.3905, "step": 5537 }, { "epoch": 0.67, "learning_rate": 2.815605784087522e-06, "loss": 2.421, "step": 5538 }, { "epoch": 0.67, "learning_rate": 2.813800025572111e-06, "loss": 2.6113, "step": 5539 }, { "epoch": 0.67, "learning_rate": 2.8119946195346375e-06, "loss": 2.56, "step": 5540 }, { "epoch": 0.67, "learning_rate": 2.810189566266187e-06, "loss": 2.4991, "step": 5541 }, { "epoch": 0.67, "learning_rate": 2.8083848660577846e-06, "loss": 2.5564, "step": 5542 }, { "epoch": 0.67, "learning_rate": 2.8065805192004005e-06, "loss": 2.4544, "step": 5543 }, { "epoch": 0.67, "learning_rate": 2.804776525984948e-06, "loss": 2.4096, "step": 5544 }, { "epoch": 0.67, "learning_rate": 2.8029728867022795e-06, "loss": 2.4401, "step": 5545 }, { "epoch": 0.67, "learning_rate": 2.8011696016431967e-06, "loss": 2.6136, "step": 5546 }, { "epoch": 0.67, "learning_rate": 2.7993666710984356e-06, "loss": 2.4375, "step": 5547 }, { "epoch": 0.67, "learning_rate": 2.7975640953586846e-06, "loss": 2.6309, "step": 5548 }, { "epoch": 0.67, "learning_rate": 2.795761874714571e-06, "loss": 2.3641, "step": 5549 }, { "epoch": 0.67, "learning_rate": 2.79396000945666e-06, "loss": 2.5756, "step": 5550 }, { "epoch": 0.67, "learning_rate": 2.792158499875468e-06, "loss": 2.4682, "step": 5551 }, { "epoch": 0.67, "learning_rate": 2.790357346261445e-06, "loss": 2.5471, "step": 5552 }, { "epoch": 0.67, "learning_rate": 2.7885565489049948e-06, "loss": 2.5293, "step": 5553 }, { "epoch": 0.67, "learning_rate": 2.7867561080964522e-06, "loss": 2.5337, "step": 5554 }, { "epoch": 0.67, "learning_rate": 2.7849560241261013e-06, "loss": 2.4718, "step": 5555 }, { "epoch": 0.67, "learning_rate": 2.78315629728417e-06, "loss": 2.5642, "step": 5556 }, { "epoch": 0.67, "learning_rate": 2.781356927860821e-06, "loss": 2.5596, "step": 5557 }, { "epoch": 0.67, "learning_rate": 2.7795579161461685e-06, "loss": 2.6784, "step": 5558 }, { "epoch": 0.67, "learning_rate": 2.7777592624302594e-06, "loss": 2.5047, "step": 5559 }, { "epoch": 0.67, "learning_rate": 2.7759609670030922e-06, "loss": 2.7324, "step": 5560 }, { "epoch": 0.67, "learning_rate": 2.7741630301546043e-06, "loss": 2.5808, "step": 5561 }, { "epoch": 0.67, "learning_rate": 2.77236545217467e-06, "loss": 2.6279, "step": 5562 }, { "epoch": 0.67, "learning_rate": 2.7705682333531137e-06, "loss": 2.6312, "step": 5563 }, { "epoch": 0.67, "learning_rate": 2.7687713739796972e-06, "loss": 2.4349, "step": 5564 }, { "epoch": 0.67, "learning_rate": 2.7669748743441284e-06, "loss": 2.4243, "step": 5565 }, { "epoch": 0.67, "learning_rate": 2.7651787347360504e-06, "loss": 2.5013, "step": 5566 }, { "epoch": 0.67, "learning_rate": 2.763382955445053e-06, "loss": 2.4225, "step": 5567 }, { "epoch": 0.67, "learning_rate": 2.7615875367606704e-06, "loss": 2.4718, "step": 5568 }, { "epoch": 0.67, "learning_rate": 2.7597924789723716e-06, "loss": 2.6053, "step": 5569 }, { "epoch": 0.67, "learning_rate": 2.7579977823695727e-06, "loss": 2.6068, "step": 5570 }, { "epoch": 0.67, "learning_rate": 2.756203447241632e-06, "loss": 2.7228, "step": 5571 }, { "epoch": 0.67, "learning_rate": 2.7544094738778436e-06, "loss": 2.5415, "step": 5572 }, { "epoch": 0.67, "learning_rate": 2.7526158625674514e-06, "loss": 2.4305, "step": 5573 }, { "epoch": 0.67, "learning_rate": 2.7508226135996313e-06, "loss": 2.441, "step": 5574 }, { "epoch": 0.67, "learning_rate": 2.7490297272635134e-06, "loss": 2.4284, "step": 5575 }, { "epoch": 0.67, "learning_rate": 2.7472372038481575e-06, "loss": 2.5711, "step": 5576 }, { "epoch": 0.67, "learning_rate": 2.7454450436425707e-06, "loss": 2.6394, "step": 5577 }, { "epoch": 0.67, "learning_rate": 2.7436532469357017e-06, "loss": 2.6004, "step": 5578 }, { "epoch": 0.67, "learning_rate": 2.7418618140164372e-06, "loss": 2.7372, "step": 5579 }, { "epoch": 0.67, "learning_rate": 2.7400707451736103e-06, "loss": 2.5114, "step": 5580 }, { "epoch": 0.67, "learning_rate": 2.7382800406959885e-06, "loss": 2.6886, "step": 5581 }, { "epoch": 0.67, "learning_rate": 2.7364897008722867e-06, "loss": 2.479, "step": 5582 }, { "epoch": 0.67, "learning_rate": 2.734699725991161e-06, "loss": 2.5019, "step": 5583 }, { "epoch": 0.67, "learning_rate": 2.732910116341203e-06, "loss": 2.4084, "step": 5584 }, { "epoch": 0.67, "learning_rate": 2.73112087221095e-06, "loss": 2.5474, "step": 5585 }, { "epoch": 0.67, "learning_rate": 2.7293319938888795e-06, "loss": 2.4668, "step": 5586 }, { "epoch": 0.67, "learning_rate": 2.727543481663413e-06, "loss": 2.5269, "step": 5587 }, { "epoch": 0.67, "learning_rate": 2.725755335822903e-06, "loss": 2.5351, "step": 5588 }, { "epoch": 0.67, "learning_rate": 2.723967556655655e-06, "loss": 2.6037, "step": 5589 }, { "epoch": 0.67, "learning_rate": 2.7221801444499104e-06, "loss": 2.687, "step": 5590 }, { "epoch": 0.67, "learning_rate": 2.720393099493847e-06, "loss": 2.5428, "step": 5591 }, { "epoch": 0.67, "learning_rate": 2.7186064220755925e-06, "loss": 2.5088, "step": 5592 }, { "epoch": 0.67, "learning_rate": 2.7168201124832057e-06, "loss": 2.4969, "step": 5593 }, { "epoch": 0.67, "learning_rate": 2.7150341710046924e-06, "loss": 2.7266, "step": 5594 }, { "epoch": 0.67, "learning_rate": 2.7132485979280005e-06, "loss": 2.5336, "step": 5595 }, { "epoch": 0.67, "learning_rate": 2.7114633935410083e-06, "loss": 2.4457, "step": 5596 }, { "epoch": 0.67, "learning_rate": 2.709678558131551e-06, "loss": 2.4767, "step": 5597 }, { "epoch": 0.67, "learning_rate": 2.7078940919873886e-06, "loss": 2.4201, "step": 5598 }, { "epoch": 0.67, "learning_rate": 2.7061099953962316e-06, "loss": 2.5372, "step": 5599 }, { "epoch": 0.67, "learning_rate": 2.704326268645724e-06, "loss": 2.5404, "step": 5600 }, { "epoch": 0.67, "learning_rate": 2.702542912023455e-06, "loss": 2.4303, "step": 5601 }, { "epoch": 0.67, "learning_rate": 2.7007599258169546e-06, "loss": 2.4435, "step": 5602 }, { "epoch": 0.67, "learning_rate": 2.698977310313687e-06, "loss": 2.505, "step": 5603 }, { "epoch": 0.67, "learning_rate": 2.6971950658010666e-06, "loss": 2.4273, "step": 5604 }, { "epoch": 0.67, "learning_rate": 2.695413192566436e-06, "loss": 2.387, "step": 5605 }, { "epoch": 0.67, "learning_rate": 2.6936316908970874e-06, "loss": 2.5283, "step": 5606 }, { "epoch": 0.67, "learning_rate": 2.6918505610802493e-06, "loss": 2.4471, "step": 5607 }, { "epoch": 0.67, "learning_rate": 2.6900698034030904e-06, "loss": 2.4907, "step": 5608 }, { "epoch": 0.67, "learning_rate": 2.688289418152722e-06, "loss": 2.4815, "step": 5609 }, { "epoch": 0.67, "learning_rate": 2.68650940561619e-06, "loss": 2.4569, "step": 5610 }, { "epoch": 0.67, "learning_rate": 2.684729766080486e-06, "loss": 2.4151, "step": 5611 }, { "epoch": 0.67, "learning_rate": 2.6829504998325352e-06, "loss": 2.5173, "step": 5612 }, { "epoch": 0.67, "learning_rate": 2.6811716071592086e-06, "loss": 2.3114, "step": 5613 }, { "epoch": 0.67, "learning_rate": 2.679393088347316e-06, "loss": 2.585, "step": 5614 }, { "epoch": 0.67, "learning_rate": 2.6776149436836023e-06, "loss": 2.4138, "step": 5615 }, { "epoch": 0.67, "learning_rate": 2.6758371734547584e-06, "loss": 2.4584, "step": 5616 }, { "epoch": 0.67, "learning_rate": 2.674059777947408e-06, "loss": 2.5041, "step": 5617 }, { "epoch": 0.67, "learning_rate": 2.67228275744812e-06, "loss": 2.4311, "step": 5618 }, { "epoch": 0.68, "learning_rate": 2.670506112243401e-06, "loss": 2.5432, "step": 5619 }, { "epoch": 0.68, "learning_rate": 2.6687298426196974e-06, "loss": 2.6252, "step": 5620 }, { "epoch": 0.68, "learning_rate": 2.6669539488633954e-06, "loss": 2.4485, "step": 5621 }, { "epoch": 0.68, "learning_rate": 2.6651784312608177e-06, "loss": 2.6797, "step": 5622 }, { "epoch": 0.68, "learning_rate": 2.6634032900982288e-06, "loss": 2.3932, "step": 5623 }, { "epoch": 0.68, "learning_rate": 2.661628525661835e-06, "loss": 2.4724, "step": 5624 }, { "epoch": 0.68, "learning_rate": 2.6598541382377744e-06, "loss": 2.3866, "step": 5625 }, { "epoch": 0.68, "learning_rate": 2.658080128112134e-06, "loss": 2.604, "step": 5626 }, { "epoch": 0.68, "learning_rate": 2.6563064955709305e-06, "loss": 2.5153, "step": 5627 }, { "epoch": 0.68, "learning_rate": 2.6545332409001267e-06, "loss": 2.5127, "step": 5628 }, { "epoch": 0.68, "learning_rate": 2.6527603643856203e-06, "loss": 2.5399, "step": 5629 }, { "epoch": 0.68, "learning_rate": 2.6509878663132514e-06, "loss": 2.355, "step": 5630 }, { "epoch": 0.68, "learning_rate": 2.649215746968799e-06, "loss": 2.4667, "step": 5631 }, { "epoch": 0.68, "learning_rate": 2.6474440066379746e-06, "loss": 2.4941, "step": 5632 }, { "epoch": 0.68, "learning_rate": 2.6456726456064384e-06, "loss": 2.531, "step": 5633 }, { "epoch": 0.68, "learning_rate": 2.64390166415978e-06, "loss": 2.4794, "step": 5634 }, { "epoch": 0.68, "learning_rate": 2.642131062583534e-06, "loss": 2.6076, "step": 5635 }, { "epoch": 0.68, "learning_rate": 2.6403608411631744e-06, "loss": 2.4948, "step": 5636 }, { "epoch": 0.68, "learning_rate": 2.638591000184107e-06, "loss": 2.4739, "step": 5637 }, { "epoch": 0.68, "learning_rate": 2.6368215399316856e-06, "loss": 2.5466, "step": 5638 }, { "epoch": 0.68, "learning_rate": 2.6350524606911928e-06, "loss": 2.5255, "step": 5639 }, { "epoch": 0.68, "learning_rate": 2.633283762747857e-06, "loss": 2.6151, "step": 5640 }, { "epoch": 0.68, "learning_rate": 2.631515446386844e-06, "loss": 2.4614, "step": 5641 }, { "epoch": 0.68, "learning_rate": 2.629747511893255e-06, "loss": 2.4149, "step": 5642 }, { "epoch": 0.68, "learning_rate": 2.6279799595521354e-06, "loss": 2.5482, "step": 5643 }, { "epoch": 0.68, "learning_rate": 2.62621278964846e-06, "loss": 2.5784, "step": 5644 }, { "epoch": 0.68, "learning_rate": 2.624446002467152e-06, "loss": 2.323, "step": 5645 }, { "epoch": 0.68, "learning_rate": 2.622679598293063e-06, "loss": 2.591, "step": 5646 }, { "epoch": 0.68, "learning_rate": 2.6209135774109907e-06, "loss": 2.4178, "step": 5647 }, { "epoch": 0.68, "learning_rate": 2.61914794010567e-06, "loss": 2.3658, "step": 5648 }, { "epoch": 0.68, "learning_rate": 2.617382686661768e-06, "loss": 2.7183, "step": 5649 }, { "epoch": 0.68, "learning_rate": 2.6156178173638978e-06, "loss": 2.4108, "step": 5650 }, { "epoch": 0.68, "learning_rate": 2.613853332496603e-06, "loss": 2.4953, "step": 5651 }, { "epoch": 0.68, "learning_rate": 2.612089232344371e-06, "loss": 2.6214, "step": 5652 }, { "epoch": 0.68, "learning_rate": 2.6103255171916246e-06, "loss": 2.5185, "step": 5653 }, { "epoch": 0.68, "learning_rate": 2.6085621873227264e-06, "loss": 2.4915, "step": 5654 }, { "epoch": 0.68, "learning_rate": 2.6067992430219768e-06, "loss": 2.5804, "step": 5655 }, { "epoch": 0.68, "learning_rate": 2.6050366845736087e-06, "loss": 2.4007, "step": 5656 }, { "epoch": 0.68, "learning_rate": 2.603274512261801e-06, "loss": 2.5762, "step": 5657 }, { "epoch": 0.68, "learning_rate": 2.601512726370662e-06, "loss": 2.4189, "step": 5658 }, { "epoch": 0.68, "learning_rate": 2.599751327184245e-06, "loss": 2.5183, "step": 5659 }, { "epoch": 0.68, "learning_rate": 2.5979903149865386e-06, "loss": 2.4393, "step": 5660 }, { "epoch": 0.68, "learning_rate": 2.596229690061466e-06, "loss": 2.4669, "step": 5661 }, { "epoch": 0.68, "learning_rate": 2.594469452692892e-06, "loss": 2.5278, "step": 5662 }, { "epoch": 0.68, "learning_rate": 2.5927096031646128e-06, "loss": 2.5713, "step": 5663 }, { "epoch": 0.68, "learning_rate": 2.5909501417603744e-06, "loss": 2.5852, "step": 5664 }, { "epoch": 0.68, "learning_rate": 2.5891910687638453e-06, "loss": 2.3829, "step": 5665 }, { "epoch": 0.68, "learning_rate": 2.5874323844586414e-06, "loss": 2.5066, "step": 5666 }, { "epoch": 0.68, "learning_rate": 2.5856740891283145e-06, "loss": 2.4272, "step": 5667 }, { "epoch": 0.68, "learning_rate": 2.5839161830563475e-06, "loss": 2.4649, "step": 5668 }, { "epoch": 0.68, "learning_rate": 2.58215866652617e-06, "loss": 2.4383, "step": 5669 }, { "epoch": 0.68, "learning_rate": 2.58040153982114e-06, "loss": 2.4128, "step": 5670 }, { "epoch": 0.68, "learning_rate": 2.578644803224558e-06, "loss": 2.5301, "step": 5671 }, { "epoch": 0.68, "learning_rate": 2.5768884570196615e-06, "loss": 2.3275, "step": 5672 }, { "epoch": 0.68, "learning_rate": 2.5751325014896216e-06, "loss": 2.4905, "step": 5673 }, { "epoch": 0.68, "learning_rate": 2.5733769369175493e-06, "loss": 2.4747, "step": 5674 }, { "epoch": 0.68, "learning_rate": 2.5716217635864915e-06, "loss": 2.5568, "step": 5675 }, { "epoch": 0.68, "learning_rate": 2.569866981779433e-06, "loss": 2.3576, "step": 5676 }, { "epoch": 0.68, "learning_rate": 2.568112591779297e-06, "loss": 2.4917, "step": 5677 }, { "epoch": 0.68, "learning_rate": 2.566358593868936e-06, "loss": 2.525, "step": 5678 }, { "epoch": 0.68, "learning_rate": 2.5646049883311504e-06, "loss": 2.4985, "step": 5679 }, { "epoch": 0.68, "learning_rate": 2.562851775448666e-06, "loss": 2.3664, "step": 5680 }, { "epoch": 0.68, "learning_rate": 2.5610989555041536e-06, "loss": 2.4181, "step": 5681 }, { "epoch": 0.68, "learning_rate": 2.55934652878022e-06, "loss": 2.6926, "step": 5682 }, { "epoch": 0.68, "learning_rate": 2.5575944955594025e-06, "loss": 2.6438, "step": 5683 }, { "epoch": 0.68, "learning_rate": 2.555842856124182e-06, "loss": 2.5326, "step": 5684 }, { "epoch": 0.68, "learning_rate": 2.5540916107569693e-06, "loss": 2.4401, "step": 5685 }, { "epoch": 0.68, "learning_rate": 2.5523407597401194e-06, "loss": 2.5357, "step": 5686 }, { "epoch": 0.68, "learning_rate": 2.5505903033559163e-06, "loss": 2.5441, "step": 5687 }, { "epoch": 0.68, "learning_rate": 2.5488402418865854e-06, "loss": 2.4151, "step": 5688 }, { "epoch": 0.68, "learning_rate": 2.547090575614288e-06, "loss": 2.3912, "step": 5689 }, { "epoch": 0.68, "learning_rate": 2.5453413048211175e-06, "loss": 2.6546, "step": 5690 }, { "epoch": 0.68, "learning_rate": 2.543592429789108e-06, "loss": 2.4842, "step": 5691 }, { "epoch": 0.68, "learning_rate": 2.541843950800226e-06, "loss": 2.7177, "step": 5692 }, { "epoch": 0.68, "learning_rate": 2.540095868136378e-06, "loss": 2.2205, "step": 5693 }, { "epoch": 0.68, "learning_rate": 2.5383481820794064e-06, "loss": 2.4336, "step": 5694 }, { "epoch": 0.68, "learning_rate": 2.5366008929110854e-06, "loss": 2.6279, "step": 5695 }, { "epoch": 0.68, "learning_rate": 2.5348540009131283e-06, "loss": 2.6147, "step": 5696 }, { "epoch": 0.68, "learning_rate": 2.5331075063671852e-06, "loss": 2.5281, "step": 5697 }, { "epoch": 0.68, "learning_rate": 2.5313614095548423e-06, "loss": 2.5244, "step": 5698 }, { "epoch": 0.68, "learning_rate": 2.5296157107576162e-06, "loss": 2.5064, "step": 5699 }, { "epoch": 0.68, "learning_rate": 2.527870410256966e-06, "loss": 2.5034, "step": 5700 }, { "epoch": 0.68, "learning_rate": 2.5261255083342863e-06, "loss": 2.4018, "step": 5701 }, { "epoch": 0.69, "learning_rate": 2.5243810052709006e-06, "loss": 2.6909, "step": 5702 }, { "epoch": 0.69, "learning_rate": 2.5226369013480773e-06, "loss": 2.5642, "step": 5703 }, { "epoch": 0.69, "learning_rate": 2.5208931968470107e-06, "loss": 2.6771, "step": 5704 }, { "epoch": 0.69, "learning_rate": 2.519149892048839e-06, "loss": 2.3836, "step": 5705 }, { "epoch": 0.69, "learning_rate": 2.517406987234634e-06, "loss": 2.709, "step": 5706 }, { "epoch": 0.69, "learning_rate": 2.515664482685396e-06, "loss": 2.5093, "step": 5707 }, { "epoch": 0.69, "learning_rate": 2.513922378682075e-06, "loss": 2.5555, "step": 5708 }, { "epoch": 0.69, "learning_rate": 2.512180675505541e-06, "loss": 2.5321, "step": 5709 }, { "epoch": 0.69, "learning_rate": 2.5104393734366113e-06, "loss": 2.7031, "step": 5710 }, { "epoch": 0.69, "learning_rate": 2.5086984727560288e-06, "loss": 2.4588, "step": 5711 }, { "epoch": 0.69, "learning_rate": 2.5069579737444795e-06, "loss": 2.5738, "step": 5712 }, { "epoch": 0.69, "learning_rate": 2.5052178766825817e-06, "loss": 2.3612, "step": 5713 }, { "epoch": 0.69, "learning_rate": 2.5034781818508867e-06, "loss": 2.5201, "step": 5714 }, { "epoch": 0.69, "learning_rate": 2.5017388895298865e-06, "loss": 2.5114, "step": 5715 }, { "epoch": 0.69, "learning_rate": 2.5000000000000015e-06, "loss": 2.6406, "step": 5716 }, { "epoch": 0.69, "learning_rate": 2.4982615135415907e-06, "loss": 2.2936, "step": 5717 }, { "epoch": 0.69, "learning_rate": 2.4965234304349483e-06, "loss": 2.5381, "step": 5718 }, { "epoch": 0.69, "learning_rate": 2.494785750960304e-06, "loss": 2.6164, "step": 5719 }, { "epoch": 0.69, "learning_rate": 2.4930484753978224e-06, "loss": 2.5402, "step": 5720 }, { "epoch": 0.69, "learning_rate": 2.491311604027599e-06, "loss": 2.4872, "step": 5721 }, { "epoch": 0.69, "learning_rate": 2.4895751371296695e-06, "loss": 2.5674, "step": 5722 }, { "epoch": 0.69, "learning_rate": 2.4878390749839992e-06, "loss": 2.4377, "step": 5723 }, { "epoch": 0.69, "learning_rate": 2.486103417870493e-06, "loss": 2.4873, "step": 5724 }, { "epoch": 0.69, "learning_rate": 2.48436816606899e-06, "loss": 2.4355, "step": 5725 }, { "epoch": 0.69, "learning_rate": 2.482633319859259e-06, "loss": 2.5612, "step": 5726 }, { "epoch": 0.69, "learning_rate": 2.4808988795210084e-06, "loss": 2.4526, "step": 5727 }, { "epoch": 0.69, "learning_rate": 2.479164845333881e-06, "loss": 2.7242, "step": 5728 }, { "epoch": 0.69, "learning_rate": 2.477431217577448e-06, "loss": 2.4699, "step": 5729 }, { "epoch": 0.69, "learning_rate": 2.4756979965312262e-06, "loss": 2.4682, "step": 5730 }, { "epoch": 0.69, "learning_rate": 2.4739651824746557e-06, "loss": 2.6249, "step": 5731 }, { "epoch": 0.69, "learning_rate": 2.472232775687119e-06, "loss": 2.5425, "step": 5732 }, { "epoch": 0.69, "learning_rate": 2.4705007764479256e-06, "loss": 2.7044, "step": 5733 }, { "epoch": 0.69, "learning_rate": 2.468769185036326e-06, "loss": 2.4582, "step": 5734 }, { "epoch": 0.69, "learning_rate": 2.467038001731503e-06, "loss": 2.5087, "step": 5735 }, { "epoch": 0.69, "learning_rate": 2.46530722681257e-06, "loss": 2.4683, "step": 5736 }, { "epoch": 0.69, "learning_rate": 2.463576860558581e-06, "loss": 2.4651, "step": 5737 }, { "epoch": 0.69, "learning_rate": 2.4618469032485164e-06, "loss": 2.4172, "step": 5738 }, { "epoch": 0.69, "learning_rate": 2.4601173551612966e-06, "loss": 2.5539, "step": 5739 }, { "epoch": 0.69, "learning_rate": 2.4583882165757766e-06, "loss": 2.4726, "step": 5740 }, { "epoch": 0.69, "learning_rate": 2.456659487770737e-06, "loss": 2.3692, "step": 5741 }, { "epoch": 0.69, "learning_rate": 2.454931169024906e-06, "loss": 2.3792, "step": 5742 }, { "epoch": 0.69, "learning_rate": 2.453203260616932e-06, "loss": 2.5887, "step": 5743 }, { "epoch": 0.69, "learning_rate": 2.4514757628254075e-06, "loss": 2.3372, "step": 5744 }, { "epoch": 0.69, "learning_rate": 2.44974867592885e-06, "loss": 2.2937, "step": 5745 }, { "epoch": 0.69, "learning_rate": 2.4480220002057188e-06, "loss": 2.5421, "step": 5746 }, { "epoch": 0.69, "learning_rate": 2.446295735934403e-06, "loss": 2.6029, "step": 5747 }, { "epoch": 0.69, "learning_rate": 2.4445698833932236e-06, "loss": 2.517, "step": 5748 }, { "epoch": 0.69, "learning_rate": 2.442844442860441e-06, "loss": 2.5806, "step": 5749 }, { "epoch": 0.69, "learning_rate": 2.441119414614241e-06, "loss": 2.5828, "step": 5750 }, { "epoch": 0.69, "learning_rate": 2.439394798932749e-06, "loss": 2.3056, "step": 5751 }, { "epoch": 0.69, "learning_rate": 2.4376705960940245e-06, "loss": 2.4688, "step": 5752 }, { "epoch": 0.69, "learning_rate": 2.435946806376057e-06, "loss": 2.4399, "step": 5753 }, { "epoch": 0.69, "learning_rate": 2.434223430056771e-06, "loss": 2.5264, "step": 5754 }, { "epoch": 0.69, "learning_rate": 2.4325004674140235e-06, "loss": 2.5655, "step": 5755 }, { "epoch": 0.69, "learning_rate": 2.4307779187256064e-06, "loss": 2.5325, "step": 5756 }, { "epoch": 0.69, "learning_rate": 2.4290557842692416e-06, "loss": 2.6505, "step": 5757 }, { "epoch": 0.69, "learning_rate": 2.4273340643225874e-06, "loss": 2.4826, "step": 5758 }, { "epoch": 0.69, "learning_rate": 2.4256127591632363e-06, "loss": 2.6069, "step": 5759 }, { "epoch": 0.69, "learning_rate": 2.4238918690687086e-06, "loss": 2.5471, "step": 5760 }, { "epoch": 0.69, "learning_rate": 2.4221713943164643e-06, "loss": 2.51, "step": 5761 }, { "epoch": 0.69, "learning_rate": 2.4204513351838897e-06, "loss": 2.3914, "step": 5762 }, { "epoch": 0.69, "learning_rate": 2.418731691948309e-06, "loss": 2.3416, "step": 5763 }, { "epoch": 0.69, "learning_rate": 2.417012464886978e-06, "loss": 2.6103, "step": 5764 }, { "epoch": 0.69, "learning_rate": 2.415293654277086e-06, "loss": 2.5468, "step": 5765 }, { "epoch": 0.69, "learning_rate": 2.413575260395755e-06, "loss": 2.6844, "step": 5766 }, { "epoch": 0.69, "learning_rate": 2.411857283520036e-06, "loss": 2.6653, "step": 5767 }, { "epoch": 0.69, "learning_rate": 2.4101397239269202e-06, "loss": 2.5732, "step": 5768 }, { "epoch": 0.69, "learning_rate": 2.408422581893323e-06, "loss": 2.5474, "step": 5769 }, { "epoch": 0.69, "learning_rate": 2.406705857696099e-06, "loss": 2.507, "step": 5770 }, { "epoch": 0.69, "learning_rate": 2.404989551612035e-06, "loss": 2.7097, "step": 5771 }, { "epoch": 0.69, "learning_rate": 2.4032736639178443e-06, "loss": 2.7728, "step": 5772 }, { "epoch": 0.69, "learning_rate": 2.401558194890182e-06, "loss": 2.6011, "step": 5773 }, { "epoch": 0.69, "learning_rate": 2.3998431448056237e-06, "loss": 2.2879, "step": 5774 }, { "epoch": 0.69, "learning_rate": 2.3981285139406927e-06, "loss": 2.4575, "step": 5775 }, { "epoch": 0.69, "learning_rate": 2.3964143025718316e-06, "loss": 2.4089, "step": 5776 }, { "epoch": 0.69, "learning_rate": 2.394700510975421e-06, "loss": 2.4577, "step": 5777 }, { "epoch": 0.69, "learning_rate": 2.392987139427776e-06, "loss": 2.5017, "step": 5778 }, { "epoch": 0.69, "learning_rate": 2.391274188205136e-06, "loss": 2.524, "step": 5779 }, { "epoch": 0.69, "learning_rate": 2.389561657583681e-06, "loss": 2.5933, "step": 5780 }, { "epoch": 0.69, "learning_rate": 2.3878495478395207e-06, "loss": 2.4295, "step": 5781 }, { "epoch": 0.69, "learning_rate": 2.3861378592486932e-06, "loss": 2.3969, "step": 5782 }, { "epoch": 0.69, "learning_rate": 2.3844265920871753e-06, "loss": 2.6997, "step": 5783 }, { "epoch": 0.69, "learning_rate": 2.3827157466308674e-06, "loss": 2.4229, "step": 5784 }, { "epoch": 0.69, "learning_rate": 2.38100532315561e-06, "loss": 2.5702, "step": 5785 }, { "epoch": 0.7, "learning_rate": 2.3792953219371713e-06, "loss": 2.4664, "step": 5786 }, { "epoch": 0.7, "learning_rate": 2.377585743251253e-06, "loss": 2.6392, "step": 5787 }, { "epoch": 0.7, "learning_rate": 2.3758765873734897e-06, "loss": 2.5587, "step": 5788 }, { "epoch": 0.7, "learning_rate": 2.374167854579442e-06, "loss": 2.554, "step": 5789 }, { "epoch": 0.7, "learning_rate": 2.3724595451446104e-06, "loss": 2.6561, "step": 5790 }, { "epoch": 0.7, "learning_rate": 2.37075165934442e-06, "loss": 2.5094, "step": 5791 }, { "epoch": 0.7, "learning_rate": 2.3690441974542322e-06, "loss": 2.5966, "step": 5792 }, { "epoch": 0.7, "learning_rate": 2.3673371597493412e-06, "loss": 2.4599, "step": 5793 }, { "epoch": 0.7, "learning_rate": 2.365630546504966e-06, "loss": 2.5728, "step": 5794 }, { "epoch": 0.7, "learning_rate": 2.3639243579962646e-06, "loss": 2.6712, "step": 5795 }, { "epoch": 0.7, "learning_rate": 2.3622185944983187e-06, "loss": 2.7006, "step": 5796 }, { "epoch": 0.7, "learning_rate": 2.360513256286153e-06, "loss": 2.3518, "step": 5797 }, { "epoch": 0.7, "learning_rate": 2.358808343634712e-06, "loss": 2.5924, "step": 5798 }, { "epoch": 0.7, "learning_rate": 2.3571038568188783e-06, "loss": 2.5282, "step": 5799 }, { "epoch": 0.7, "learning_rate": 2.355399796113464e-06, "loss": 2.4929, "step": 5800 }, { "epoch": 0.7, "learning_rate": 2.3536961617932103e-06, "loss": 2.2665, "step": 5801 }, { "epoch": 0.7, "learning_rate": 2.351992954132795e-06, "loss": 2.5944, "step": 5802 }, { "epoch": 0.7, "learning_rate": 2.3502901734068206e-06, "loss": 2.5106, "step": 5803 }, { "epoch": 0.7, "learning_rate": 2.3485878198898253e-06, "loss": 2.6461, "step": 5804 }, { "epoch": 0.7, "learning_rate": 2.346885893856279e-06, "loss": 2.4756, "step": 5805 }, { "epoch": 0.7, "learning_rate": 2.3451843955805774e-06, "loss": 2.6545, "step": 5806 }, { "epoch": 0.7, "learning_rate": 2.3434833253370527e-06, "loss": 2.5651, "step": 5807 }, { "epoch": 0.7, "learning_rate": 2.3417826833999657e-06, "loss": 2.5341, "step": 5808 }, { "epoch": 0.7, "learning_rate": 2.3400824700435104e-06, "loss": 2.3091, "step": 5809 }, { "epoch": 0.7, "learning_rate": 2.3383826855418064e-06, "loss": 2.5746, "step": 5810 }, { "epoch": 0.7, "learning_rate": 2.336683330168909e-06, "loss": 2.6376, "step": 5811 }, { "epoch": 0.7, "learning_rate": 2.3349844041988044e-06, "loss": 2.5146, "step": 5812 }, { "epoch": 0.7, "learning_rate": 2.3332859079054054e-06, "loss": 2.5075, "step": 5813 }, { "epoch": 0.7, "learning_rate": 2.3315878415625613e-06, "loss": 2.5967, "step": 5814 }, { "epoch": 0.7, "learning_rate": 2.3298902054440454e-06, "loss": 2.5576, "step": 5815 }, { "epoch": 0.7, "learning_rate": 2.3281929998235664e-06, "loss": 2.4374, "step": 5816 }, { "epoch": 0.7, "learning_rate": 2.326496224974765e-06, "loss": 2.469, "step": 5817 }, { "epoch": 0.7, "learning_rate": 2.3247998811712036e-06, "loss": 2.6438, "step": 5818 }, { "epoch": 0.7, "learning_rate": 2.32310396868639e-06, "loss": 2.5341, "step": 5819 }, { "epoch": 0.7, "learning_rate": 2.3214084877937464e-06, "loss": 2.5484, "step": 5820 }, { "epoch": 0.7, "learning_rate": 2.3197134387666375e-06, "loss": 2.4038, "step": 5821 }, { "epoch": 0.7, "learning_rate": 2.31801882187835e-06, "loss": 2.4635, "step": 5822 }, { "epoch": 0.7, "learning_rate": 2.3163246374021065e-06, "loss": 2.595, "step": 5823 }, { "epoch": 0.7, "learning_rate": 2.3146308856110593e-06, "loss": 2.5702, "step": 5824 }, { "epoch": 0.7, "learning_rate": 2.3129375667782865e-06, "loss": 2.4857, "step": 5825 }, { "epoch": 0.7, "learning_rate": 2.311244681176803e-06, "loss": 2.5409, "step": 5826 }, { "epoch": 0.7, "learning_rate": 2.3095522290795463e-06, "loss": 2.4583, "step": 5827 }, { "epoch": 0.7, "learning_rate": 2.30786021075939e-06, "loss": 2.3971, "step": 5828 }, { "epoch": 0.7, "learning_rate": 2.3061686264891365e-06, "loss": 2.4815, "step": 5829 }, { "epoch": 0.7, "learning_rate": 2.3044774765415172e-06, "loss": 2.4741, "step": 5830 }, { "epoch": 0.7, "learning_rate": 2.3027867611891953e-06, "loss": 2.4398, "step": 5831 }, { "epoch": 0.7, "learning_rate": 2.301096480704759e-06, "loss": 2.4391, "step": 5832 }, { "epoch": 0.7, "learning_rate": 2.299406635360732e-06, "loss": 2.6364, "step": 5833 }, { "epoch": 0.7, "learning_rate": 2.297717225429567e-06, "loss": 2.6577, "step": 5834 }, { "epoch": 0.7, "learning_rate": 2.2960282511836416e-06, "loss": 2.531, "step": 5835 }, { "epoch": 0.7, "learning_rate": 2.294339712895271e-06, "loss": 2.3623, "step": 5836 }, { "epoch": 0.7, "learning_rate": 2.292651610836691e-06, "loss": 2.4875, "step": 5837 }, { "epoch": 0.7, "learning_rate": 2.2909639452800754e-06, "loss": 2.3647, "step": 5838 }, { "epoch": 0.7, "learning_rate": 2.2892767164975244e-06, "loss": 2.5737, "step": 5839 }, { "epoch": 0.7, "learning_rate": 2.287589924761065e-06, "loss": 2.5266, "step": 5840 }, { "epoch": 0.7, "learning_rate": 2.285903570342657e-06, "loss": 2.5632, "step": 5841 }, { "epoch": 0.7, "learning_rate": 2.2842176535141897e-06, "loss": 2.5344, "step": 5842 }, { "epoch": 0.7, "learning_rate": 2.2825321745474833e-06, "loss": 2.3309, "step": 5843 }, { "epoch": 0.7, "learning_rate": 2.28084713371428e-06, "loss": 2.3182, "step": 5844 }, { "epoch": 0.7, "learning_rate": 2.27916253128626e-06, "loss": 2.4997, "step": 5845 }, { "epoch": 0.7, "learning_rate": 2.2774783675350303e-06, "loss": 2.4612, "step": 5846 }, { "epoch": 0.7, "learning_rate": 2.2757946427321233e-06, "loss": 2.5664, "step": 5847 }, { "epoch": 0.7, "learning_rate": 2.2741113571490066e-06, "loss": 2.6133, "step": 5848 }, { "epoch": 0.7, "learning_rate": 2.2724285110570704e-06, "loss": 2.4452, "step": 5849 }, { "epoch": 0.7, "learning_rate": 2.2707461047276395e-06, "loss": 2.5697, "step": 5850 }, { "epoch": 0.7, "learning_rate": 2.269064138431968e-06, "loss": 2.465, "step": 5851 }, { "epoch": 0.7, "learning_rate": 2.2673826124412314e-06, "loss": 2.5376, "step": 5852 }, { "epoch": 0.7, "learning_rate": 2.2657015270265463e-06, "loss": 2.4654, "step": 5853 }, { "epoch": 0.7, "learning_rate": 2.264020882458947e-06, "loss": 2.4883, "step": 5854 }, { "epoch": 0.7, "learning_rate": 2.2623406790094057e-06, "loss": 2.3018, "step": 5855 }, { "epoch": 0.7, "learning_rate": 2.260660916948814e-06, "loss": 2.5183, "step": 5856 }, { "epoch": 0.7, "learning_rate": 2.2589815965480007e-06, "loss": 2.5283, "step": 5857 }, { "epoch": 0.7, "learning_rate": 2.257302718077721e-06, "loss": 2.5654, "step": 5858 }, { "epoch": 0.7, "learning_rate": 2.2556242818086555e-06, "loss": 2.3642, "step": 5859 }, { "epoch": 0.7, "learning_rate": 2.253946288011419e-06, "loss": 2.4153, "step": 5860 }, { "epoch": 0.7, "learning_rate": 2.2522687369565498e-06, "loss": 2.4917, "step": 5861 }, { "epoch": 0.7, "learning_rate": 2.2505916289145176e-06, "loss": 2.2995, "step": 5862 }, { "epoch": 0.7, "learning_rate": 2.2489149641557196e-06, "loss": 2.5851, "step": 5863 }, { "epoch": 0.7, "learning_rate": 2.247238742950483e-06, "loss": 2.5418, "step": 5864 }, { "epoch": 0.7, "learning_rate": 2.2455629655690655e-06, "loss": 2.4183, "step": 5865 }, { "epoch": 0.7, "learning_rate": 2.2438876322816442e-06, "loss": 2.53, "step": 5866 }, { "epoch": 0.7, "learning_rate": 2.242212743358337e-06, "loss": 2.3489, "step": 5867 }, { "epoch": 0.7, "learning_rate": 2.240538299069178e-06, "loss": 2.4744, "step": 5868 }, { "epoch": 0.71, "learning_rate": 2.238864299684139e-06, "loss": 2.3643, "step": 5869 }, { "epoch": 0.71, "learning_rate": 2.2371907454731168e-06, "loss": 2.5134, "step": 5870 }, { "epoch": 0.71, "learning_rate": 2.235517636705934e-06, "loss": 2.4054, "step": 5871 }, { "epoch": 0.71, "learning_rate": 2.233844973652346e-06, "loss": 2.4568, "step": 5872 }, { "epoch": 0.71, "learning_rate": 2.2321727565820313e-06, "loss": 2.6224, "step": 5873 }, { "epoch": 0.71, "learning_rate": 2.2305009857646003e-06, "loss": 2.6461, "step": 5874 }, { "epoch": 0.71, "learning_rate": 2.2288296614695905e-06, "loss": 2.4097, "step": 5875 }, { "epoch": 0.71, "learning_rate": 2.2271587839664673e-06, "loss": 2.3467, "step": 5876 }, { "epoch": 0.71, "learning_rate": 2.225488353524625e-06, "loss": 2.5661, "step": 5877 }, { "epoch": 0.71, "learning_rate": 2.223818370413382e-06, "loss": 2.4322, "step": 5878 }, { "epoch": 0.71, "learning_rate": 2.2221488349019903e-06, "loss": 2.5194, "step": 5879 }, { "epoch": 0.71, "learning_rate": 2.2204797472596233e-06, "loss": 2.5257, "step": 5880 }, { "epoch": 0.71, "learning_rate": 2.218811107755388e-06, "loss": 2.5032, "step": 5881 }, { "epoch": 0.71, "learning_rate": 2.217142916658318e-06, "loss": 2.5394, "step": 5882 }, { "epoch": 0.71, "learning_rate": 2.2154751742373706e-06, "loss": 2.5377, "step": 5883 }, { "epoch": 0.71, "learning_rate": 2.213807880761434e-06, "loss": 2.5006, "step": 5884 }, { "epoch": 0.71, "learning_rate": 2.2121410364993244e-06, "loss": 2.5967, "step": 5885 }, { "epoch": 0.71, "learning_rate": 2.210474641719785e-06, "loss": 2.5582, "step": 5886 }, { "epoch": 0.71, "learning_rate": 2.2088086966914873e-06, "loss": 2.5298, "step": 5887 }, { "epoch": 0.71, "learning_rate": 2.2071432016830257e-06, "loss": 2.4842, "step": 5888 }, { "epoch": 0.71, "learning_rate": 2.2054781569629306e-06, "loss": 2.4738, "step": 5889 }, { "epoch": 0.71, "learning_rate": 2.2038135627996498e-06, "loss": 2.4383, "step": 5890 }, { "epoch": 0.71, "learning_rate": 2.2021494194615655e-06, "loss": 2.5851, "step": 5891 }, { "epoch": 0.71, "learning_rate": 2.2004857272169878e-06, "loss": 2.616, "step": 5892 }, { "epoch": 0.71, "learning_rate": 2.198822486334147e-06, "loss": 2.2778, "step": 5893 }, { "epoch": 0.71, "learning_rate": 2.197159697081208e-06, "loss": 2.5006, "step": 5894 }, { "epoch": 0.71, "learning_rate": 2.195497359726258e-06, "loss": 2.58, "step": 5895 }, { "epoch": 0.71, "learning_rate": 2.1938354745373147e-06, "loss": 2.6181, "step": 5896 }, { "epoch": 0.71, "learning_rate": 2.1921740417823206e-06, "loss": 2.4936, "step": 5897 }, { "epoch": 0.71, "learning_rate": 2.1905130617291474e-06, "loss": 2.5788, "step": 5898 }, { "epoch": 0.71, "learning_rate": 2.1888525346455936e-06, "loss": 2.4094, "step": 5899 }, { "epoch": 0.71, "learning_rate": 2.18719246079938e-06, "loss": 2.5961, "step": 5900 }, { "epoch": 0.71, "learning_rate": 2.1855328404581616e-06, "loss": 2.4909, "step": 5901 }, { "epoch": 0.71, "learning_rate": 2.1838736738895134e-06, "loss": 2.5542, "step": 5902 }, { "epoch": 0.71, "learning_rate": 2.1822149613609415e-06, "loss": 2.4897, "step": 5903 }, { "epoch": 0.71, "learning_rate": 2.1805567031398812e-06, "loss": 2.5184, "step": 5904 }, { "epoch": 0.71, "learning_rate": 2.1788988994936855e-06, "loss": 2.4122, "step": 5905 }, { "epoch": 0.71, "learning_rate": 2.1772415506896447e-06, "loss": 2.5108, "step": 5906 }, { "epoch": 0.71, "learning_rate": 2.175584656994965e-06, "loss": 2.3596, "step": 5907 }, { "epoch": 0.71, "learning_rate": 2.173928218676792e-06, "loss": 2.417, "step": 5908 }, { "epoch": 0.71, "learning_rate": 2.172272236002187e-06, "loss": 2.3193, "step": 5909 }, { "epoch": 0.71, "learning_rate": 2.1706167092381416e-06, "loss": 2.3345, "step": 5910 }, { "epoch": 0.71, "learning_rate": 2.168961638651576e-06, "loss": 2.3646, "step": 5911 }, { "epoch": 0.71, "learning_rate": 2.1673070245093324e-06, "loss": 2.4597, "step": 5912 }, { "epoch": 0.71, "learning_rate": 2.165652867078185e-06, "loss": 2.5869, "step": 5913 }, { "epoch": 0.71, "learning_rate": 2.163999166624828e-06, "loss": 2.7108, "step": 5914 }, { "epoch": 0.71, "learning_rate": 2.1623459234158863e-06, "loss": 2.4202, "step": 5915 }, { "epoch": 0.71, "learning_rate": 2.160693137717912e-06, "loss": 2.3703, "step": 5916 }, { "epoch": 0.71, "learning_rate": 2.159040809797378e-06, "loss": 2.358, "step": 5917 }, { "epoch": 0.71, "learning_rate": 2.157388939920689e-06, "loss": 2.5393, "step": 5918 }, { "epoch": 0.71, "learning_rate": 2.1557375283541726e-06, "loss": 2.5896, "step": 5919 }, { "epoch": 0.71, "learning_rate": 2.154086575364086e-06, "loss": 2.6151, "step": 5920 }, { "epoch": 0.71, "learning_rate": 2.152436081216607e-06, "loss": 2.5488, "step": 5921 }, { "epoch": 0.71, "learning_rate": 2.1507860461778424e-06, "loss": 2.4761, "step": 5922 }, { "epoch": 0.71, "learning_rate": 2.149136470513829e-06, "loss": 2.4714, "step": 5923 }, { "epoch": 0.71, "learning_rate": 2.1474873544905204e-06, "loss": 2.5399, "step": 5924 }, { "epoch": 0.71, "learning_rate": 2.145838698373806e-06, "loss": 2.4887, "step": 5925 }, { "epoch": 0.71, "learning_rate": 2.1441905024294917e-06, "loss": 2.502, "step": 5926 }, { "epoch": 0.71, "learning_rate": 2.142542766923317e-06, "loss": 2.4718, "step": 5927 }, { "epoch": 0.71, "learning_rate": 2.1408954921209435e-06, "loss": 2.4556, "step": 5928 }, { "epoch": 0.71, "learning_rate": 2.1392486782879573e-06, "loss": 2.5141, "step": 5929 }, { "epoch": 0.71, "learning_rate": 2.137602325689873e-06, "loss": 2.4717, "step": 5930 }, { "epoch": 0.71, "learning_rate": 2.1359564345921304e-06, "loss": 2.5349, "step": 5931 }, { "epoch": 0.71, "learning_rate": 2.134311005260093e-06, "loss": 2.4174, "step": 5932 }, { "epoch": 0.71, "learning_rate": 2.1326660379590538e-06, "loss": 2.5451, "step": 5933 }, { "epoch": 0.71, "learning_rate": 2.1310215329542243e-06, "loss": 2.5673, "step": 5934 }, { "epoch": 0.71, "learning_rate": 2.1293774905107496e-06, "loss": 2.439, "step": 5935 }, { "epoch": 0.71, "learning_rate": 2.127733910893693e-06, "loss": 2.4341, "step": 5936 }, { "epoch": 0.71, "learning_rate": 2.1260907943680482e-06, "loss": 2.522, "step": 5937 }, { "epoch": 0.71, "learning_rate": 2.124448141198734e-06, "loss": 2.3849, "step": 5938 }, { "epoch": 0.71, "learning_rate": 2.1228059516505894e-06, "loss": 2.3982, "step": 5939 }, { "epoch": 0.71, "learning_rate": 2.121164225988387e-06, "loss": 2.4897, "step": 5940 }, { "epoch": 0.71, "learning_rate": 2.1195229644768136e-06, "loss": 2.4818, "step": 5941 }, { "epoch": 0.71, "learning_rate": 2.1178821673804943e-06, "loss": 2.434, "step": 5942 }, { "epoch": 0.71, "learning_rate": 2.116241834963968e-06, "loss": 2.5565, "step": 5943 }, { "epoch": 0.71, "learning_rate": 2.1146019674917044e-06, "loss": 2.6814, "step": 5944 }, { "epoch": 0.71, "learning_rate": 2.1129625652280987e-06, "loss": 2.5577, "step": 5945 }, { "epoch": 0.71, "learning_rate": 2.1113236284374673e-06, "loss": 2.5071, "step": 5946 }, { "epoch": 0.71, "learning_rate": 2.109685157384055e-06, "loss": 2.54, "step": 5947 }, { "epoch": 0.71, "learning_rate": 2.108047152332028e-06, "loss": 2.4774, "step": 5948 }, { "epoch": 0.71, "learning_rate": 2.106409613545481e-06, "loss": 2.4907, "step": 5949 }, { "epoch": 0.71, "learning_rate": 2.104772541288434e-06, "loss": 2.6219, "step": 5950 }, { "epoch": 0.71, "learning_rate": 2.103135935824826e-06, "loss": 2.6793, "step": 5951 }, { "epoch": 0.72, "learning_rate": 2.101499797418527e-06, "loss": 2.5391, "step": 5952 }, { "epoch": 0.72, "learning_rate": 2.0998641263333287e-06, "loss": 2.3052, "step": 5953 }, { "epoch": 0.72, "learning_rate": 2.0982289228329495e-06, "loss": 2.3836, "step": 5954 }, { "epoch": 0.72, "learning_rate": 2.096594187181028e-06, "loss": 2.5218, "step": 5955 }, { "epoch": 0.72, "learning_rate": 2.0949599196411326e-06, "loss": 2.4734, "step": 5956 }, { "epoch": 0.72, "learning_rate": 2.093326120476754e-06, "loss": 2.4891, "step": 5957 }, { "epoch": 0.72, "learning_rate": 2.0916927899513055e-06, "loss": 2.3335, "step": 5958 }, { "epoch": 0.72, "learning_rate": 2.0900599283281296e-06, "loss": 2.3977, "step": 5959 }, { "epoch": 0.72, "learning_rate": 2.0884275358704863e-06, "loss": 2.4655, "step": 5960 }, { "epoch": 0.72, "learning_rate": 2.086795612841567e-06, "loss": 2.465, "step": 5961 }, { "epoch": 0.72, "learning_rate": 2.085164159504484e-06, "loss": 2.6598, "step": 5962 }, { "epoch": 0.72, "learning_rate": 2.083533176122271e-06, "loss": 2.3651, "step": 5963 }, { "epoch": 0.72, "learning_rate": 2.081902662957895e-06, "loss": 2.4563, "step": 5964 }, { "epoch": 0.72, "learning_rate": 2.0802726202742375e-06, "loss": 2.5568, "step": 5965 }, { "epoch": 0.72, "learning_rate": 2.078643048334109e-06, "loss": 2.5168, "step": 5966 }, { "epoch": 0.72, "learning_rate": 2.0770139474002413e-06, "loss": 2.6272, "step": 5967 }, { "epoch": 0.72, "learning_rate": 2.0753853177352945e-06, "loss": 2.5647, "step": 5968 }, { "epoch": 0.72, "learning_rate": 2.07375715960185e-06, "loss": 2.5741, "step": 5969 }, { "epoch": 0.72, "learning_rate": 2.0721294732624113e-06, "loss": 2.4754, "step": 5970 }, { "epoch": 0.72, "learning_rate": 2.070502258979411e-06, "loss": 2.5973, "step": 5971 }, { "epoch": 0.72, "learning_rate": 2.0688755170152e-06, "loss": 2.5362, "step": 5972 }, { "epoch": 0.72, "learning_rate": 2.0672492476320555e-06, "loss": 2.7385, "step": 5973 }, { "epoch": 0.72, "learning_rate": 2.06562345109218e-06, "loss": 2.445, "step": 5974 }, { "epoch": 0.72, "learning_rate": 2.063998127657698e-06, "loss": 2.5785, "step": 5975 }, { "epoch": 0.72, "learning_rate": 2.06237327759066e-06, "loss": 2.4941, "step": 5976 }, { "epoch": 0.72, "learning_rate": 2.0607489011530346e-06, "loss": 2.5725, "step": 5977 }, { "epoch": 0.72, "learning_rate": 2.0591249986067214e-06, "loss": 2.5758, "step": 5978 }, { "epoch": 0.72, "learning_rate": 2.0575015702135363e-06, "loss": 2.4613, "step": 5979 }, { "epoch": 0.72, "learning_rate": 2.0558786162352245e-06, "loss": 2.731, "step": 5980 }, { "epoch": 0.72, "learning_rate": 2.054256136933454e-06, "loss": 2.5043, "step": 5981 }, { "epoch": 0.72, "learning_rate": 2.0526341325698107e-06, "loss": 2.4693, "step": 5982 }, { "epoch": 0.72, "learning_rate": 2.051012603405811e-06, "loss": 2.4341, "step": 5983 }, { "epoch": 0.72, "learning_rate": 2.0493915497028933e-06, "loss": 2.5523, "step": 5984 }, { "epoch": 0.72, "learning_rate": 2.0477709717224115e-06, "loss": 2.5866, "step": 5985 }, { "epoch": 0.72, "learning_rate": 2.0461508697256573e-06, "loss": 2.567, "step": 5986 }, { "epoch": 0.72, "learning_rate": 2.0445312439738313e-06, "loss": 2.4185, "step": 5987 }, { "epoch": 0.72, "learning_rate": 2.042912094728068e-06, "loss": 2.589, "step": 5988 }, { "epoch": 0.72, "learning_rate": 2.0412934222494155e-06, "loss": 2.5847, "step": 5989 }, { "epoch": 0.72, "learning_rate": 2.039675226798854e-06, "loss": 2.7594, "step": 5990 }, { "epoch": 0.72, "learning_rate": 2.0380575086372826e-06, "loss": 2.4887, "step": 5991 }, { "epoch": 0.72, "learning_rate": 2.036440268025522e-06, "loss": 2.3989, "step": 5992 }, { "epoch": 0.72, "learning_rate": 2.0348235052243193e-06, "loss": 2.7113, "step": 5993 }, { "epoch": 0.72, "learning_rate": 2.0332072204943405e-06, "loss": 2.5177, "step": 5994 }, { "epoch": 0.72, "learning_rate": 2.0315914140961786e-06, "loss": 2.5275, "step": 5995 }, { "epoch": 0.72, "learning_rate": 2.029976086290347e-06, "loss": 2.5828, "step": 5996 }, { "epoch": 0.72, "learning_rate": 2.028361237337284e-06, "loss": 2.6801, "step": 5997 }, { "epoch": 0.72, "learning_rate": 2.02674686749735e-06, "loss": 2.5148, "step": 5998 }, { "epoch": 0.72, "learning_rate": 2.025132977030825e-06, "loss": 2.625, "step": 5999 }, { "epoch": 0.72, "learning_rate": 2.0235195661979175e-06, "loss": 2.5928, "step": 6000 }, { "epoch": 0.72, "learning_rate": 2.0219066352587513e-06, "loss": 2.4292, "step": 6001 }, { "epoch": 0.72, "learning_rate": 2.0202941844733792e-06, "loss": 2.5492, "step": 6002 }, { "epoch": 0.72, "learning_rate": 2.0186822141017764e-06, "loss": 2.4903, "step": 6003 }, { "epoch": 0.72, "learning_rate": 2.017070724403835e-06, "loss": 2.631, "step": 6004 }, { "epoch": 0.72, "learning_rate": 2.015459715639376e-06, "loss": 2.6201, "step": 6005 }, { "epoch": 0.72, "learning_rate": 2.013849188068138e-06, "loss": 2.5436, "step": 6006 }, { "epoch": 0.72, "learning_rate": 2.0122391419497844e-06, "loss": 2.4297, "step": 6007 }, { "epoch": 0.72, "learning_rate": 2.0106295775439018e-06, "loss": 2.5309, "step": 6008 }, { "epoch": 0.72, "learning_rate": 2.0090204951099966e-06, "loss": 2.2816, "step": 6009 }, { "epoch": 0.72, "learning_rate": 2.0074118949075024e-06, "loss": 2.5731, "step": 6010 }, { "epoch": 0.72, "learning_rate": 2.0058037771957666e-06, "loss": 2.4621, "step": 6011 }, { "epoch": 0.72, "learning_rate": 2.004196142234068e-06, "loss": 2.5809, "step": 6012 }, { "epoch": 0.72, "learning_rate": 2.0025889902815993e-06, "loss": 2.3612, "step": 6013 }, { "epoch": 0.72, "learning_rate": 2.0009823215974815e-06, "loss": 2.5492, "step": 6014 }, { "epoch": 0.72, "learning_rate": 1.9993761364407575e-06, "loss": 2.5757, "step": 6015 }, { "epoch": 0.72, "learning_rate": 1.9977704350703865e-06, "loss": 2.5392, "step": 6016 }, { "epoch": 0.72, "learning_rate": 1.996165217745257e-06, "loss": 2.6633, "step": 6017 }, { "epoch": 0.72, "learning_rate": 1.9945604847241697e-06, "loss": 2.5084, "step": 6018 }, { "epoch": 0.72, "learning_rate": 1.9929562362658623e-06, "loss": 2.585, "step": 6019 }, { "epoch": 0.72, "learning_rate": 1.9913524726289784e-06, "loss": 2.6002, "step": 6020 }, { "epoch": 0.72, "learning_rate": 1.9897491940720936e-06, "loss": 2.531, "step": 6021 }, { "epoch": 0.72, "learning_rate": 1.988146400853704e-06, "loss": 2.3933, "step": 6022 }, { "epoch": 0.72, "learning_rate": 1.986544093232222e-06, "loss": 2.582, "step": 6023 }, { "epoch": 0.72, "learning_rate": 1.9849422714659875e-06, "loss": 2.5339, "step": 6024 }, { "epoch": 0.72, "learning_rate": 1.9833409358132584e-06, "loss": 2.5074, "step": 6025 }, { "epoch": 0.72, "learning_rate": 1.9817400865322166e-06, "loss": 2.48, "step": 6026 }, { "epoch": 0.72, "learning_rate": 1.9801397238809665e-06, "loss": 2.3314, "step": 6027 }, { "epoch": 0.72, "learning_rate": 1.9785398481175295e-06, "loss": 2.5114, "step": 6028 }, { "epoch": 0.72, "learning_rate": 1.976940459499854e-06, "loss": 2.3695, "step": 6029 }, { "epoch": 0.72, "learning_rate": 1.9753415582858026e-06, "loss": 2.3009, "step": 6030 }, { "epoch": 0.72, "learning_rate": 1.9737431447331706e-06, "loss": 2.6007, "step": 6031 }, { "epoch": 0.72, "learning_rate": 1.972145219099662e-06, "loss": 2.4165, "step": 6032 }, { "epoch": 0.72, "learning_rate": 1.9705477816429107e-06, "loss": 2.5151, "step": 6033 }, { "epoch": 0.72, "learning_rate": 1.9689508326204716e-06, "loss": 2.5491, "step": 6034 }, { "epoch": 0.73, "learning_rate": 1.9673543722898137e-06, "loss": 2.4833, "step": 6035 }, { "epoch": 0.73, "learning_rate": 1.965758400908334e-06, "loss": 2.5457, "step": 6036 }, { "epoch": 0.73, "learning_rate": 1.9641629187333515e-06, "loss": 2.6067, "step": 6037 }, { "epoch": 0.73, "learning_rate": 1.962567926022099e-06, "loss": 2.5089, "step": 6038 }, { "epoch": 0.73, "learning_rate": 1.960973423031739e-06, "loss": 2.4966, "step": 6039 }, { "epoch": 0.73, "learning_rate": 1.9593794100193474e-06, "loss": 2.3741, "step": 6040 }, { "epoch": 0.73, "learning_rate": 1.957785887241926e-06, "loss": 2.3839, "step": 6041 }, { "epoch": 0.73, "learning_rate": 1.956192854956397e-06, "loss": 2.4711, "step": 6042 }, { "epoch": 0.73, "learning_rate": 1.954600313419602e-06, "loss": 2.4952, "step": 6043 }, { "epoch": 0.73, "learning_rate": 1.9530082628883058e-06, "loss": 2.376, "step": 6044 }, { "epoch": 0.73, "learning_rate": 1.95141670361919e-06, "loss": 2.4977, "step": 6045 }, { "epoch": 0.73, "learning_rate": 1.949825635868862e-06, "loss": 2.564, "step": 6046 }, { "epoch": 0.73, "learning_rate": 1.9482350598938447e-06, "loss": 2.4423, "step": 6047 }, { "epoch": 0.73, "learning_rate": 1.9466449759505856e-06, "loss": 2.5614, "step": 6048 }, { "epoch": 0.73, "learning_rate": 1.9450553842954533e-06, "loss": 2.6503, "step": 6049 }, { "epoch": 0.73, "learning_rate": 1.9434662851847325e-06, "loss": 2.4795, "step": 6050 }, { "epoch": 0.73, "learning_rate": 1.9418776788746345e-06, "loss": 2.5971, "step": 6051 }, { "epoch": 0.73, "learning_rate": 1.9402895656212834e-06, "loss": 2.5378, "step": 6052 }, { "epoch": 0.73, "learning_rate": 1.938701945680735e-06, "loss": 2.5061, "step": 6053 }, { "epoch": 0.73, "learning_rate": 1.937114819308953e-06, "loss": 2.654, "step": 6054 }, { "epoch": 0.73, "learning_rate": 1.9355281867618306e-06, "loss": 2.5217, "step": 6055 }, { "epoch": 0.73, "learning_rate": 1.9339420482951794e-06, "loss": 2.4749, "step": 6056 }, { "epoch": 0.73, "learning_rate": 1.932356404164727e-06, "loss": 2.3838, "step": 6057 }, { "epoch": 0.73, "learning_rate": 1.930771254626128e-06, "loss": 2.5949, "step": 6058 }, { "epoch": 0.73, "learning_rate": 1.92918659993495e-06, "loss": 2.5186, "step": 6059 }, { "epoch": 0.73, "learning_rate": 1.927602440346687e-06, "loss": 2.389, "step": 6060 }, { "epoch": 0.73, "learning_rate": 1.9260187761167527e-06, "loss": 2.6009, "step": 6061 }, { "epoch": 0.73, "learning_rate": 1.9244356075004743e-06, "loss": 2.4803, "step": 6062 }, { "epoch": 0.73, "learning_rate": 1.9228529347531067e-06, "loss": 2.5759, "step": 6063 }, { "epoch": 0.73, "learning_rate": 1.921270758129822e-06, "loss": 2.4875, "step": 6064 }, { "epoch": 0.73, "learning_rate": 1.9196890778857137e-06, "loss": 2.4662, "step": 6065 }, { "epoch": 0.73, "learning_rate": 1.91810789427579e-06, "loss": 2.5986, "step": 6066 }, { "epoch": 0.73, "learning_rate": 1.9165272075549856e-06, "loss": 2.4909, "step": 6067 }, { "epoch": 0.73, "learning_rate": 1.914947017978153e-06, "loss": 2.6352, "step": 6068 }, { "epoch": 0.73, "learning_rate": 1.9133673258000617e-06, "loss": 2.5849, "step": 6069 }, { "epoch": 0.73, "learning_rate": 1.911788131275406e-06, "loss": 2.5037, "step": 6070 }, { "epoch": 0.73, "learning_rate": 1.9102094346587935e-06, "loss": 2.5859, "step": 6071 }, { "epoch": 0.73, "learning_rate": 1.9086312362047576e-06, "loss": 2.6319, "step": 6072 }, { "epoch": 0.73, "learning_rate": 1.9070535361677506e-06, "loss": 2.5948, "step": 6073 }, { "epoch": 0.73, "learning_rate": 1.9054763348021372e-06, "loss": 2.6972, "step": 6074 }, { "epoch": 0.73, "learning_rate": 1.903899632362215e-06, "loss": 2.5334, "step": 6075 }, { "epoch": 0.73, "learning_rate": 1.9023234291021875e-06, "loss": 2.3813, "step": 6076 }, { "epoch": 0.73, "learning_rate": 1.9007477252761875e-06, "loss": 2.4932, "step": 6077 }, { "epoch": 0.73, "learning_rate": 1.89917252113826e-06, "loss": 2.5408, "step": 6078 }, { "epoch": 0.73, "learning_rate": 1.8975978169423754e-06, "loss": 2.5393, "step": 6079 }, { "epoch": 0.73, "learning_rate": 1.896023612942422e-06, "loss": 2.6058, "step": 6080 }, { "epoch": 0.73, "learning_rate": 1.894449909392203e-06, "loss": 2.4534, "step": 6081 }, { "epoch": 0.73, "learning_rate": 1.8928767065454478e-06, "loss": 2.6178, "step": 6082 }, { "epoch": 0.73, "learning_rate": 1.891304004655799e-06, "loss": 2.5869, "step": 6083 }, { "epoch": 0.73, "learning_rate": 1.889731803976822e-06, "loss": 2.6212, "step": 6084 }, { "epoch": 0.73, "learning_rate": 1.8881601047620013e-06, "loss": 2.4643, "step": 6085 }, { "epoch": 0.73, "learning_rate": 1.8865889072647386e-06, "loss": 2.5527, "step": 6086 }, { "epoch": 0.73, "learning_rate": 1.8850182117383587e-06, "loss": 2.434, "step": 6087 }, { "epoch": 0.73, "learning_rate": 1.8834480184360987e-06, "loss": 2.4418, "step": 6088 }, { "epoch": 0.73, "learning_rate": 1.8818783276111203e-06, "loss": 2.6916, "step": 6089 }, { "epoch": 0.73, "learning_rate": 1.8803091395165046e-06, "loss": 2.3544, "step": 6090 }, { "epoch": 0.73, "learning_rate": 1.8787404544052457e-06, "loss": 2.5289, "step": 6091 }, { "epoch": 0.73, "learning_rate": 1.8771722725302644e-06, "loss": 2.59, "step": 6092 }, { "epoch": 0.73, "learning_rate": 1.8756045941443923e-06, "loss": 2.4017, "step": 6093 }, { "epoch": 0.73, "learning_rate": 1.8740374195003863e-06, "loss": 2.4897, "step": 6094 }, { "epoch": 0.73, "learning_rate": 1.8724707488509213e-06, "loss": 2.4571, "step": 6095 }, { "epoch": 0.73, "learning_rate": 1.8709045824485845e-06, "loss": 2.6449, "step": 6096 }, { "epoch": 0.73, "learning_rate": 1.8693389205458928e-06, "loss": 2.4249, "step": 6097 }, { "epoch": 0.73, "learning_rate": 1.8677737633952715e-06, "loss": 2.4835, "step": 6098 }, { "epoch": 0.73, "learning_rate": 1.8662091112490717e-06, "loss": 2.343, "step": 6099 }, { "epoch": 0.73, "learning_rate": 1.8646449643595565e-06, "loss": 2.5574, "step": 6100 }, { "epoch": 0.73, "learning_rate": 1.863081322978913e-06, "loss": 2.5299, "step": 6101 }, { "epoch": 0.73, "learning_rate": 1.8615181873592465e-06, "loss": 2.478, "step": 6102 }, { "epoch": 0.73, "learning_rate": 1.8599555577525752e-06, "loss": 2.6043, "step": 6103 }, { "epoch": 0.73, "learning_rate": 1.8583934344108446e-06, "loss": 2.3894, "step": 6104 }, { "epoch": 0.73, "learning_rate": 1.8568318175859084e-06, "loss": 2.4664, "step": 6105 }, { "epoch": 0.73, "learning_rate": 1.8552707075295468e-06, "loss": 2.364, "step": 6106 }, { "epoch": 0.73, "learning_rate": 1.8537101044934553e-06, "loss": 2.5101, "step": 6107 }, { "epoch": 0.73, "learning_rate": 1.8521500087292466e-06, "loss": 2.5445, "step": 6108 }, { "epoch": 0.73, "learning_rate": 1.8505904204884563e-06, "loss": 2.6182, "step": 6109 }, { "epoch": 0.73, "learning_rate": 1.8490313400225296e-06, "loss": 2.5294, "step": 6110 }, { "epoch": 0.73, "learning_rate": 1.8474727675828386e-06, "loss": 2.532, "step": 6111 }, { "epoch": 0.73, "learning_rate": 1.8459147034206671e-06, "loss": 2.5182, "step": 6112 }, { "epoch": 0.73, "learning_rate": 1.8443571477872207e-06, "loss": 2.5269, "step": 6113 }, { "epoch": 0.73, "learning_rate": 1.8428001009336233e-06, "loss": 2.5126, "step": 6114 }, { "epoch": 0.73, "learning_rate": 1.8412435631109126e-06, "loss": 2.3535, "step": 6115 }, { "epoch": 0.73, "learning_rate": 1.8396875345700498e-06, "loss": 2.6907, "step": 6116 }, { "epoch": 0.73, "learning_rate": 1.8381320155619088e-06, "loss": 2.4706, "step": 6117 }, { "epoch": 0.73, "learning_rate": 1.8365770063372844e-06, "loss": 2.4135, "step": 6118 }, { "epoch": 0.74, "learning_rate": 1.8350225071468887e-06, "loss": 2.5322, "step": 6119 }, { "epoch": 0.74, "learning_rate": 1.833468518241352e-06, "loss": 2.4684, "step": 6120 }, { "epoch": 0.74, "learning_rate": 1.8319150398712227e-06, "loss": 2.4512, "step": 6121 }, { "epoch": 0.74, "learning_rate": 1.830362072286963e-06, "loss": 2.5191, "step": 6122 }, { "epoch": 0.74, "learning_rate": 1.828809615738959e-06, "loss": 2.6897, "step": 6123 }, { "epoch": 0.74, "learning_rate": 1.8272576704775074e-06, "loss": 2.5788, "step": 6124 }, { "epoch": 0.74, "learning_rate": 1.8257062367528284e-06, "loss": 2.4151, "step": 6125 }, { "epoch": 0.74, "learning_rate": 1.8241553148150587e-06, "loss": 2.5673, "step": 6126 }, { "epoch": 0.74, "learning_rate": 1.8226049049142481e-06, "loss": 2.5084, "step": 6127 }, { "epoch": 0.74, "learning_rate": 1.8210550073003701e-06, "loss": 2.4797, "step": 6128 }, { "epoch": 0.74, "learning_rate": 1.8195056222233098e-06, "loss": 2.4562, "step": 6129 }, { "epoch": 0.74, "learning_rate": 1.817956749932873e-06, "loss": 2.459, "step": 6130 }, { "epoch": 0.74, "learning_rate": 1.8164083906787832e-06, "loss": 2.7372, "step": 6131 }, { "epoch": 0.74, "learning_rate": 1.81486054471068e-06, "loss": 2.4502, "step": 6132 }, { "epoch": 0.74, "learning_rate": 1.813313212278121e-06, "loss": 2.6849, "step": 6133 }, { "epoch": 0.74, "learning_rate": 1.8117663936305785e-06, "loss": 2.4881, "step": 6134 }, { "epoch": 0.74, "learning_rate": 1.8102200890174465e-06, "loss": 2.6765, "step": 6135 }, { "epoch": 0.74, "learning_rate": 1.8086742986880308e-06, "loss": 2.4205, "step": 6136 }, { "epoch": 0.74, "learning_rate": 1.8071290228915577e-06, "loss": 2.3796, "step": 6137 }, { "epoch": 0.74, "learning_rate": 1.8055842618771724e-06, "loss": 2.453, "step": 6138 }, { "epoch": 0.74, "learning_rate": 1.8040400158939302e-06, "loss": 2.4089, "step": 6139 }, { "epoch": 0.74, "learning_rate": 1.8024962851908106e-06, "loss": 2.5198, "step": 6140 }, { "epoch": 0.74, "learning_rate": 1.800953070016706e-06, "loss": 2.4407, "step": 6141 }, { "epoch": 0.74, "learning_rate": 1.799410370620428e-06, "loss": 2.6879, "step": 6142 }, { "epoch": 0.74, "learning_rate": 1.7978681872507043e-06, "loss": 2.5456, "step": 6143 }, { "epoch": 0.74, "learning_rate": 1.7963265201561763e-06, "loss": 2.5073, "step": 6144 }, { "epoch": 0.74, "learning_rate": 1.7947853695854083e-06, "loss": 2.5424, "step": 6145 }, { "epoch": 0.74, "learning_rate": 1.7932447357868737e-06, "loss": 2.6657, "step": 6146 }, { "epoch": 0.74, "learning_rate": 1.7917046190089693e-06, "loss": 2.6421, "step": 6147 }, { "epoch": 0.74, "learning_rate": 1.790165019500007e-06, "loss": 2.4667, "step": 6148 }, { "epoch": 0.74, "learning_rate": 1.788625937508211e-06, "loss": 2.5344, "step": 6149 }, { "epoch": 0.74, "learning_rate": 1.787087373281729e-06, "loss": 2.4343, "step": 6150 }, { "epoch": 0.74, "learning_rate": 1.7855493270686181e-06, "loss": 2.4672, "step": 6151 }, { "epoch": 0.74, "learning_rate": 1.7840117991168566e-06, "loss": 2.455, "step": 6152 }, { "epoch": 0.74, "learning_rate": 1.7824747896743384e-06, "loss": 2.4995, "step": 6153 }, { "epoch": 0.74, "learning_rate": 1.780938298988873e-06, "loss": 2.5538, "step": 6154 }, { "epoch": 0.74, "learning_rate": 1.779402327308189e-06, "loss": 2.5026, "step": 6155 }, { "epoch": 0.74, "learning_rate": 1.7778668748799244e-06, "loss": 2.4977, "step": 6156 }, { "epoch": 0.74, "learning_rate": 1.7763319419516428e-06, "loss": 2.5427, "step": 6157 }, { "epoch": 0.74, "learning_rate": 1.7747975287708147e-06, "loss": 2.5118, "step": 6158 }, { "epoch": 0.74, "learning_rate": 1.7732636355848336e-06, "loss": 2.7009, "step": 6159 }, { "epoch": 0.74, "learning_rate": 1.7717302626410087e-06, "loss": 2.497, "step": 6160 }, { "epoch": 0.74, "learning_rate": 1.7701974101865598e-06, "loss": 2.5041, "step": 6161 }, { "epoch": 0.74, "learning_rate": 1.768665078468631e-06, "loss": 2.6949, "step": 6162 }, { "epoch": 0.74, "learning_rate": 1.7671332677342711e-06, "loss": 2.3949, "step": 6163 }, { "epoch": 0.74, "learning_rate": 1.7656019782304602e-06, "loss": 2.6839, "step": 6164 }, { "epoch": 0.74, "learning_rate": 1.7640712102040802e-06, "loss": 2.5522, "step": 6165 }, { "epoch": 0.74, "learning_rate": 1.7625409639019358e-06, "loss": 2.4793, "step": 6166 }, { "epoch": 0.74, "learning_rate": 1.7610112395707496e-06, "loss": 2.4227, "step": 6167 }, { "epoch": 0.74, "learning_rate": 1.759482037457152e-06, "loss": 2.5532, "step": 6168 }, { "epoch": 0.74, "learning_rate": 1.7579533578076985e-06, "loss": 2.5204, "step": 6169 }, { "epoch": 0.74, "learning_rate": 1.7564252008688514e-06, "loss": 2.5635, "step": 6170 }, { "epoch": 0.74, "learning_rate": 1.7548975668869966e-06, "loss": 2.4454, "step": 6171 }, { "epoch": 0.74, "learning_rate": 1.7533704561084331e-06, "loss": 2.5629, "step": 6172 }, { "epoch": 0.74, "learning_rate": 1.7518438687793715e-06, "loss": 2.4768, "step": 6173 }, { "epoch": 0.74, "learning_rate": 1.750317805145943e-06, "loss": 2.546, "step": 6174 }, { "epoch": 0.74, "learning_rate": 1.7487922654541927e-06, "loss": 2.5994, "step": 6175 }, { "epoch": 0.74, "learning_rate": 1.7472672499500837e-06, "loss": 2.64, "step": 6176 }, { "epoch": 0.74, "learning_rate": 1.7457427588794874e-06, "loss": 2.4444, "step": 6177 }, { "epoch": 0.74, "learning_rate": 1.7442187924881975e-06, "loss": 2.4877, "step": 6178 }, { "epoch": 0.74, "learning_rate": 1.742695351021923e-06, "loss": 2.5095, "step": 6179 }, { "epoch": 0.74, "learning_rate": 1.7411724347262826e-06, "loss": 2.4172, "step": 6180 }, { "epoch": 0.74, "learning_rate": 1.7396500438468172e-06, "loss": 2.344, "step": 6181 }, { "epoch": 0.74, "learning_rate": 1.7381281786289767e-06, "loss": 2.3966, "step": 6182 }, { "epoch": 0.74, "learning_rate": 1.7366068393181307e-06, "loss": 2.4993, "step": 6183 }, { "epoch": 0.74, "learning_rate": 1.7350860261595647e-06, "loss": 2.5481, "step": 6184 }, { "epoch": 0.74, "learning_rate": 1.7335657393984718e-06, "loss": 2.5684, "step": 6185 }, { "epoch": 0.74, "learning_rate": 1.732045979279972e-06, "loss": 2.5723, "step": 6186 }, { "epoch": 0.74, "learning_rate": 1.7305267460490898e-06, "loss": 2.4548, "step": 6187 }, { "epoch": 0.74, "learning_rate": 1.729008039950772e-06, "loss": 2.3987, "step": 6188 }, { "epoch": 0.74, "learning_rate": 1.7274898612298745e-06, "loss": 2.6342, "step": 6189 }, { "epoch": 0.74, "learning_rate": 1.725972210131172e-06, "loss": 2.5457, "step": 6190 }, { "epoch": 0.74, "learning_rate": 1.724455086899356e-06, "loss": 2.6236, "step": 6191 }, { "epoch": 0.74, "learning_rate": 1.722938491779026e-06, "loss": 2.5, "step": 6192 }, { "epoch": 0.74, "learning_rate": 1.721422425014702e-06, "loss": 2.4481, "step": 6193 }, { "epoch": 0.74, "learning_rate": 1.71990688685082e-06, "loss": 2.6013, "step": 6194 }, { "epoch": 0.74, "learning_rate": 1.7183918775317237e-06, "loss": 2.615, "step": 6195 }, { "epoch": 0.74, "learning_rate": 1.7168773973016779e-06, "loss": 2.553, "step": 6196 }, { "epoch": 0.74, "learning_rate": 1.7153634464048602e-06, "loss": 2.4336, "step": 6197 }, { "epoch": 0.74, "learning_rate": 1.7138500250853645e-06, "loss": 2.542, "step": 6198 }, { "epoch": 0.74, "learning_rate": 1.7123371335871946e-06, "loss": 2.6031, "step": 6199 }, { "epoch": 0.74, "learning_rate": 1.7108247721542725e-06, "loss": 2.6543, "step": 6200 }, { "epoch": 0.74, "learning_rate": 1.7093129410304366e-06, "loss": 2.5589, "step": 6201 }, { "epoch": 0.75, "learning_rate": 1.7078016404594338e-06, "loss": 2.3019, "step": 6202 }, { "epoch": 0.75, "learning_rate": 1.7062908706849324e-06, "loss": 2.4995, "step": 6203 }, { "epoch": 0.75, "learning_rate": 1.7047806319505079e-06, "loss": 2.5481, "step": 6204 }, { "epoch": 0.75, "learning_rate": 1.7032709244996559e-06, "loss": 2.724, "step": 6205 }, { "epoch": 0.75, "learning_rate": 1.701761748575786e-06, "loss": 2.6534, "step": 6206 }, { "epoch": 0.75, "learning_rate": 1.7002531044222158e-06, "loss": 2.5079, "step": 6207 }, { "epoch": 0.75, "learning_rate": 1.6987449922821887e-06, "loss": 2.3036, "step": 6208 }, { "epoch": 0.75, "learning_rate": 1.6972374123988494e-06, "loss": 2.5034, "step": 6209 }, { "epoch": 0.75, "learning_rate": 1.6957303650152674e-06, "loss": 2.5834, "step": 6210 }, { "epoch": 0.75, "learning_rate": 1.6942238503744173e-06, "loss": 2.5031, "step": 6211 }, { "epoch": 0.75, "learning_rate": 1.6927178687191953e-06, "loss": 2.4492, "step": 6212 }, { "epoch": 0.75, "learning_rate": 1.6912124202924101e-06, "loss": 2.3933, "step": 6213 }, { "epoch": 0.75, "learning_rate": 1.689707505336779e-06, "loss": 2.3531, "step": 6214 }, { "epoch": 0.75, "learning_rate": 1.6882031240949408e-06, "loss": 2.5352, "step": 6215 }, { "epoch": 0.75, "learning_rate": 1.686699276809442e-06, "loss": 2.6495, "step": 6216 }, { "epoch": 0.75, "learning_rate": 1.6851959637227472e-06, "loss": 2.5844, "step": 6217 }, { "epoch": 0.75, "learning_rate": 1.6836931850772331e-06, "loss": 2.3818, "step": 6218 }, { "epoch": 0.75, "learning_rate": 1.682190941115191e-06, "loss": 2.4075, "step": 6219 }, { "epoch": 0.75, "learning_rate": 1.680689232078827e-06, "loss": 2.4176, "step": 6220 }, { "epoch": 0.75, "learning_rate": 1.679188058210256e-06, "loss": 2.4942, "step": 6221 }, { "epoch": 0.75, "learning_rate": 1.6776874197515141e-06, "loss": 2.5682, "step": 6222 }, { "epoch": 0.75, "learning_rate": 1.6761873169445437e-06, "loss": 2.5357, "step": 6223 }, { "epoch": 0.75, "learning_rate": 1.6746877500312054e-06, "loss": 2.6225, "step": 6224 }, { "epoch": 0.75, "learning_rate": 1.6731887192532743e-06, "loss": 2.477, "step": 6225 }, { "epoch": 0.75, "learning_rate": 1.6716902248524331e-06, "loss": 2.5823, "step": 6226 }, { "epoch": 0.75, "learning_rate": 1.6701922670702863e-06, "loss": 2.4594, "step": 6227 }, { "epoch": 0.75, "learning_rate": 1.6686948461483432e-06, "loss": 2.3283, "step": 6228 }, { "epoch": 0.75, "learning_rate": 1.6671979623280331e-06, "loss": 2.459, "step": 6229 }, { "epoch": 0.75, "learning_rate": 1.6657016158506966e-06, "loss": 2.3691, "step": 6230 }, { "epoch": 0.75, "learning_rate": 1.6642058069575872e-06, "loss": 2.5298, "step": 6231 }, { "epoch": 0.75, "learning_rate": 1.6627105358898737e-06, "loss": 2.4684, "step": 6232 }, { "epoch": 0.75, "learning_rate": 1.6612158028886333e-06, "loss": 2.4497, "step": 6233 }, { "epoch": 0.75, "learning_rate": 1.659721608194863e-06, "loss": 2.594, "step": 6234 }, { "epoch": 0.75, "learning_rate": 1.6582279520494665e-06, "loss": 2.6507, "step": 6235 }, { "epoch": 0.75, "learning_rate": 1.656734834693266e-06, "loss": 2.2544, "step": 6236 }, { "epoch": 0.75, "learning_rate": 1.655242256366995e-06, "loss": 2.557, "step": 6237 }, { "epoch": 0.75, "learning_rate": 1.6537502173112974e-06, "loss": 2.334, "step": 6238 }, { "epoch": 0.75, "learning_rate": 1.6522587177667343e-06, "loss": 2.6791, "step": 6239 }, { "epoch": 0.75, "learning_rate": 1.6507677579737795e-06, "loss": 2.5374, "step": 6240 }, { "epoch": 0.75, "learning_rate": 1.649277338172814e-06, "loss": 2.459, "step": 6241 }, { "epoch": 0.75, "learning_rate": 1.6477874586041415e-06, "loss": 2.4842, "step": 6242 }, { "epoch": 0.75, "learning_rate": 1.6462981195079685e-06, "loss": 2.3779, "step": 6243 }, { "epoch": 0.75, "learning_rate": 1.6448093211244232e-06, "loss": 2.3774, "step": 6244 }, { "epoch": 0.75, "learning_rate": 1.6433210636935388e-06, "loss": 2.7192, "step": 6245 }, { "epoch": 0.75, "learning_rate": 1.641833347455266e-06, "loss": 2.5152, "step": 6246 }, { "epoch": 0.75, "learning_rate": 1.6403461726494697e-06, "loss": 2.6255, "step": 6247 }, { "epoch": 0.75, "learning_rate": 1.6388595395159207e-06, "loss": 2.4622, "step": 6248 }, { "epoch": 0.75, "learning_rate": 1.637373448294311e-06, "loss": 2.5294, "step": 6249 }, { "epoch": 0.75, "learning_rate": 1.6358878992242377e-06, "loss": 2.5627, "step": 6250 }, { "epoch": 0.75, "learning_rate": 1.6344028925452144e-06, "loss": 2.4048, "step": 6251 }, { "epoch": 0.75, "learning_rate": 1.6329184284966675e-06, "loss": 2.637, "step": 6252 }, { "epoch": 0.75, "learning_rate": 1.6314345073179356e-06, "loss": 2.5374, "step": 6253 }, { "epoch": 0.75, "learning_rate": 1.6299511292482689e-06, "loss": 2.5172, "step": 6254 }, { "epoch": 0.75, "learning_rate": 1.6284682945268292e-06, "loss": 2.5292, "step": 6255 }, { "epoch": 0.75, "learning_rate": 1.6269860033926938e-06, "loss": 2.4974, "step": 6256 }, { "epoch": 0.75, "learning_rate": 1.6255042560848478e-06, "loss": 2.5602, "step": 6257 }, { "epoch": 0.75, "learning_rate": 1.6240230528421924e-06, "loss": 2.5591, "step": 6258 }, { "epoch": 0.75, "learning_rate": 1.6225423939035418e-06, "loss": 2.4685, "step": 6259 }, { "epoch": 0.75, "learning_rate": 1.621062279507617e-06, "loss": 2.5955, "step": 6260 }, { "epoch": 0.75, "learning_rate": 1.6195827098930588e-06, "loss": 2.6571, "step": 6261 }, { "epoch": 0.75, "learning_rate": 1.6181036852984118e-06, "loss": 2.4877, "step": 6262 }, { "epoch": 0.75, "learning_rate": 1.6166252059621396e-06, "loss": 2.3767, "step": 6263 }, { "epoch": 0.75, "learning_rate": 1.6151472721226148e-06, "loss": 2.376, "step": 6264 }, { "epoch": 0.75, "learning_rate": 1.6136698840181226e-06, "loss": 2.4114, "step": 6265 }, { "epoch": 0.75, "learning_rate": 1.612193041886862e-06, "loss": 2.3644, "step": 6266 }, { "epoch": 0.75, "learning_rate": 1.6107167459669393e-06, "loss": 2.4428, "step": 6267 }, { "epoch": 0.75, "learning_rate": 1.6092409964963779e-06, "loss": 2.3334, "step": 6268 }, { "epoch": 0.75, "learning_rate": 1.6077657937131086e-06, "loss": 2.5282, "step": 6269 }, { "epoch": 0.75, "learning_rate": 1.6062911378549768e-06, "loss": 2.5719, "step": 6270 }, { "epoch": 0.75, "learning_rate": 1.604817029159742e-06, "loss": 2.5855, "step": 6271 }, { "epoch": 0.75, "learning_rate": 1.6033434678650684e-06, "loss": 2.579, "step": 6272 }, { "epoch": 0.75, "learning_rate": 1.60187045420854e-06, "loss": 2.4394, "step": 6273 }, { "epoch": 0.75, "learning_rate": 1.600397988427644e-06, "loss": 2.3723, "step": 6274 }, { "epoch": 0.75, "learning_rate": 1.5989260707597898e-06, "loss": 2.556, "step": 6275 }, { "epoch": 0.75, "learning_rate": 1.597454701442288e-06, "loss": 2.556, "step": 6276 }, { "epoch": 0.75, "learning_rate": 1.5959838807123672e-06, "loss": 2.5655, "step": 6277 }, { "epoch": 0.75, "learning_rate": 1.5945136088071677e-06, "loss": 2.5421, "step": 6278 }, { "epoch": 0.75, "learning_rate": 1.593043885963736e-06, "loss": 2.4283, "step": 6279 }, { "epoch": 0.75, "learning_rate": 1.5915747124190356e-06, "loss": 2.4524, "step": 6280 }, { "epoch": 0.75, "learning_rate": 1.5901060884099374e-06, "loss": 2.6047, "step": 6281 }, { "epoch": 0.75, "learning_rate": 1.5886380141732267e-06, "loss": 2.4911, "step": 6282 }, { "epoch": 0.75, "learning_rate": 1.587170489945601e-06, "loss": 2.5257, "step": 6283 }, { "epoch": 0.75, "learning_rate": 1.5857035159636625e-06, "loss": 2.5221, "step": 6284 }, { "epoch": 0.76, "learning_rate": 1.5842370924639327e-06, "loss": 2.4198, "step": 6285 }, { "epoch": 0.76, "learning_rate": 1.5827712196828405e-06, "loss": 2.3544, "step": 6286 }, { "epoch": 0.76, "learning_rate": 1.5813058978567276e-06, "loss": 2.535, "step": 6287 }, { "epoch": 0.76, "learning_rate": 1.5798411272218427e-06, "loss": 2.5314, "step": 6288 }, { "epoch": 0.76, "learning_rate": 1.5783769080143514e-06, "loss": 2.5093, "step": 6289 }, { "epoch": 0.76, "learning_rate": 1.5769132404703274e-06, "loss": 2.4158, "step": 6290 }, { "epoch": 0.76, "learning_rate": 1.5754501248257537e-06, "loss": 2.5725, "step": 6291 }, { "epoch": 0.76, "learning_rate": 1.5739875613165283e-06, "loss": 2.3843, "step": 6292 }, { "epoch": 0.76, "learning_rate": 1.5725255501784592e-06, "loss": 2.4339, "step": 6293 }, { "epoch": 0.76, "learning_rate": 1.5710640916472614e-06, "loss": 2.2395, "step": 6294 }, { "epoch": 0.76, "learning_rate": 1.5696031859585664e-06, "loss": 2.4804, "step": 6295 }, { "epoch": 0.76, "learning_rate": 1.5681428333479104e-06, "loss": 2.517, "step": 6296 }, { "epoch": 0.76, "learning_rate": 1.5666830340507494e-06, "loss": 2.5937, "step": 6297 }, { "epoch": 0.76, "learning_rate": 1.5652237883024407e-06, "loss": 2.5128, "step": 6298 }, { "epoch": 0.76, "learning_rate": 1.5637650963382573e-06, "loss": 2.5078, "step": 6299 }, { "epoch": 0.76, "learning_rate": 1.5623069583933836e-06, "loss": 2.5047, "step": 6300 }, { "epoch": 0.76, "learning_rate": 1.5608493747029108e-06, "loss": 2.6039, "step": 6301 }, { "epoch": 0.76, "learning_rate": 1.5593923455018462e-06, "loss": 2.557, "step": 6302 }, { "epoch": 0.76, "learning_rate": 1.5579358710251003e-06, "loss": 2.5642, "step": 6303 }, { "epoch": 0.76, "learning_rate": 1.5564799515075007e-06, "loss": 2.6319, "step": 6304 }, { "epoch": 0.76, "learning_rate": 1.5550245871837848e-06, "loss": 2.5084, "step": 6305 }, { "epoch": 0.76, "learning_rate": 1.553569778288596e-06, "loss": 2.5955, "step": 6306 }, { "epoch": 0.76, "learning_rate": 1.5521155250564923e-06, "loss": 2.6302, "step": 6307 }, { "epoch": 0.76, "learning_rate": 1.550661827721941e-06, "loss": 2.6135, "step": 6308 }, { "epoch": 0.76, "learning_rate": 1.5492086865193217e-06, "loss": 2.5802, "step": 6309 }, { "epoch": 0.76, "learning_rate": 1.5477561016829185e-06, "loss": 2.5337, "step": 6310 }, { "epoch": 0.76, "learning_rate": 1.5463040734469314e-06, "loss": 2.4724, "step": 6311 }, { "epoch": 0.76, "learning_rate": 1.5448526020454702e-06, "loss": 2.6671, "step": 6312 }, { "epoch": 0.76, "learning_rate": 1.5434016877125508e-06, "loss": 2.578, "step": 6313 }, { "epoch": 0.76, "learning_rate": 1.5419513306821055e-06, "loss": 2.5598, "step": 6314 }, { "epoch": 0.76, "learning_rate": 1.5405015311879696e-06, "loss": 2.5154, "step": 6315 }, { "epoch": 0.76, "learning_rate": 1.5390522894638937e-06, "loss": 2.5111, "step": 6316 }, { "epoch": 0.76, "learning_rate": 1.5376036057435394e-06, "loss": 2.5135, "step": 6317 }, { "epoch": 0.76, "learning_rate": 1.53615548026047e-06, "loss": 2.596, "step": 6318 }, { "epoch": 0.76, "learning_rate": 1.5347079132481723e-06, "loss": 2.4466, "step": 6319 }, { "epoch": 0.76, "learning_rate": 1.5332609049400298e-06, "loss": 2.6255, "step": 6320 }, { "epoch": 0.76, "learning_rate": 1.5318144555693454e-06, "loss": 2.576, "step": 6321 }, { "epoch": 0.76, "learning_rate": 1.5303685653693246e-06, "loss": 2.5353, "step": 6322 }, { "epoch": 0.76, "learning_rate": 1.5289232345730882e-06, "loss": 2.4884, "step": 6323 }, { "epoch": 0.76, "learning_rate": 1.5274784634136658e-06, "loss": 2.3854, "step": 6324 }, { "epoch": 0.76, "learning_rate": 1.526034252123993e-06, "loss": 2.5539, "step": 6325 }, { "epoch": 0.76, "learning_rate": 1.5245906009369211e-06, "loss": 2.3929, "step": 6326 }, { "epoch": 0.76, "learning_rate": 1.5231475100852044e-06, "loss": 2.5888, "step": 6327 }, { "epoch": 0.76, "learning_rate": 1.5217049798015127e-06, "loss": 2.3624, "step": 6328 }, { "epoch": 0.76, "learning_rate": 1.520263010318424e-06, "loss": 2.5663, "step": 6329 }, { "epoch": 0.76, "learning_rate": 1.518821601868421e-06, "loss": 2.5721, "step": 6330 }, { "epoch": 0.76, "learning_rate": 1.517380754683906e-06, "loss": 2.6077, "step": 6331 }, { "epoch": 0.76, "learning_rate": 1.5159404689971797e-06, "loss": 2.4003, "step": 6332 }, { "epoch": 0.76, "learning_rate": 1.5145007450404608e-06, "loss": 2.474, "step": 6333 }, { "epoch": 0.76, "learning_rate": 1.5130615830458705e-06, "loss": 2.4282, "step": 6334 }, { "epoch": 0.76, "learning_rate": 1.5116229832454448e-06, "loss": 2.4419, "step": 6335 }, { "epoch": 0.76, "learning_rate": 1.5101849458711288e-06, "loss": 2.4102, "step": 6336 }, { "epoch": 0.76, "learning_rate": 1.5087474711547711e-06, "loss": 2.5742, "step": 6337 }, { "epoch": 0.76, "learning_rate": 1.5073105593281385e-06, "loss": 2.5421, "step": 6338 }, { "epoch": 0.76, "learning_rate": 1.505874210622898e-06, "loss": 2.336, "step": 6339 }, { "epoch": 0.76, "learning_rate": 1.5044384252706312e-06, "loss": 2.5405, "step": 6340 }, { "epoch": 0.76, "learning_rate": 1.5030032035028292e-06, "loss": 2.4859, "step": 6341 }, { "epoch": 0.76, "learning_rate": 1.5015685455508894e-06, "loss": 2.3305, "step": 6342 }, { "epoch": 0.76, "learning_rate": 1.500134451646122e-06, "loss": 2.5273, "step": 6343 }, { "epoch": 0.76, "learning_rate": 1.4987009220197406e-06, "loss": 2.4403, "step": 6344 }, { "epoch": 0.76, "learning_rate": 1.497267956902873e-06, "loss": 2.5051, "step": 6345 }, { "epoch": 0.76, "learning_rate": 1.4958355565265559e-06, "loss": 2.5182, "step": 6346 }, { "epoch": 0.76, "learning_rate": 1.4944037211217289e-06, "loss": 2.531, "step": 6347 }, { "epoch": 0.76, "learning_rate": 1.492972450919249e-06, "loss": 2.5816, "step": 6348 }, { "epoch": 0.76, "learning_rate": 1.4915417461498743e-06, "loss": 2.3879, "step": 6349 }, { "epoch": 0.76, "learning_rate": 1.4901116070442772e-06, "loss": 2.4461, "step": 6350 }, { "epoch": 0.76, "learning_rate": 1.4886820338330382e-06, "loss": 2.459, "step": 6351 }, { "epoch": 0.76, "learning_rate": 1.4872530267466411e-06, "loss": 2.5567, "step": 6352 }, { "epoch": 0.76, "learning_rate": 1.4858245860154885e-06, "loss": 2.4055, "step": 6353 }, { "epoch": 0.76, "learning_rate": 1.4843967118698816e-06, "loss": 2.5041, "step": 6354 }, { "epoch": 0.76, "learning_rate": 1.4829694045400373e-06, "loss": 2.5423, "step": 6355 }, { "epoch": 0.76, "learning_rate": 1.4815426642560753e-06, "loss": 2.3766, "step": 6356 }, { "epoch": 0.76, "learning_rate": 1.4801164912480286e-06, "loss": 2.53, "step": 6357 }, { "epoch": 0.76, "learning_rate": 1.4786908857458388e-06, "loss": 2.4645, "step": 6358 }, { "epoch": 0.76, "learning_rate": 1.4772658479793506e-06, "loss": 2.2306, "step": 6359 }, { "epoch": 0.76, "learning_rate": 1.4758413781783249e-06, "loss": 2.5422, "step": 6360 }, { "epoch": 0.76, "learning_rate": 1.4744174765724228e-06, "loss": 2.6254, "step": 6361 }, { "epoch": 0.76, "learning_rate": 1.47299414339122e-06, "loss": 2.488, "step": 6362 }, { "epoch": 0.76, "learning_rate": 1.4715713788641982e-06, "loss": 2.5071, "step": 6363 }, { "epoch": 0.76, "learning_rate": 1.4701491832207481e-06, "loss": 2.297, "step": 6364 }, { "epoch": 0.76, "learning_rate": 1.4687275566901705e-06, "loss": 2.5722, "step": 6365 }, { "epoch": 0.76, "learning_rate": 1.4673064995016672e-06, "loss": 2.6829, "step": 6366 }, { "epoch": 0.76, "learning_rate": 1.4658860118843583e-06, "loss": 2.6527, "step": 6367 }, { "epoch": 0.77, "learning_rate": 1.4644660940672628e-06, "loss": 2.6203, "step": 6368 }, { "epoch": 0.77, "learning_rate": 1.4630467462793142e-06, "loss": 2.4755, "step": 6369 }, { "epoch": 0.77, "learning_rate": 1.4616279687493528e-06, "loss": 2.599, "step": 6370 }, { "epoch": 0.77, "learning_rate": 1.4602097617061235e-06, "loss": 2.4989, "step": 6371 }, { "epoch": 0.77, "learning_rate": 1.458792125378285e-06, "loss": 2.5067, "step": 6372 }, { "epoch": 0.77, "learning_rate": 1.4573750599943975e-06, "loss": 2.5169, "step": 6373 }, { "epoch": 0.77, "learning_rate": 1.455958565782934e-06, "loss": 2.2895, "step": 6374 }, { "epoch": 0.77, "learning_rate": 1.4545426429722737e-06, "loss": 2.4549, "step": 6375 }, { "epoch": 0.77, "learning_rate": 1.453127291790704e-06, "loss": 2.2885, "step": 6376 }, { "epoch": 0.77, "learning_rate": 1.4517125124664222e-06, "loss": 2.4892, "step": 6377 }, { "epoch": 0.77, "learning_rate": 1.450298305227527e-06, "loss": 2.6348, "step": 6378 }, { "epoch": 0.77, "learning_rate": 1.4488846703020326e-06, "loss": 2.5849, "step": 6379 }, { "epoch": 0.77, "learning_rate": 1.4474716079178541e-06, "loss": 2.4127, "step": 6380 }, { "epoch": 0.77, "learning_rate": 1.4460591183028195e-06, "loss": 2.3603, "step": 6381 }, { "epoch": 0.77, "learning_rate": 1.444647201684664e-06, "loss": 2.4361, "step": 6382 }, { "epoch": 0.77, "learning_rate": 1.443235858291025e-06, "loss": 2.5296, "step": 6383 }, { "epoch": 0.77, "learning_rate": 1.4418250883494556e-06, "loss": 2.3567, "step": 6384 }, { "epoch": 0.77, "learning_rate": 1.4404148920874073e-06, "loss": 2.4745, "step": 6385 }, { "epoch": 0.77, "learning_rate": 1.4390052697322499e-06, "loss": 2.4612, "step": 6386 }, { "epoch": 0.77, "learning_rate": 1.4375962215112504e-06, "loss": 2.5648, "step": 6387 }, { "epoch": 0.77, "learning_rate": 1.436187747651589e-06, "loss": 2.5367, "step": 6388 }, { "epoch": 0.77, "learning_rate": 1.4347798483803538e-06, "loss": 2.4555, "step": 6389 }, { "epoch": 0.77, "learning_rate": 1.4333725239245355e-06, "loss": 2.5323, "step": 6390 }, { "epoch": 0.77, "learning_rate": 1.4319657745110372e-06, "loss": 2.4196, "step": 6391 }, { "epoch": 0.77, "learning_rate": 1.430559600366665e-06, "loss": 2.5982, "step": 6392 }, { "epoch": 0.77, "learning_rate": 1.429154001718136e-06, "loss": 2.5836, "step": 6393 }, { "epoch": 0.77, "learning_rate": 1.4277489787920733e-06, "loss": 2.5185, "step": 6394 }, { "epoch": 0.77, "learning_rate": 1.4263445318150048e-06, "loss": 2.567, "step": 6395 }, { "epoch": 0.77, "learning_rate": 1.4249406610133686e-06, "loss": 2.3482, "step": 6396 }, { "epoch": 0.77, "learning_rate": 1.4235373666135087e-06, "loss": 2.2306, "step": 6397 }, { "epoch": 0.77, "learning_rate": 1.4221346488416765e-06, "loss": 2.5274, "step": 6398 }, { "epoch": 0.77, "learning_rate": 1.420732507924032e-06, "loss": 2.3507, "step": 6399 }, { "epoch": 0.77, "learning_rate": 1.4193309440866366e-06, "loss": 2.5357, "step": 6400 }, { "epoch": 0.77, "learning_rate": 1.4179299575554661e-06, "loss": 2.6459, "step": 6401 }, { "epoch": 0.77, "learning_rate": 1.4165295485563962e-06, "loss": 2.5064, "step": 6402 }, { "epoch": 0.77, "learning_rate": 1.4151297173152152e-06, "loss": 2.5294, "step": 6403 }, { "epoch": 0.77, "learning_rate": 1.4137304640576161e-06, "loss": 2.5064, "step": 6404 }, { "epoch": 0.77, "learning_rate": 1.4123317890091965e-06, "loss": 2.6676, "step": 6405 }, { "epoch": 0.77, "learning_rate": 1.4109336923954652e-06, "loss": 2.5421, "step": 6406 }, { "epoch": 0.77, "learning_rate": 1.4095361744418312e-06, "loss": 2.5511, "step": 6407 }, { "epoch": 0.77, "learning_rate": 1.4081392353736206e-06, "loss": 2.5696, "step": 6408 }, { "epoch": 0.77, "learning_rate": 1.406742875416055e-06, "loss": 2.635, "step": 6409 }, { "epoch": 0.77, "learning_rate": 1.4053470947942694e-06, "loss": 2.6467, "step": 6410 }, { "epoch": 0.77, "learning_rate": 1.4039518937333047e-06, "loss": 2.5732, "step": 6411 }, { "epoch": 0.77, "learning_rate": 1.4025572724581037e-06, "loss": 2.5326, "step": 6412 }, { "epoch": 0.77, "learning_rate": 1.4011632311935237e-06, "loss": 2.4711, "step": 6413 }, { "epoch": 0.77, "learning_rate": 1.39976977016432e-06, "loss": 2.6506, "step": 6414 }, { "epoch": 0.77, "learning_rate": 1.3983768895951594e-06, "loss": 2.3152, "step": 6415 }, { "epoch": 0.77, "learning_rate": 1.3969845897106166e-06, "loss": 2.4289, "step": 6416 }, { "epoch": 0.77, "learning_rate": 1.3955928707351668e-06, "loss": 2.4685, "step": 6417 }, { "epoch": 0.77, "learning_rate": 1.3942017328931974e-06, "loss": 2.5651, "step": 6418 }, { "epoch": 0.77, "learning_rate": 1.3928111764089957e-06, "loss": 2.4222, "step": 6419 }, { "epoch": 0.77, "learning_rate": 1.3914212015067653e-06, "loss": 2.378, "step": 6420 }, { "epoch": 0.77, "learning_rate": 1.3900318084106045e-06, "loss": 2.4775, "step": 6421 }, { "epoch": 0.77, "learning_rate": 1.3886429973445253e-06, "loss": 2.4255, "step": 6422 }, { "epoch": 0.77, "learning_rate": 1.3872547685324456e-06, "loss": 2.546, "step": 6423 }, { "epoch": 0.77, "learning_rate": 1.385867122198184e-06, "loss": 2.4063, "step": 6424 }, { "epoch": 0.77, "learning_rate": 1.3844800585654721e-06, "loss": 2.552, "step": 6425 }, { "epoch": 0.77, "learning_rate": 1.3830935778579407e-06, "loss": 2.5308, "step": 6426 }, { "epoch": 0.77, "learning_rate": 1.381707680299132e-06, "loss": 2.4289, "step": 6427 }, { "epoch": 0.77, "learning_rate": 1.3803223661124938e-06, "loss": 2.7028, "step": 6428 }, { "epoch": 0.77, "learning_rate": 1.3789376355213758e-06, "loss": 2.631, "step": 6429 }, { "epoch": 0.77, "learning_rate": 1.3775534887490365e-06, "loss": 2.4656, "step": 6430 }, { "epoch": 0.77, "learning_rate": 1.3761699260186407e-06, "loss": 2.434, "step": 6431 }, { "epoch": 0.77, "learning_rate": 1.3747869475532598e-06, "loss": 2.5879, "step": 6432 }, { "epoch": 0.77, "learning_rate": 1.3734045535758667e-06, "loss": 2.5157, "step": 6433 }, { "epoch": 0.77, "learning_rate": 1.3720227443093437e-06, "loss": 2.4777, "step": 6434 }, { "epoch": 0.77, "learning_rate": 1.37064151997648e-06, "loss": 2.564, "step": 6435 }, { "epoch": 0.77, "learning_rate": 1.3692608807999652e-06, "loss": 2.5147, "step": 6436 }, { "epoch": 0.77, "learning_rate": 1.3678808270024008e-06, "loss": 2.5625, "step": 6437 }, { "epoch": 0.77, "learning_rate": 1.3665013588062875e-06, "loss": 2.5354, "step": 6438 }, { "epoch": 0.77, "learning_rate": 1.3651224764340371e-06, "loss": 2.451, "step": 6439 }, { "epoch": 0.77, "learning_rate": 1.3637441801079666e-06, "loss": 2.5723, "step": 6440 }, { "epoch": 0.77, "learning_rate": 1.3623664700502915e-06, "loss": 2.5165, "step": 6441 }, { "epoch": 0.77, "learning_rate": 1.3609893464831447e-06, "loss": 2.321, "step": 6442 }, { "epoch": 0.77, "learning_rate": 1.3596128096285527e-06, "loss": 2.5065, "step": 6443 }, { "epoch": 0.77, "learning_rate": 1.3582368597084566e-06, "loss": 2.5337, "step": 6444 }, { "epoch": 0.77, "learning_rate": 1.3568614969446947e-06, "loss": 2.3071, "step": 6445 }, { "epoch": 0.77, "learning_rate": 1.3554867215590174e-06, "loss": 2.4848, "step": 6446 }, { "epoch": 0.77, "learning_rate": 1.3541125337730786e-06, "loss": 2.6199, "step": 6447 }, { "epoch": 0.77, "learning_rate": 1.352738933808434e-06, "loss": 2.6431, "step": 6448 }, { "epoch": 0.77, "learning_rate": 1.3513659218865483e-06, "loss": 2.4526, "step": 6449 }, { "epoch": 0.77, "learning_rate": 1.3499934982287922e-06, "loss": 2.6765, "step": 6450 }, { "epoch": 0.77, "learning_rate": 1.348621663056436e-06, "loss": 2.6479, "step": 6451 }, { "epoch": 0.78, "learning_rate": 1.3472504165906614e-06, "loss": 2.4188, "step": 6452 }, { "epoch": 0.78, "learning_rate": 1.3458797590525513e-06, "loss": 2.5463, "step": 6453 }, { "epoch": 0.78, "learning_rate": 1.3445096906630966e-06, "loss": 2.4685, "step": 6454 }, { "epoch": 0.78, "learning_rate": 1.3431402116431896e-06, "loss": 2.4783, "step": 6455 }, { "epoch": 0.78, "learning_rate": 1.3417713222136297e-06, "loss": 2.6402, "step": 6456 }, { "epoch": 0.78, "learning_rate": 1.340403022595123e-06, "loss": 2.5257, "step": 6457 }, { "epoch": 0.78, "learning_rate": 1.3390353130082756e-06, "loss": 2.4442, "step": 6458 }, { "epoch": 0.78, "learning_rate": 1.337668193673604e-06, "loss": 2.5003, "step": 6459 }, { "epoch": 0.78, "learning_rate": 1.3363016648115246e-06, "loss": 2.5911, "step": 6460 }, { "epoch": 0.78, "learning_rate": 1.3349357266423624e-06, "loss": 2.4491, "step": 6461 }, { "epoch": 0.78, "learning_rate": 1.3335703793863464e-06, "loss": 2.5828, "step": 6462 }, { "epoch": 0.78, "learning_rate": 1.332205623263605e-06, "loss": 2.4079, "step": 6463 }, { "epoch": 0.78, "learning_rate": 1.330841458494183e-06, "loss": 2.6267, "step": 6464 }, { "epoch": 0.78, "learning_rate": 1.3294778852980178e-06, "loss": 2.4384, "step": 6465 }, { "epoch": 0.78, "learning_rate": 1.3281149038949591e-06, "loss": 2.3579, "step": 6466 }, { "epoch": 0.78, "learning_rate": 1.3267525145047555e-06, "loss": 2.5781, "step": 6467 }, { "epoch": 0.78, "learning_rate": 1.325390717347065e-06, "loss": 2.3955, "step": 6468 }, { "epoch": 0.78, "learning_rate": 1.3240295126414492e-06, "loss": 2.4448, "step": 6469 }, { "epoch": 0.78, "learning_rate": 1.3226689006073712e-06, "loss": 2.5643, "step": 6470 }, { "epoch": 0.78, "learning_rate": 1.3213088814642023e-06, "loss": 2.6067, "step": 6471 }, { "epoch": 0.78, "learning_rate": 1.3199494554312143e-06, "loss": 2.6089, "step": 6472 }, { "epoch": 0.78, "learning_rate": 1.3185906227275863e-06, "loss": 2.3964, "step": 6473 }, { "epoch": 0.78, "learning_rate": 1.3172323835724021e-06, "loss": 2.5362, "step": 6474 }, { "epoch": 0.78, "learning_rate": 1.3158747381846481e-06, "loss": 2.4736, "step": 6475 }, { "epoch": 0.78, "learning_rate": 1.3145176867832165e-06, "loss": 2.3416, "step": 6476 }, { "epoch": 0.78, "learning_rate": 1.3131612295869007e-06, "loss": 2.3775, "step": 6477 }, { "epoch": 0.78, "learning_rate": 1.3118053668144026e-06, "loss": 2.5352, "step": 6478 }, { "epoch": 0.78, "learning_rate": 1.3104500986843239e-06, "loss": 2.405, "step": 6479 }, { "epoch": 0.78, "learning_rate": 1.3090954254151733e-06, "loss": 2.527, "step": 6480 }, { "epoch": 0.78, "learning_rate": 1.3077413472253647e-06, "loss": 2.2763, "step": 6481 }, { "epoch": 0.78, "learning_rate": 1.3063878643332112e-06, "loss": 2.6017, "step": 6482 }, { "epoch": 0.78, "learning_rate": 1.305034976956936e-06, "loss": 2.4723, "step": 6483 }, { "epoch": 0.78, "learning_rate": 1.3036826853146601e-06, "loss": 2.5914, "step": 6484 }, { "epoch": 0.78, "learning_rate": 1.3023309896244129e-06, "loss": 2.4898, "step": 6485 }, { "epoch": 0.78, "learning_rate": 1.3009798901041264e-06, "loss": 2.512, "step": 6486 }, { "epoch": 0.78, "learning_rate": 1.2996293869716369e-06, "loss": 2.6156, "step": 6487 }, { "epoch": 0.78, "learning_rate": 1.2982794804446858e-06, "loss": 2.6218, "step": 6488 }, { "epoch": 0.78, "learning_rate": 1.2969301707409126e-06, "loss": 2.5452, "step": 6489 }, { "epoch": 0.78, "learning_rate": 1.2955814580778686e-06, "loss": 2.3198, "step": 6490 }, { "epoch": 0.78, "learning_rate": 1.2942333426730014e-06, "loss": 2.5006, "step": 6491 }, { "epoch": 0.78, "learning_rate": 1.2928858247436672e-06, "loss": 2.5931, "step": 6492 }, { "epoch": 0.78, "learning_rate": 1.2915389045071258e-06, "loss": 2.5282, "step": 6493 }, { "epoch": 0.78, "learning_rate": 1.2901925821805372e-06, "loss": 2.6882, "step": 6494 }, { "epoch": 0.78, "learning_rate": 1.2888468579809689e-06, "loss": 2.4782, "step": 6495 }, { "epoch": 0.78, "learning_rate": 1.2875017321253857e-06, "loss": 2.3116, "step": 6496 }, { "epoch": 0.78, "learning_rate": 1.286157204830667e-06, "loss": 2.47, "step": 6497 }, { "epoch": 0.78, "learning_rate": 1.284813276313584e-06, "loss": 2.4635, "step": 6498 }, { "epoch": 0.78, "learning_rate": 1.2834699467908184e-06, "loss": 2.4826, "step": 6499 }, { "epoch": 0.78, "learning_rate": 1.2821272164789544e-06, "loss": 2.6379, "step": 6500 }, { "epoch": 0.78, "learning_rate": 1.2807850855944753e-06, "loss": 2.4043, "step": 6501 }, { "epoch": 0.78, "learning_rate": 1.2794435543537737e-06, "loss": 2.4441, "step": 6502 }, { "epoch": 0.78, "learning_rate": 1.2781026229731425e-06, "loss": 2.5198, "step": 6503 }, { "epoch": 0.78, "learning_rate": 1.2767622916687767e-06, "loss": 2.459, "step": 6504 }, { "epoch": 0.78, "learning_rate": 1.2754225606567783e-06, "loss": 2.6249, "step": 6505 }, { "epoch": 0.78, "learning_rate": 1.2740834301531468e-06, "loss": 2.3966, "step": 6506 }, { "epoch": 0.78, "learning_rate": 1.2727449003737913e-06, "loss": 2.4985, "step": 6507 }, { "epoch": 0.78, "learning_rate": 1.2714069715345195e-06, "loss": 2.494, "step": 6508 }, { "epoch": 0.78, "learning_rate": 1.2700696438510445e-06, "loss": 2.4309, "step": 6509 }, { "epoch": 0.78, "learning_rate": 1.2687329175389835e-06, "loss": 2.6146, "step": 6510 }, { "epoch": 0.78, "learning_rate": 1.2673967928138514e-06, "loss": 2.44, "step": 6511 }, { "epoch": 0.78, "learning_rate": 1.266061269891073e-06, "loss": 2.5612, "step": 6512 }, { "epoch": 0.78, "learning_rate": 1.26472634898597e-06, "loss": 2.6592, "step": 6513 }, { "epoch": 0.78, "learning_rate": 1.2633920303137708e-06, "loss": 2.5469, "step": 6514 }, { "epoch": 0.78, "learning_rate": 1.2620583140896075e-06, "loss": 2.3146, "step": 6515 }, { "epoch": 0.78, "learning_rate": 1.2607252005285109e-06, "loss": 2.5924, "step": 6516 }, { "epoch": 0.78, "learning_rate": 1.259392689845419e-06, "loss": 2.4271, "step": 6517 }, { "epoch": 0.78, "learning_rate": 1.2580607822551677e-06, "loss": 2.4513, "step": 6518 }, { "epoch": 0.78, "learning_rate": 1.2567294779725008e-06, "loss": 2.516, "step": 6519 }, { "epoch": 0.78, "learning_rate": 1.2553987772120619e-06, "loss": 2.5777, "step": 6520 }, { "epoch": 0.78, "learning_rate": 1.2540686801883989e-06, "loss": 2.7267, "step": 6521 }, { "epoch": 0.78, "learning_rate": 1.2527391871159616e-06, "loss": 2.5439, "step": 6522 }, { "epoch": 0.78, "learning_rate": 1.251410298209101e-06, "loss": 2.5735, "step": 6523 }, { "epoch": 0.78, "learning_rate": 1.2500820136820735e-06, "loss": 2.5534, "step": 6524 }, { "epoch": 0.78, "learning_rate": 1.2487543337490343e-06, "loss": 2.2641, "step": 6525 }, { "epoch": 0.78, "learning_rate": 1.2474272586240444e-06, "loss": 2.5682, "step": 6526 }, { "epoch": 0.78, "learning_rate": 1.2461007885210685e-06, "loss": 2.5803, "step": 6527 }, { "epoch": 0.78, "learning_rate": 1.2447749236539674e-06, "loss": 2.5273, "step": 6528 }, { "epoch": 0.78, "learning_rate": 1.2434496642365123e-06, "loss": 2.4944, "step": 6529 }, { "epoch": 0.78, "learning_rate": 1.2421250104823683e-06, "loss": 2.5581, "step": 6530 }, { "epoch": 0.78, "learning_rate": 1.2408009626051137e-06, "loss": 2.7278, "step": 6531 }, { "epoch": 0.78, "learning_rate": 1.2394775208182175e-06, "loss": 2.4026, "step": 6532 }, { "epoch": 0.78, "learning_rate": 1.2381546853350584e-06, "loss": 2.5554, "step": 6533 }, { "epoch": 0.78, "learning_rate": 1.2368324563689171e-06, "loss": 2.43, "step": 6534 }, { "epoch": 0.79, "learning_rate": 1.2355108341329708e-06, "loss": 2.4993, "step": 6535 }, { "epoch": 0.79, "learning_rate": 1.2341898188403068e-06, "loss": 2.428, "step": 6536 }, { "epoch": 0.79, "learning_rate": 1.232869410703907e-06, "loss": 2.5324, "step": 6537 }, { "epoch": 0.79, "learning_rate": 1.2315496099366603e-06, "loss": 2.4588, "step": 6538 }, { "epoch": 0.79, "learning_rate": 1.2302304167513586e-06, "loss": 2.4715, "step": 6539 }, { "epoch": 0.79, "learning_rate": 1.2289118313606895e-06, "loss": 2.5146, "step": 6540 }, { "epoch": 0.79, "learning_rate": 1.2275938539772485e-06, "loss": 2.5291, "step": 6541 }, { "epoch": 0.79, "learning_rate": 1.2262764848135316e-06, "loss": 2.5888, "step": 6542 }, { "epoch": 0.79, "learning_rate": 1.2249597240819377e-06, "loss": 2.4507, "step": 6543 }, { "epoch": 0.79, "learning_rate": 1.2236435719947638e-06, "loss": 2.4703, "step": 6544 }, { "epoch": 0.79, "learning_rate": 1.2223280287642115e-06, "loss": 2.6027, "step": 6545 }, { "epoch": 0.79, "learning_rate": 1.2210130946023862e-06, "loss": 2.4591, "step": 6546 }, { "epoch": 0.79, "learning_rate": 1.2196987697212903e-06, "loss": 2.406, "step": 6547 }, { "epoch": 0.79, "learning_rate": 1.2183850543328313e-06, "loss": 2.4112, "step": 6548 }, { "epoch": 0.79, "learning_rate": 1.2170719486488192e-06, "loss": 2.3469, "step": 6549 }, { "epoch": 0.79, "learning_rate": 1.2157594528809619e-06, "loss": 2.4943, "step": 6550 }, { "epoch": 0.79, "learning_rate": 1.2144475672408733e-06, "loss": 2.3436, "step": 6551 }, { "epoch": 0.79, "learning_rate": 1.2131362919400635e-06, "loss": 2.4741, "step": 6552 }, { "epoch": 0.79, "learning_rate": 1.2118256271899525e-06, "loss": 2.4925, "step": 6553 }, { "epoch": 0.79, "learning_rate": 1.2105155732018532e-06, "loss": 2.5788, "step": 6554 }, { "epoch": 0.79, "learning_rate": 1.209206130186985e-06, "loss": 2.5773, "step": 6555 }, { "epoch": 0.79, "learning_rate": 1.2078972983564686e-06, "loss": 2.3581, "step": 6556 }, { "epoch": 0.79, "learning_rate": 1.206589077921323e-06, "loss": 2.5353, "step": 6557 }, { "epoch": 0.79, "learning_rate": 1.2052814690924724e-06, "loss": 2.5795, "step": 6558 }, { "epoch": 0.79, "learning_rate": 1.2039744720807396e-06, "loss": 2.5837, "step": 6559 }, { "epoch": 0.79, "learning_rate": 1.2026680870968494e-06, "loss": 2.4573, "step": 6560 }, { "epoch": 0.79, "learning_rate": 1.2013623143514314e-06, "loss": 2.4834, "step": 6561 }, { "epoch": 0.79, "learning_rate": 1.2000571540550092e-06, "loss": 2.4639, "step": 6562 }, { "epoch": 0.79, "learning_rate": 1.1987526064180149e-06, "loss": 2.5363, "step": 6563 }, { "epoch": 0.79, "learning_rate": 1.1974486716507782e-06, "loss": 2.5597, "step": 6564 }, { "epoch": 0.79, "learning_rate": 1.1961453499635323e-06, "loss": 2.5179, "step": 6565 }, { "epoch": 0.79, "learning_rate": 1.194842641566406e-06, "loss": 2.4419, "step": 6566 }, { "epoch": 0.79, "learning_rate": 1.1935405466694362e-06, "loss": 2.4785, "step": 6567 }, { "epoch": 0.79, "learning_rate": 1.1922390654825582e-06, "loss": 2.4786, "step": 6568 }, { "epoch": 0.79, "learning_rate": 1.1909381982156054e-06, "loss": 2.4695, "step": 6569 }, { "epoch": 0.79, "learning_rate": 1.1896379450783174e-06, "loss": 2.3857, "step": 6570 }, { "epoch": 0.79, "learning_rate": 1.1883383062803293e-06, "loss": 2.5147, "step": 6571 }, { "epoch": 0.79, "learning_rate": 1.187039282031182e-06, "loss": 2.4763, "step": 6572 }, { "epoch": 0.79, "learning_rate": 1.185740872540317e-06, "loss": 2.5528, "step": 6573 }, { "epoch": 0.79, "learning_rate": 1.1844430780170697e-06, "loss": 2.4968, "step": 6574 }, { "epoch": 0.79, "learning_rate": 1.1831458986706879e-06, "loss": 2.622, "step": 6575 }, { "epoch": 0.79, "learning_rate": 1.1818493347103098e-06, "loss": 2.393, "step": 6576 }, { "epoch": 0.79, "learning_rate": 1.1805533863449813e-06, "loss": 2.4127, "step": 6577 }, { "epoch": 0.79, "learning_rate": 1.179258053783644e-06, "loss": 2.6365, "step": 6578 }, { "epoch": 0.79, "learning_rate": 1.177963337235143e-06, "loss": 2.5919, "step": 6579 }, { "epoch": 0.79, "learning_rate": 1.1766692369082255e-06, "loss": 2.5602, "step": 6580 }, { "epoch": 0.79, "learning_rate": 1.1753757530115351e-06, "loss": 2.4821, "step": 6581 }, { "epoch": 0.79, "learning_rate": 1.1740828857536206e-06, "loss": 2.4298, "step": 6582 }, { "epoch": 0.79, "learning_rate": 1.1727906353429264e-06, "loss": 2.5387, "step": 6583 }, { "epoch": 0.79, "learning_rate": 1.171499001987802e-06, "loss": 2.4051, "step": 6584 }, { "epoch": 0.79, "learning_rate": 1.1702079858964953e-06, "loss": 2.5807, "step": 6585 }, { "epoch": 0.79, "learning_rate": 1.1689175872771552e-06, "loss": 2.5333, "step": 6586 }, { "epoch": 0.79, "learning_rate": 1.1676278063378322e-06, "loss": 2.4234, "step": 6587 }, { "epoch": 0.79, "learning_rate": 1.1663386432864725e-06, "loss": 2.49, "step": 6588 }, { "epoch": 0.79, "learning_rate": 1.16505009833093e-06, "loss": 2.5732, "step": 6589 }, { "epoch": 0.79, "learning_rate": 1.163762171678951e-06, "loss": 2.4577, "step": 6590 }, { "epoch": 0.79, "learning_rate": 1.1624748635381883e-06, "loss": 2.759, "step": 6591 }, { "epoch": 0.79, "learning_rate": 1.161188174116194e-06, "loss": 2.5374, "step": 6592 }, { "epoch": 0.79, "learning_rate": 1.159902103620416e-06, "loss": 2.3443, "step": 6593 }, { "epoch": 0.79, "learning_rate": 1.1586166522582094e-06, "loss": 2.5762, "step": 6594 }, { "epoch": 0.79, "learning_rate": 1.1573318202368217e-06, "loss": 2.6016, "step": 6595 }, { "epoch": 0.79, "learning_rate": 1.156047607763407e-06, "loss": 2.5861, "step": 6596 }, { "epoch": 0.79, "learning_rate": 1.1547640150450162e-06, "loss": 2.7419, "step": 6597 }, { "epoch": 0.79, "learning_rate": 1.1534810422886016e-06, "loss": 2.3385, "step": 6598 }, { "epoch": 0.79, "learning_rate": 1.1521986897010163e-06, "loss": 2.7658, "step": 6599 }, { "epoch": 0.79, "learning_rate": 1.15091695748901e-06, "loss": 2.5143, "step": 6600 }, { "epoch": 0.79, "learning_rate": 1.149635845859235e-06, "loss": 2.47, "step": 6601 }, { "epoch": 0.79, "learning_rate": 1.1483553550182453e-06, "loss": 2.6732, "step": 6602 }, { "epoch": 0.79, "learning_rate": 1.1470754851724897e-06, "loss": 2.3553, "step": 6603 }, { "epoch": 0.79, "learning_rate": 1.145796236528322e-06, "loss": 2.5309, "step": 6604 }, { "epoch": 0.79, "learning_rate": 1.1445176092919918e-06, "loss": 2.3967, "step": 6605 }, { "epoch": 0.79, "learning_rate": 1.1432396036696508e-06, "loss": 2.5617, "step": 6606 }, { "epoch": 0.79, "learning_rate": 1.1419622198673512e-06, "loss": 2.427, "step": 6607 }, { "epoch": 0.79, "learning_rate": 1.1406854580910426e-06, "loss": 2.4354, "step": 6608 }, { "epoch": 0.79, "learning_rate": 1.1394093185465776e-06, "loss": 2.3972, "step": 6609 }, { "epoch": 0.79, "learning_rate": 1.1381338014397035e-06, "loss": 2.5399, "step": 6610 }, { "epoch": 0.79, "learning_rate": 1.1368589069760728e-06, "loss": 2.5406, "step": 6611 }, { "epoch": 0.79, "learning_rate": 1.135584635361232e-06, "loss": 2.4687, "step": 6612 }, { "epoch": 0.79, "learning_rate": 1.134310986800632e-06, "loss": 2.6946, "step": 6613 }, { "epoch": 0.79, "learning_rate": 1.1330379614996223e-06, "loss": 2.4416, "step": 6614 }, { "epoch": 0.79, "learning_rate": 1.131765559663448e-06, "loss": 2.4813, "step": 6615 }, { "epoch": 0.79, "learning_rate": 1.13049378149726e-06, "loss": 2.4994, "step": 6616 }, { "epoch": 0.79, "learning_rate": 1.1292226272061023e-06, "loss": 2.509, "step": 6617 }, { "epoch": 0.8, "learning_rate": 1.1279520969949225e-06, "loss": 2.4326, "step": 6618 }, { "epoch": 0.8, "learning_rate": 1.1266821910685671e-06, "loss": 2.4436, "step": 6619 }, { "epoch": 0.8, "learning_rate": 1.1254129096317807e-06, "loss": 2.4042, "step": 6620 }, { "epoch": 0.8, "learning_rate": 1.1241442528892088e-06, "loss": 2.4786, "step": 6621 }, { "epoch": 0.8, "learning_rate": 1.1228762210453926e-06, "loss": 2.5781, "step": 6622 }, { "epoch": 0.8, "learning_rate": 1.1216088143047781e-06, "loss": 2.5228, "step": 6623 }, { "epoch": 0.8, "learning_rate": 1.1203420328717052e-06, "loss": 2.6158, "step": 6624 }, { "epoch": 0.8, "learning_rate": 1.1190758769504156e-06, "loss": 2.349, "step": 6625 }, { "epoch": 0.8, "learning_rate": 1.1178103467450512e-06, "loss": 2.4841, "step": 6626 }, { "epoch": 0.8, "learning_rate": 1.11654544245965e-06, "loss": 2.5912, "step": 6627 }, { "epoch": 0.8, "learning_rate": 1.115281164298153e-06, "loss": 2.5283, "step": 6628 }, { "epoch": 0.8, "learning_rate": 1.1140175124643948e-06, "loss": 2.4902, "step": 6629 }, { "epoch": 0.8, "learning_rate": 1.1127544871621144e-06, "loss": 2.4647, "step": 6630 }, { "epoch": 0.8, "learning_rate": 1.1114920885949466e-06, "loss": 2.4614, "step": 6631 }, { "epoch": 0.8, "learning_rate": 1.110230316966427e-06, "loss": 2.4321, "step": 6632 }, { "epoch": 0.8, "learning_rate": 1.10896917247999e-06, "loss": 2.4033, "step": 6633 }, { "epoch": 0.8, "learning_rate": 1.1077086553389654e-06, "loss": 2.5009, "step": 6634 }, { "epoch": 0.8, "learning_rate": 1.1064487657465883e-06, "loss": 2.602, "step": 6635 }, { "epoch": 0.8, "learning_rate": 1.1051895039059851e-06, "loss": 2.471, "step": 6636 }, { "epoch": 0.8, "learning_rate": 1.1039308700201868e-06, "loss": 2.7274, "step": 6637 }, { "epoch": 0.8, "learning_rate": 1.102672864292122e-06, "loss": 2.5045, "step": 6638 }, { "epoch": 0.8, "learning_rate": 1.1014154869246146e-06, "loss": 2.5104, "step": 6639 }, { "epoch": 0.8, "learning_rate": 1.1001587381203931e-06, "loss": 2.4347, "step": 6640 }, { "epoch": 0.8, "learning_rate": 1.0989026180820766e-06, "loss": 2.3562, "step": 6641 }, { "epoch": 0.8, "learning_rate": 1.097647127012193e-06, "loss": 2.4224, "step": 6642 }, { "epoch": 0.8, "learning_rate": 1.0963922651131598e-06, "loss": 2.5556, "step": 6643 }, { "epoch": 0.8, "learning_rate": 1.095138032587298e-06, "loss": 2.4572, "step": 6644 }, { "epoch": 0.8, "learning_rate": 1.0938844296368262e-06, "loss": 2.5073, "step": 6645 }, { "epoch": 0.8, "learning_rate": 1.092631456463859e-06, "loss": 2.5863, "step": 6646 }, { "epoch": 0.8, "learning_rate": 1.0913791132704144e-06, "loss": 2.3776, "step": 6647 }, { "epoch": 0.8, "learning_rate": 1.0901274002584029e-06, "loss": 2.3049, "step": 6648 }, { "epoch": 0.8, "learning_rate": 1.088876317629638e-06, "loss": 2.5818, "step": 6649 }, { "epoch": 0.8, "learning_rate": 1.0876258655858307e-06, "loss": 2.4197, "step": 6650 }, { "epoch": 0.8, "learning_rate": 1.0863760443285876e-06, "loss": 2.5391, "step": 6651 }, { "epoch": 0.8, "learning_rate": 1.0851268540594168e-06, "loss": 2.4959, "step": 6652 }, { "epoch": 0.8, "learning_rate": 1.0838782949797227e-06, "loss": 2.4136, "step": 6653 }, { "epoch": 0.8, "learning_rate": 1.08263036729081e-06, "loss": 2.4707, "step": 6654 }, { "epoch": 0.8, "learning_rate": 1.0813830711938816e-06, "loss": 2.4599, "step": 6655 }, { "epoch": 0.8, "learning_rate": 1.0801364068900334e-06, "loss": 2.4183, "step": 6656 }, { "epoch": 0.8, "learning_rate": 1.078890374580267e-06, "loss": 2.4569, "step": 6657 }, { "epoch": 0.8, "learning_rate": 1.0776449744654755e-06, "loss": 2.4535, "step": 6658 }, { "epoch": 0.8, "learning_rate": 1.076400206746454e-06, "loss": 2.5795, "step": 6659 }, { "epoch": 0.8, "learning_rate": 1.0751560716238968e-06, "loss": 2.5735, "step": 6660 }, { "epoch": 0.8, "learning_rate": 1.0739125692983904e-06, "loss": 2.5768, "step": 6661 }, { "epoch": 0.8, "learning_rate": 1.0726696999704266e-06, "loss": 2.6314, "step": 6662 }, { "epoch": 0.8, "learning_rate": 1.0714274638403865e-06, "loss": 2.673, "step": 6663 }, { "epoch": 0.8, "learning_rate": 1.0701858611085602e-06, "loss": 2.6326, "step": 6664 }, { "epoch": 0.8, "learning_rate": 1.068944891975125e-06, "loss": 2.5631, "step": 6665 }, { "epoch": 0.8, "learning_rate": 1.0677045566401623e-06, "loss": 2.5143, "step": 6666 }, { "epoch": 0.8, "learning_rate": 1.0664648553036505e-06, "loss": 2.5849, "step": 6667 }, { "epoch": 0.8, "learning_rate": 1.0652257881654625e-06, "loss": 2.2979, "step": 6668 }, { "epoch": 0.8, "learning_rate": 1.0639873554253743e-06, "loss": 2.6429, "step": 6669 }, { "epoch": 0.8, "learning_rate": 1.0627495572830537e-06, "loss": 2.5491, "step": 6670 }, { "epoch": 0.8, "learning_rate": 1.0615123939380707e-06, "loss": 2.5859, "step": 6671 }, { "epoch": 0.8, "learning_rate": 1.060275865589892e-06, "loss": 2.4764, "step": 6672 }, { "epoch": 0.8, "learning_rate": 1.0590399724378797e-06, "loss": 2.5178, "step": 6673 }, { "epoch": 0.8, "learning_rate": 1.057804714681296e-06, "loss": 2.4703, "step": 6674 }, { "epoch": 0.8, "learning_rate": 1.0565700925192995e-06, "loss": 2.4716, "step": 6675 }, { "epoch": 0.8, "learning_rate": 1.0553361061509482e-06, "loss": 2.3997, "step": 6676 }, { "epoch": 0.8, "learning_rate": 1.0541027557751937e-06, "loss": 2.5094, "step": 6677 }, { "epoch": 0.8, "learning_rate": 1.0528700415908876e-06, "loss": 2.5093, "step": 6678 }, { "epoch": 0.8, "learning_rate": 1.051637963796781e-06, "loss": 2.5762, "step": 6679 }, { "epoch": 0.8, "learning_rate": 1.0504065225915166e-06, "loss": 2.4511, "step": 6680 }, { "epoch": 0.8, "learning_rate": 1.0491757181736418e-06, "loss": 2.4777, "step": 6681 }, { "epoch": 0.8, "learning_rate": 1.0479455507415937e-06, "loss": 2.317, "step": 6682 }, { "epoch": 0.8, "learning_rate": 1.0467160204937115e-06, "loss": 2.3329, "step": 6683 }, { "epoch": 0.8, "learning_rate": 1.0454871276282335e-06, "loss": 2.5611, "step": 6684 }, { "epoch": 0.8, "learning_rate": 1.0442588723432872e-06, "loss": 2.4642, "step": 6685 }, { "epoch": 0.8, "learning_rate": 1.0430312548369076e-06, "loss": 2.4513, "step": 6686 }, { "epoch": 0.8, "learning_rate": 1.041804275307019e-06, "loss": 2.516, "step": 6687 }, { "epoch": 0.8, "learning_rate": 1.0405779339514466e-06, "loss": 2.6282, "step": 6688 }, { "epoch": 0.8, "learning_rate": 1.0393522309679106e-06, "loss": 2.3808, "step": 6689 }, { "epoch": 0.8, "learning_rate": 1.0381271665540294e-06, "loss": 2.4726, "step": 6690 }, { "epoch": 0.8, "learning_rate": 1.0369027409073207e-06, "loss": 2.4192, "step": 6691 }, { "epoch": 0.8, "learning_rate": 1.0356789542251939e-06, "loss": 2.5391, "step": 6692 }, { "epoch": 0.8, "learning_rate": 1.0344558067049603e-06, "loss": 2.5699, "step": 6693 }, { "epoch": 0.8, "learning_rate": 1.0332332985438248e-06, "loss": 2.3571, "step": 6694 }, { "epoch": 0.8, "learning_rate": 1.0320114299388916e-06, "loss": 2.5828, "step": 6695 }, { "epoch": 0.8, "learning_rate": 1.0307902010871606e-06, "loss": 2.4573, "step": 6696 }, { "epoch": 0.8, "learning_rate": 1.0295696121855292e-06, "loss": 2.4675, "step": 6697 }, { "epoch": 0.8, "learning_rate": 1.028349663430792e-06, "loss": 2.3509, "step": 6698 }, { "epoch": 0.8, "learning_rate": 1.0271303550196376e-06, "loss": 2.4551, "step": 6699 }, { "epoch": 0.8, "learning_rate": 1.0259116871486557e-06, "loss": 2.5644, "step": 6700 }, { "epoch": 0.81, "learning_rate": 1.0246936600143276e-06, "loss": 2.4142, "step": 6701 }, { "epoch": 0.81, "learning_rate": 1.0234762738130354e-06, "loss": 2.7077, "step": 6702 }, { "epoch": 0.81, "learning_rate": 1.0222595287410586e-06, "loss": 2.4355, "step": 6703 }, { "epoch": 0.81, "learning_rate": 1.0210434249945677e-06, "loss": 2.526, "step": 6704 }, { "epoch": 0.81, "learning_rate": 1.019827962769635e-06, "loss": 2.4043, "step": 6705 }, { "epoch": 0.81, "learning_rate": 1.0186131422622297e-06, "loss": 2.3991, "step": 6706 }, { "epoch": 0.81, "learning_rate": 1.0173989636682109e-06, "loss": 2.3965, "step": 6707 }, { "epoch": 0.81, "learning_rate": 1.0161854271833444e-06, "loss": 2.7059, "step": 6708 }, { "epoch": 0.81, "learning_rate": 1.0149725330032827e-06, "loss": 2.3652, "step": 6709 }, { "epoch": 0.81, "learning_rate": 1.0137602813235824e-06, "loss": 2.4159, "step": 6710 }, { "epoch": 0.81, "learning_rate": 1.0125486723396905e-06, "loss": 2.4414, "step": 6711 }, { "epoch": 0.81, "learning_rate": 1.0113377062469532e-06, "loss": 2.5917, "step": 6712 }, { "epoch": 0.81, "learning_rate": 1.0101273832406156e-06, "loss": 2.5579, "step": 6713 }, { "epoch": 0.81, "learning_rate": 1.0089177035158127e-06, "loss": 2.4856, "step": 6714 }, { "epoch": 0.81, "learning_rate": 1.0077086672675823e-06, "loss": 2.5277, "step": 6715 }, { "epoch": 0.81, "learning_rate": 1.0065002746908532e-06, "loss": 2.4392, "step": 6716 }, { "epoch": 0.81, "learning_rate": 1.0052925259804536e-06, "loss": 2.4239, "step": 6717 }, { "epoch": 0.81, "learning_rate": 1.0040854213311096e-06, "loss": 2.5553, "step": 6718 }, { "epoch": 0.81, "learning_rate": 1.0028789609374356e-06, "loss": 2.4595, "step": 6719 }, { "epoch": 0.81, "learning_rate": 1.0016731449939543e-06, "loss": 2.6189, "step": 6720 }, { "epoch": 0.81, "learning_rate": 1.0004679736950722e-06, "loss": 2.5324, "step": 6721 }, { "epoch": 0.81, "learning_rate": 9.992634472351016e-07, "loss": 2.5018, "step": 6722 }, { "epoch": 0.81, "learning_rate": 9.980595658082426e-07, "loss": 2.5164, "step": 6723 }, { "epoch": 0.81, "learning_rate": 9.96856329608597e-07, "loss": 2.475, "step": 6724 }, { "epoch": 0.81, "learning_rate": 9.956537388301623e-07, "loss": 2.4222, "step": 6725 }, { "epoch": 0.81, "learning_rate": 9.944517936668285e-07, "loss": 2.5997, "step": 6726 }, { "epoch": 0.81, "learning_rate": 9.93250494312385e-07, "loss": 2.6606, "step": 6727 }, { "epoch": 0.81, "learning_rate": 9.92049840960514e-07, "loss": 2.5187, "step": 6728 }, { "epoch": 0.81, "learning_rate": 9.908498338047956e-07, "loss": 2.3918, "step": 6729 }, { "epoch": 0.81, "learning_rate": 9.896504730387059e-07, "loss": 2.4241, "step": 6730 }, { "epoch": 0.81, "learning_rate": 9.884517588556158e-07, "loss": 2.5145, "step": 6731 }, { "epoch": 0.81, "learning_rate": 9.87253691448794e-07, "loss": 2.4539, "step": 6732 }, { "epoch": 0.81, "learning_rate": 9.860562710113996e-07, "loss": 2.72, "step": 6733 }, { "epoch": 0.81, "learning_rate": 9.84859497736495e-07, "loss": 2.5777, "step": 6734 }, { "epoch": 0.81, "learning_rate": 9.836633718170308e-07, "loss": 2.421, "step": 6735 }, { "epoch": 0.81, "learning_rate": 9.82467893445858e-07, "loss": 2.3478, "step": 6736 }, { "epoch": 0.81, "learning_rate": 9.81273062815724e-07, "loss": 2.4038, "step": 6737 }, { "epoch": 0.81, "learning_rate": 9.800788801192662e-07, "loss": 2.5633, "step": 6738 }, { "epoch": 0.81, "learning_rate": 9.788853455490232e-07, "loss": 2.4342, "step": 6739 }, { "epoch": 0.81, "learning_rate": 9.776924592974257e-07, "loss": 2.4838, "step": 6740 }, { "epoch": 0.81, "learning_rate": 9.765002215568015e-07, "loss": 2.4236, "step": 6741 }, { "epoch": 0.81, "learning_rate": 9.753086325193733e-07, "loss": 2.5882, "step": 6742 }, { "epoch": 0.81, "learning_rate": 9.741176923772593e-07, "loss": 2.6417, "step": 6743 }, { "epoch": 0.81, "learning_rate": 9.729274013224754e-07, "loss": 2.4518, "step": 6744 }, { "epoch": 0.81, "learning_rate": 9.717377595469269e-07, "loss": 2.6279, "step": 6745 }, { "epoch": 0.81, "learning_rate": 9.705487672424202e-07, "loss": 2.6027, "step": 6746 }, { "epoch": 0.81, "learning_rate": 9.69360424600654e-07, "loss": 2.4802, "step": 6747 }, { "epoch": 0.81, "learning_rate": 9.681727318132228e-07, "loss": 2.3432, "step": 6748 }, { "epoch": 0.81, "learning_rate": 9.669856890716188e-07, "loss": 2.4321, "step": 6749 }, { "epoch": 0.81, "learning_rate": 9.657992965672242e-07, "loss": 2.4774, "step": 6750 }, { "epoch": 0.81, "learning_rate": 9.646135544913226e-07, "loss": 2.4578, "step": 6751 }, { "epoch": 0.81, "learning_rate": 9.63428463035085e-07, "loss": 2.6671, "step": 6752 }, { "epoch": 0.81, "learning_rate": 9.622440223895868e-07, "loss": 2.4264, "step": 6753 }, { "epoch": 0.81, "learning_rate": 9.610602327457913e-07, "loss": 2.5435, "step": 6754 }, { "epoch": 0.81, "learning_rate": 9.59877094294559e-07, "loss": 2.4945, "step": 6755 }, { "epoch": 0.81, "learning_rate": 9.586946072266479e-07, "loss": 2.5343, "step": 6756 }, { "epoch": 0.81, "learning_rate": 9.57512771732706e-07, "loss": 2.4736, "step": 6757 }, { "epoch": 0.81, "learning_rate": 9.563315880032798e-07, "loss": 2.6527, "step": 6758 }, { "epoch": 0.81, "learning_rate": 9.551510562288112e-07, "loss": 2.3592, "step": 6759 }, { "epoch": 0.81, "learning_rate": 9.539711765996334e-07, "loss": 2.3183, "step": 6760 }, { "epoch": 0.81, "learning_rate": 9.527919493059801e-07, "loss": 2.3207, "step": 6761 }, { "epoch": 0.81, "learning_rate": 9.516133745379718e-07, "loss": 2.5467, "step": 6762 }, { "epoch": 0.81, "learning_rate": 9.504354524856318e-07, "loss": 2.414, "step": 6763 }, { "epoch": 0.81, "learning_rate": 9.492581833388736e-07, "loss": 2.4635, "step": 6764 }, { "epoch": 0.81, "learning_rate": 9.480815672875077e-07, "loss": 2.4049, "step": 6765 }, { "epoch": 0.81, "learning_rate": 9.469056045212382e-07, "loss": 2.5578, "step": 6766 }, { "epoch": 0.81, "learning_rate": 9.457302952296621e-07, "loss": 2.4616, "step": 6767 }, { "epoch": 0.81, "learning_rate": 9.445556396022754e-07, "loss": 2.5129, "step": 6768 }, { "epoch": 0.81, "learning_rate": 9.433816378284638e-07, "loss": 2.4566, "step": 6769 }, { "epoch": 0.81, "learning_rate": 9.422082900975105e-07, "loss": 2.4696, "step": 6770 }, { "epoch": 0.81, "learning_rate": 9.410355965985951e-07, "loss": 2.4196, "step": 6771 }, { "epoch": 0.81, "learning_rate": 9.398635575207854e-07, "loss": 2.6637, "step": 6772 }, { "epoch": 0.81, "learning_rate": 9.386921730530513e-07, "loss": 2.5521, "step": 6773 }, { "epoch": 0.81, "learning_rate": 9.375214433842489e-07, "loss": 2.4868, "step": 6774 }, { "epoch": 0.81, "learning_rate": 9.363513687031389e-07, "loss": 2.5464, "step": 6775 }, { "epoch": 0.81, "learning_rate": 9.351819491983671e-07, "loss": 2.5319, "step": 6776 }, { "epoch": 0.81, "learning_rate": 9.340131850584777e-07, "loss": 2.4377, "step": 6777 }, { "epoch": 0.81, "learning_rate": 9.32845076471911e-07, "loss": 2.4328, "step": 6778 }, { "epoch": 0.81, "learning_rate": 9.31677623626997e-07, "loss": 2.444, "step": 6779 }, { "epoch": 0.81, "learning_rate": 9.305108267119645e-07, "loss": 2.3913, "step": 6780 }, { "epoch": 0.81, "learning_rate": 9.293446859149324e-07, "loss": 2.5384, "step": 6781 }, { "epoch": 0.81, "learning_rate": 9.281792014239171e-07, "loss": 2.5745, "step": 6782 }, { "epoch": 0.81, "learning_rate": 9.270143734268289e-07, "loss": 2.6119, "step": 6783 }, { "epoch": 0.81, "learning_rate": 9.258502021114696e-07, "loss": 2.3984, "step": 6784 }, { "epoch": 0.82, "learning_rate": 9.246866876655375e-07, "loss": 2.5093, "step": 6785 }, { "epoch": 0.82, "learning_rate": 9.235238302766247e-07, "loss": 2.4536, "step": 6786 }, { "epoch": 0.82, "learning_rate": 9.22361630132218e-07, "loss": 2.2997, "step": 6787 }, { "epoch": 0.82, "learning_rate": 9.212000874196953e-07, "loss": 2.6088, "step": 6788 }, { "epoch": 0.82, "learning_rate": 9.200392023263311e-07, "loss": 2.5615, "step": 6789 }, { "epoch": 0.82, "learning_rate": 9.188789750392951e-07, "loss": 2.4818, "step": 6790 }, { "epoch": 0.82, "learning_rate": 9.177194057456468e-07, "loss": 2.4207, "step": 6791 }, { "epoch": 0.82, "learning_rate": 9.165604946323436e-07, "loss": 2.4474, "step": 6792 }, { "epoch": 0.82, "learning_rate": 9.154022418862329e-07, "loss": 2.4188, "step": 6793 }, { "epoch": 0.82, "learning_rate": 9.142446476940598e-07, "loss": 2.5743, "step": 6794 }, { "epoch": 0.82, "learning_rate": 9.130877122424625e-07, "loss": 2.3427, "step": 6795 }, { "epoch": 0.82, "learning_rate": 9.119314357179687e-07, "loss": 2.4942, "step": 6796 }, { "epoch": 0.82, "learning_rate": 9.107758183070076e-07, "loss": 2.5176, "step": 6797 }, { "epoch": 0.82, "learning_rate": 9.09620860195894e-07, "loss": 2.6185, "step": 6798 }, { "epoch": 0.82, "learning_rate": 9.084665615708432e-07, "loss": 2.513, "step": 6799 }, { "epoch": 0.82, "learning_rate": 9.073129226179589e-07, "loss": 2.5216, "step": 6800 }, { "epoch": 0.82, "learning_rate": 9.06159943523241e-07, "loss": 2.5273, "step": 6801 }, { "epoch": 0.82, "learning_rate": 9.050076244725847e-07, "loss": 2.6114, "step": 6802 }, { "epoch": 0.82, "learning_rate": 9.038559656517737e-07, "loss": 2.61, "step": 6803 }, { "epoch": 0.82, "learning_rate": 9.027049672464916e-07, "loss": 2.438, "step": 6804 }, { "epoch": 0.82, "learning_rate": 9.015546294423089e-07, "loss": 2.4383, "step": 6805 }, { "epoch": 0.82, "learning_rate": 9.004049524246944e-07, "loss": 2.3922, "step": 6806 }, { "epoch": 0.82, "learning_rate": 8.992559363790093e-07, "loss": 2.413, "step": 6807 }, { "epoch": 0.82, "learning_rate": 8.981075814905077e-07, "loss": 2.3703, "step": 6808 }, { "epoch": 0.82, "learning_rate": 8.969598879443381e-07, "loss": 2.4278, "step": 6809 }, { "epoch": 0.82, "learning_rate": 8.958128559255397e-07, "loss": 2.5568, "step": 6810 }, { "epoch": 0.82, "learning_rate": 8.946664856190473e-07, "loss": 2.5371, "step": 6811 }, { "epoch": 0.82, "learning_rate": 8.935207772096904e-07, "loss": 2.4801, "step": 6812 }, { "epoch": 0.82, "learning_rate": 8.923757308821873e-07, "loss": 2.5355, "step": 6813 }, { "epoch": 0.82, "learning_rate": 8.912313468211547e-07, "loss": 2.3753, "step": 6814 }, { "epoch": 0.82, "learning_rate": 8.900876252110974e-07, "loss": 2.2935, "step": 6815 }, { "epoch": 0.82, "learning_rate": 8.889445662364177e-07, "loss": 2.4367, "step": 6816 }, { "epoch": 0.82, "learning_rate": 8.878021700814099e-07, "loss": 2.5967, "step": 6817 }, { "epoch": 0.82, "learning_rate": 8.86660436930259e-07, "loss": 2.6055, "step": 6818 }, { "epoch": 0.82, "learning_rate": 8.855193669670459e-07, "loss": 2.5807, "step": 6819 }, { "epoch": 0.82, "learning_rate": 8.843789603757446e-07, "loss": 2.555, "step": 6820 }, { "epoch": 0.82, "learning_rate": 8.83239217340221e-07, "loss": 2.5251, "step": 6821 }, { "epoch": 0.82, "learning_rate": 8.821001380442334e-07, "loss": 2.4014, "step": 6822 }, { "epoch": 0.82, "learning_rate": 8.80961722671434e-07, "loss": 2.6247, "step": 6823 }, { "epoch": 0.82, "learning_rate": 8.798239714053692e-07, "loss": 2.4878, "step": 6824 }, { "epoch": 0.82, "learning_rate": 8.786868844294755e-07, "loss": 2.5047, "step": 6825 }, { "epoch": 0.82, "learning_rate": 8.775504619270852e-07, "loss": 2.3376, "step": 6826 }, { "epoch": 0.82, "learning_rate": 8.764147040814203e-07, "loss": 2.5749, "step": 6827 }, { "epoch": 0.82, "learning_rate": 8.752796110755985e-07, "loss": 2.5368, "step": 6828 }, { "epoch": 0.82, "learning_rate": 8.741451830926301e-07, "loss": 2.5531, "step": 6829 }, { "epoch": 0.82, "learning_rate": 8.730114203154144e-07, "loss": 2.4628, "step": 6830 }, { "epoch": 0.82, "learning_rate": 8.718783229267508e-07, "loss": 2.3553, "step": 6831 }, { "epoch": 0.82, "learning_rate": 8.707458911093231e-07, "loss": 2.5392, "step": 6832 }, { "epoch": 0.82, "learning_rate": 8.696141250457152e-07, "loss": 2.5145, "step": 6833 }, { "epoch": 0.82, "learning_rate": 8.684830249183962e-07, "loss": 2.6096, "step": 6834 }, { "epoch": 0.82, "learning_rate": 8.673525909097342e-07, "loss": 2.5186, "step": 6835 }, { "epoch": 0.82, "learning_rate": 8.662228232019876e-07, "loss": 2.43, "step": 6836 }, { "epoch": 0.82, "learning_rate": 8.65093721977306e-07, "loss": 2.5191, "step": 6837 }, { "epoch": 0.82, "learning_rate": 8.639652874177346e-07, "loss": 2.5696, "step": 6838 }, { "epoch": 0.82, "learning_rate": 8.628375197052069e-07, "loss": 2.4231, "step": 6839 }, { "epoch": 0.82, "learning_rate": 8.617104190215525e-07, "loss": 2.4872, "step": 6840 }, { "epoch": 0.82, "learning_rate": 8.60583985548492e-07, "loss": 2.5507, "step": 6841 }, { "epoch": 0.82, "learning_rate": 8.594582194676393e-07, "loss": 2.4487, "step": 6842 }, { "epoch": 0.82, "learning_rate": 8.583331209605011e-07, "loss": 2.5925, "step": 6843 }, { "epoch": 0.82, "learning_rate": 8.572086902084731e-07, "loss": 2.3633, "step": 6844 }, { "epoch": 0.82, "learning_rate": 8.560849273928479e-07, "loss": 2.5216, "step": 6845 }, { "epoch": 0.82, "learning_rate": 8.549618326948056e-07, "loss": 2.4321, "step": 6846 }, { "epoch": 0.82, "learning_rate": 8.538394062954225e-07, "loss": 2.4959, "step": 6847 }, { "epoch": 0.82, "learning_rate": 8.527176483756671e-07, "loss": 2.3352, "step": 6848 }, { "epoch": 0.82, "learning_rate": 8.515965591163966e-07, "loss": 2.4374, "step": 6849 }, { "epoch": 0.82, "learning_rate": 8.504761386983651e-07, "loss": 2.6216, "step": 6850 }, { "epoch": 0.82, "learning_rate": 8.493563873022137e-07, "loss": 2.6362, "step": 6851 }, { "epoch": 0.82, "learning_rate": 8.482373051084791e-07, "loss": 2.5443, "step": 6852 }, { "epoch": 0.82, "learning_rate": 8.471188922975903e-07, "loss": 2.4744, "step": 6853 }, { "epoch": 0.82, "learning_rate": 8.460011490498671e-07, "loss": 2.6094, "step": 6854 }, { "epoch": 0.82, "learning_rate": 8.448840755455229e-07, "loss": 2.5169, "step": 6855 }, { "epoch": 0.82, "learning_rate": 8.437676719646593e-07, "loss": 2.4628, "step": 6856 }, { "epoch": 0.82, "learning_rate": 8.426519384872733e-07, "loss": 2.5622, "step": 6857 }, { "epoch": 0.82, "learning_rate": 8.415368752932551e-07, "loss": 2.5443, "step": 6858 }, { "epoch": 0.82, "learning_rate": 8.404224825623819e-07, "loss": 2.5632, "step": 6859 }, { "epoch": 0.82, "learning_rate": 8.393087604743283e-07, "loss": 2.4735, "step": 6860 }, { "epoch": 0.82, "learning_rate": 8.381957092086551e-07, "loss": 2.436, "step": 6861 }, { "epoch": 0.82, "learning_rate": 8.370833289448199e-07, "loss": 2.5449, "step": 6862 }, { "epoch": 0.82, "learning_rate": 8.359716198621698e-07, "loss": 2.4819, "step": 6863 }, { "epoch": 0.82, "learning_rate": 8.348605821399441e-07, "loss": 2.5689, "step": 6864 }, { "epoch": 0.82, "learning_rate": 8.337502159572758e-07, "loss": 2.3686, "step": 6865 }, { "epoch": 0.82, "learning_rate": 8.326405214931838e-07, "loss": 2.5153, "step": 6866 }, { "epoch": 0.82, "learning_rate": 8.315314989265866e-07, "loss": 2.6249, "step": 6867 }, { "epoch": 0.83, "learning_rate": 8.304231484362868e-07, "loss": 2.5751, "step": 6868 }, { "epoch": 0.83, "learning_rate": 8.293154702009837e-07, "loss": 2.3922, "step": 6869 }, { "epoch": 0.83, "learning_rate": 8.282084643992677e-07, "loss": 2.4298, "step": 6870 }, { "epoch": 0.83, "learning_rate": 8.271021312096178e-07, "loss": 2.4978, "step": 6871 }, { "epoch": 0.83, "learning_rate": 8.259964708104091e-07, "loss": 2.5672, "step": 6872 }, { "epoch": 0.83, "learning_rate": 8.248914833799027e-07, "loss": 2.5524, "step": 6873 }, { "epoch": 0.83, "learning_rate": 8.237871690962557e-07, "loss": 2.611, "step": 6874 }, { "epoch": 0.83, "learning_rate": 8.226835281375151e-07, "loss": 2.4287, "step": 6875 }, { "epoch": 0.83, "learning_rate": 8.215805606816191e-07, "loss": 2.515, "step": 6876 }, { "epoch": 0.83, "learning_rate": 8.204782669063993e-07, "loss": 2.398, "step": 6877 }, { "epoch": 0.83, "learning_rate": 8.193766469895737e-07, "loss": 2.497, "step": 6878 }, { "epoch": 0.83, "learning_rate": 8.182757011087583e-07, "loss": 2.5607, "step": 6879 }, { "epoch": 0.83, "learning_rate": 8.171754294414546e-07, "loss": 2.3995, "step": 6880 }, { "epoch": 0.83, "learning_rate": 8.16075832165058e-07, "loss": 2.495, "step": 6881 }, { "epoch": 0.83, "learning_rate": 8.149769094568577e-07, "loss": 2.5406, "step": 6882 }, { "epoch": 0.83, "learning_rate": 8.138786614940275e-07, "loss": 2.5584, "step": 6883 }, { "epoch": 0.83, "learning_rate": 8.127810884536402e-07, "loss": 2.6382, "step": 6884 }, { "epoch": 0.83, "learning_rate": 8.11684190512651e-07, "loss": 2.4393, "step": 6885 }, { "epoch": 0.83, "learning_rate": 8.105879678479172e-07, "loss": 2.206, "step": 6886 }, { "epoch": 0.83, "learning_rate": 8.094924206361771e-07, "loss": 2.5761, "step": 6887 }, { "epoch": 0.83, "learning_rate": 8.083975490540658e-07, "loss": 2.5352, "step": 6888 }, { "epoch": 0.83, "learning_rate": 8.073033532781083e-07, "loss": 2.3965, "step": 6889 }, { "epoch": 0.83, "learning_rate": 8.062098334847185e-07, "loss": 2.531, "step": 6890 }, { "epoch": 0.83, "learning_rate": 8.051169898502053e-07, "loss": 2.4125, "step": 6891 }, { "epoch": 0.83, "learning_rate": 8.040248225507641e-07, "loss": 2.4702, "step": 6892 }, { "epoch": 0.83, "learning_rate": 8.029333317624838e-07, "loss": 2.5914, "step": 6893 }, { "epoch": 0.83, "learning_rate": 8.018425176613464e-07, "loss": 2.3309, "step": 6894 }, { "epoch": 0.83, "learning_rate": 8.007523804232192e-07, "loss": 2.5323, "step": 6895 }, { "epoch": 0.83, "learning_rate": 7.996629202238654e-07, "loss": 2.454, "step": 6896 }, { "epoch": 0.83, "learning_rate": 7.985741372389361e-07, "loss": 2.4252, "step": 6897 }, { "epoch": 0.83, "learning_rate": 7.974860316439759e-07, "loss": 2.4812, "step": 6898 }, { "epoch": 0.83, "learning_rate": 7.963986036144161e-07, "loss": 2.4529, "step": 6899 }, { "epoch": 0.83, "learning_rate": 7.953118533255821e-07, "loss": 2.4786, "step": 6900 }, { "epoch": 0.83, "learning_rate": 7.94225780952691e-07, "loss": 2.4672, "step": 6901 }, { "epoch": 0.83, "learning_rate": 7.931403866708464e-07, "loss": 2.5062, "step": 6902 }, { "epoch": 0.83, "learning_rate": 7.920556706550464e-07, "loss": 2.579, "step": 6903 }, { "epoch": 0.83, "learning_rate": 7.909716330801765e-07, "loss": 2.6029, "step": 6904 }, { "epoch": 0.83, "learning_rate": 7.898882741210151e-07, "loss": 2.6966, "step": 6905 }, { "epoch": 0.83, "learning_rate": 7.888055939522327e-07, "loss": 2.5529, "step": 6906 }, { "epoch": 0.83, "learning_rate": 7.877235927483856e-07, "loss": 2.5558, "step": 6907 }, { "epoch": 0.83, "learning_rate": 7.866422706839239e-07, "loss": 2.463, "step": 6908 }, { "epoch": 0.83, "learning_rate": 7.855616279331885e-07, "loss": 2.4322, "step": 6909 }, { "epoch": 0.83, "learning_rate": 7.844816646704096e-07, "loss": 2.527, "step": 6910 }, { "epoch": 0.83, "learning_rate": 7.834023810697088e-07, "loss": 2.5621, "step": 6911 }, { "epoch": 0.83, "learning_rate": 7.823237773050963e-07, "loss": 2.5232, "step": 6912 }, { "epoch": 0.83, "learning_rate": 7.812458535504752e-07, "loss": 2.386, "step": 6913 }, { "epoch": 0.83, "learning_rate": 7.801686099796358e-07, "loss": 2.6354, "step": 6914 }, { "epoch": 0.83, "learning_rate": 7.790920467662611e-07, "loss": 2.532, "step": 6915 }, { "epoch": 0.83, "learning_rate": 7.780161640839257e-07, "loss": 2.4484, "step": 6916 }, { "epoch": 0.83, "learning_rate": 7.769409621060903e-07, "loss": 2.6563, "step": 6917 }, { "epoch": 0.83, "learning_rate": 7.758664410061095e-07, "loss": 2.5626, "step": 6918 }, { "epoch": 0.83, "learning_rate": 7.747926009572249e-07, "loss": 2.5439, "step": 6919 }, { "epoch": 0.83, "learning_rate": 7.737194421325739e-07, "loss": 2.5609, "step": 6920 }, { "epoch": 0.83, "learning_rate": 7.726469647051771e-07, "loss": 2.5251, "step": 6921 }, { "epoch": 0.83, "learning_rate": 7.7157516884795e-07, "loss": 2.5114, "step": 6922 }, { "epoch": 0.83, "learning_rate": 7.705040547336973e-07, "loss": 2.6372, "step": 6923 }, { "epoch": 0.83, "learning_rate": 7.694336225351107e-07, "loss": 2.5883, "step": 6924 }, { "epoch": 0.83, "learning_rate": 7.683638724247778e-07, "loss": 2.5683, "step": 6925 }, { "epoch": 0.83, "learning_rate": 7.672948045751699e-07, "loss": 2.3527, "step": 6926 }, { "epoch": 0.83, "learning_rate": 7.662264191586533e-07, "loss": 2.5291, "step": 6927 }, { "epoch": 0.83, "learning_rate": 7.651587163474822e-07, "loss": 2.5628, "step": 6928 }, { "epoch": 0.83, "learning_rate": 7.64091696313799e-07, "loss": 2.4565, "step": 6929 }, { "epoch": 0.83, "learning_rate": 7.630253592296388e-07, "loss": 2.4799, "step": 6930 }, { "epoch": 0.83, "learning_rate": 7.619597052669265e-07, "loss": 2.5149, "step": 6931 }, { "epoch": 0.83, "learning_rate": 7.60894734597476e-07, "loss": 2.4274, "step": 6932 }, { "epoch": 0.83, "learning_rate": 7.59830447392989e-07, "loss": 2.6478, "step": 6933 }, { "epoch": 0.83, "learning_rate": 7.587668438250612e-07, "loss": 2.6902, "step": 6934 }, { "epoch": 0.83, "learning_rate": 7.577039240651757e-07, "loss": 2.5341, "step": 6935 }, { "epoch": 0.83, "learning_rate": 7.566416882847039e-07, "loss": 2.3667, "step": 6936 }, { "epoch": 0.83, "learning_rate": 7.555801366549109e-07, "loss": 2.5559, "step": 6937 }, { "epoch": 0.83, "learning_rate": 7.545192693469467e-07, "loss": 2.4354, "step": 6938 }, { "epoch": 0.83, "learning_rate": 7.534590865318547e-07, "loss": 2.3792, "step": 6939 }, { "epoch": 0.83, "learning_rate": 7.52399588380568e-07, "loss": 2.4067, "step": 6940 }, { "epoch": 0.83, "learning_rate": 7.51340775063904e-07, "loss": 2.5818, "step": 6941 }, { "epoch": 0.83, "learning_rate": 7.502826467525787e-07, "loss": 2.5167, "step": 6942 }, { "epoch": 0.83, "learning_rate": 7.492252036171893e-07, "loss": 2.4099, "step": 6943 }, { "epoch": 0.83, "learning_rate": 7.481684458282273e-07, "loss": 2.3273, "step": 6944 }, { "epoch": 0.83, "learning_rate": 7.471123735560715e-07, "loss": 2.6003, "step": 6945 }, { "epoch": 0.83, "learning_rate": 7.460569869709905e-07, "loss": 2.47, "step": 6946 }, { "epoch": 0.83, "learning_rate": 7.450022862431449e-07, "loss": 2.5858, "step": 6947 }, { "epoch": 0.83, "learning_rate": 7.439482715425806e-07, "loss": 2.571, "step": 6948 }, { "epoch": 0.83, "learning_rate": 7.428949430392357e-07, "loss": 2.3359, "step": 6949 }, { "epoch": 0.83, "learning_rate": 7.418423009029363e-07, "loss": 2.6286, "step": 6950 }, { "epoch": 0.84, "learning_rate": 7.407903453033982e-07, "loss": 2.4648, "step": 6951 }, { "epoch": 0.84, "learning_rate": 7.39739076410228e-07, "loss": 2.4452, "step": 6952 }, { "epoch": 0.84, "learning_rate": 7.38688494392919e-07, "loss": 2.5696, "step": 6953 }, { "epoch": 0.84, "learning_rate": 7.376385994208574e-07, "loss": 2.5671, "step": 6954 }, { "epoch": 0.84, "learning_rate": 7.365893916633132e-07, "loss": 2.6858, "step": 6955 }, { "epoch": 0.84, "learning_rate": 7.355408712894508e-07, "loss": 2.4907, "step": 6956 }, { "epoch": 0.84, "learning_rate": 7.344930384683202e-07, "loss": 2.6572, "step": 6957 }, { "epoch": 0.84, "learning_rate": 7.334458933688626e-07, "loss": 2.4569, "step": 6958 }, { "epoch": 0.84, "learning_rate": 7.323994361599091e-07, "loss": 2.3819, "step": 6959 }, { "epoch": 0.84, "learning_rate": 7.313536670101762e-07, "loss": 2.441, "step": 6960 }, { "epoch": 0.84, "learning_rate": 7.303085860882725e-07, "loss": 2.6341, "step": 6961 }, { "epoch": 0.84, "learning_rate": 7.292641935626966e-07, "loss": 2.686, "step": 6962 }, { "epoch": 0.84, "learning_rate": 7.282204896018307e-07, "loss": 2.4708, "step": 6963 }, { "epoch": 0.84, "learning_rate": 7.271774743739546e-07, "loss": 2.3816, "step": 6964 }, { "epoch": 0.84, "learning_rate": 7.261351480472284e-07, "loss": 2.5959, "step": 6965 }, { "epoch": 0.84, "learning_rate": 7.250935107897078e-07, "loss": 2.4079, "step": 6966 }, { "epoch": 0.84, "learning_rate": 7.240525627693312e-07, "loss": 2.3906, "step": 6967 }, { "epoch": 0.84, "learning_rate": 7.23012304153931e-07, "loss": 2.577, "step": 6968 }, { "epoch": 0.84, "learning_rate": 7.219727351112276e-07, "loss": 2.46, "step": 6969 }, { "epoch": 0.84, "learning_rate": 7.209338558088275e-07, "loss": 2.473, "step": 6970 }, { "epoch": 0.84, "learning_rate": 7.198956664142292e-07, "loss": 2.3829, "step": 6971 }, { "epoch": 0.84, "learning_rate": 7.18858167094817e-07, "loss": 2.5336, "step": 6972 }, { "epoch": 0.84, "learning_rate": 7.178213580178655e-07, "loss": 2.5946, "step": 6973 }, { "epoch": 0.84, "learning_rate": 7.167852393505393e-07, "loss": 2.4993, "step": 6974 }, { "epoch": 0.84, "learning_rate": 7.157498112598893e-07, "loss": 2.5622, "step": 6975 }, { "epoch": 0.84, "learning_rate": 7.147150739128577e-07, "loss": 2.379, "step": 6976 }, { "epoch": 0.84, "learning_rate": 7.136810274762717e-07, "loss": 2.5264, "step": 6977 }, { "epoch": 0.84, "learning_rate": 7.126476721168513e-07, "loss": 2.4595, "step": 6978 }, { "epoch": 0.84, "learning_rate": 7.116150080011996e-07, "loss": 2.7064, "step": 6979 }, { "epoch": 0.84, "learning_rate": 7.105830352958143e-07, "loss": 2.6926, "step": 6980 }, { "epoch": 0.84, "learning_rate": 7.095517541670793e-07, "loss": 2.4068, "step": 6981 }, { "epoch": 0.84, "learning_rate": 7.085211647812645e-07, "loss": 2.5204, "step": 6982 }, { "epoch": 0.84, "learning_rate": 7.07491267304532e-07, "loss": 2.3869, "step": 6983 }, { "epoch": 0.84, "learning_rate": 7.064620619029294e-07, "loss": 2.6386, "step": 6984 }, { "epoch": 0.84, "learning_rate": 7.054335487423946e-07, "loss": 2.4831, "step": 6985 }, { "epoch": 0.84, "learning_rate": 7.04405727988754e-07, "loss": 2.6016, "step": 6986 }, { "epoch": 0.84, "learning_rate": 7.033785998077202e-07, "loss": 2.5212, "step": 6987 }, { "epoch": 0.84, "learning_rate": 7.023521643648984e-07, "loss": 2.4323, "step": 6988 }, { "epoch": 0.84, "learning_rate": 7.013264218257765e-07, "loss": 2.5483, "step": 6989 }, { "epoch": 0.84, "learning_rate": 7.003013723557356e-07, "loss": 2.5896, "step": 6990 }, { "epoch": 0.84, "learning_rate": 6.992770161200402e-07, "loss": 2.5293, "step": 6991 }, { "epoch": 0.84, "learning_rate": 6.982533532838481e-07, "loss": 2.4751, "step": 6992 }, { "epoch": 0.84, "learning_rate": 6.972303840122036e-07, "loss": 2.3935, "step": 6993 }, { "epoch": 0.84, "learning_rate": 6.962081084700361e-07, "loss": 2.4752, "step": 6994 }, { "epoch": 0.84, "learning_rate": 6.951865268221686e-07, "loss": 2.4264, "step": 6995 }, { "epoch": 0.84, "learning_rate": 6.941656392333046e-07, "loss": 2.5385, "step": 6996 }, { "epoch": 0.84, "learning_rate": 6.931454458680464e-07, "loss": 2.4379, "step": 6997 }, { "epoch": 0.84, "learning_rate": 6.921259468908742e-07, "loss": 2.5093, "step": 6998 }, { "epoch": 0.84, "learning_rate": 6.911071424661614e-07, "loss": 2.5523, "step": 6999 }, { "epoch": 0.84, "learning_rate": 6.900890327581694e-07, "loss": 2.2903, "step": 7000 }, { "epoch": 0.84, "learning_rate": 6.890716179310447e-07, "loss": 2.3628, "step": 7001 }, { "epoch": 0.84, "learning_rate": 6.880548981488261e-07, "loss": 2.395, "step": 7002 }, { "epoch": 0.84, "learning_rate": 6.870388735754358e-07, "loss": 2.623, "step": 7003 }, { "epoch": 0.84, "learning_rate": 6.86023544374686e-07, "loss": 2.5501, "step": 7004 }, { "epoch": 0.84, "learning_rate": 6.850089107102787e-07, "loss": 2.6441, "step": 7005 }, { "epoch": 0.84, "learning_rate": 6.839949727458e-07, "loss": 2.4659, "step": 7006 }, { "epoch": 0.84, "learning_rate": 6.829817306447267e-07, "loss": 2.5754, "step": 7007 }, { "epoch": 0.84, "learning_rate": 6.819691845704207e-07, "loss": 2.4002, "step": 7008 }, { "epoch": 0.84, "learning_rate": 6.809573346861364e-07, "loss": 2.5553, "step": 7009 }, { "epoch": 0.84, "learning_rate": 6.799461811550101e-07, "loss": 2.5189, "step": 7010 }, { "epoch": 0.84, "learning_rate": 6.789357241400701e-07, "loss": 2.5037, "step": 7011 }, { "epoch": 0.84, "learning_rate": 6.779259638042318e-07, "loss": 2.2808, "step": 7012 }, { "epoch": 0.84, "learning_rate": 6.769169003102954e-07, "loss": 2.4919, "step": 7013 }, { "epoch": 0.84, "learning_rate": 6.759085338209514e-07, "loss": 2.6612, "step": 7014 }, { "epoch": 0.84, "learning_rate": 6.749008644987787e-07, "loss": 2.5852, "step": 7015 }, { "epoch": 0.84, "learning_rate": 6.738938925062399e-07, "loss": 2.4972, "step": 7016 }, { "epoch": 0.84, "learning_rate": 6.728876180056904e-07, "loss": 2.5964, "step": 7017 }, { "epoch": 0.84, "learning_rate": 6.718820411593685e-07, "loss": 2.4698, "step": 7018 }, { "epoch": 0.84, "learning_rate": 6.708771621294019e-07, "loss": 2.577, "step": 7019 }, { "epoch": 0.84, "learning_rate": 6.698729810778065e-07, "loss": 2.5412, "step": 7020 }, { "epoch": 0.84, "learning_rate": 6.688694981664857e-07, "loss": 2.425, "step": 7021 }, { "epoch": 0.84, "learning_rate": 6.678667135572293e-07, "loss": 2.5704, "step": 7022 }, { "epoch": 0.84, "learning_rate": 6.668646274117135e-07, "loss": 2.5388, "step": 7023 }, { "epoch": 0.84, "learning_rate": 6.658632398915049e-07, "loss": 2.6105, "step": 7024 }, { "epoch": 0.84, "learning_rate": 6.648625511580547e-07, "loss": 2.4506, "step": 7025 }, { "epoch": 0.84, "learning_rate": 6.638625613727024e-07, "loss": 2.4881, "step": 7026 }, { "epoch": 0.84, "learning_rate": 6.62863270696677e-07, "loss": 2.5272, "step": 7027 }, { "epoch": 0.84, "learning_rate": 6.618646792910893e-07, "loss": 2.4991, "step": 7028 }, { "epoch": 0.84, "learning_rate": 6.608667873169444e-07, "loss": 2.5807, "step": 7029 }, { "epoch": 0.84, "learning_rate": 6.59869594935127e-07, "loss": 2.5865, "step": 7030 }, { "epoch": 0.84, "learning_rate": 6.588731023064177e-07, "loss": 2.5757, "step": 7031 }, { "epoch": 0.84, "learning_rate": 6.578773095914758e-07, "loss": 2.5052, "step": 7032 }, { "epoch": 0.84, "learning_rate": 6.568822169508532e-07, "loss": 2.3653, "step": 7033 }, { "epoch": 0.85, "learning_rate": 6.558878245449879e-07, "loss": 2.4283, "step": 7034 }, { "epoch": 0.85, "learning_rate": 6.548941325342024e-07, "loss": 2.3236, "step": 7035 }, { "epoch": 0.85, "learning_rate": 6.539011410787105e-07, "loss": 2.4657, "step": 7036 }, { "epoch": 0.85, "learning_rate": 6.529088503386089e-07, "loss": 2.4938, "step": 7037 }, { "epoch": 0.85, "learning_rate": 6.519172604738838e-07, "loss": 2.4699, "step": 7038 }, { "epoch": 0.85, "learning_rate": 6.509263716444092e-07, "loss": 2.4351, "step": 7039 }, { "epoch": 0.85, "learning_rate": 6.499361840099421e-07, "loss": 2.4577, "step": 7040 }, { "epoch": 0.85, "learning_rate": 6.489466977301312e-07, "loss": 2.4382, "step": 7041 }, { "epoch": 0.85, "learning_rate": 6.479579129645092e-07, "loss": 2.5262, "step": 7042 }, { "epoch": 0.85, "learning_rate": 6.469698298724974e-07, "loss": 2.5562, "step": 7043 }, { "epoch": 0.85, "learning_rate": 6.459824486134015e-07, "loss": 2.3493, "step": 7044 }, { "epoch": 0.85, "learning_rate": 6.449957693464159e-07, "loss": 2.5105, "step": 7045 }, { "epoch": 0.85, "learning_rate": 6.440097922306232e-07, "loss": 2.5205, "step": 7046 }, { "epoch": 0.85, "learning_rate": 6.430245174249889e-07, "loss": 2.3766, "step": 7047 }, { "epoch": 0.85, "learning_rate": 6.42039945088369e-07, "loss": 2.5755, "step": 7048 }, { "epoch": 0.85, "learning_rate": 6.410560753795037e-07, "loss": 2.4185, "step": 7049 }, { "epoch": 0.85, "learning_rate": 6.400729084570212e-07, "loss": 2.6484, "step": 7050 }, { "epoch": 0.85, "learning_rate": 6.390904444794372e-07, "loss": 2.488, "step": 7051 }, { "epoch": 0.85, "learning_rate": 6.381086836051498e-07, "loss": 2.5949, "step": 7052 }, { "epoch": 0.85, "learning_rate": 6.371276259924514e-07, "loss": 2.3084, "step": 7053 }, { "epoch": 0.85, "learning_rate": 6.361472717995126e-07, "loss": 2.4573, "step": 7054 }, { "epoch": 0.85, "learning_rate": 6.351676211843983e-07, "loss": 2.5246, "step": 7055 }, { "epoch": 0.85, "learning_rate": 6.341886743050523e-07, "loss": 2.3508, "step": 7056 }, { "epoch": 0.85, "learning_rate": 6.332104313193111e-07, "loss": 2.5343, "step": 7057 }, { "epoch": 0.85, "learning_rate": 6.322328923848958e-07, "loss": 2.5926, "step": 7058 }, { "epoch": 0.85, "learning_rate": 6.312560576594118e-07, "loss": 2.4048, "step": 7059 }, { "epoch": 0.85, "learning_rate": 6.302799273003546e-07, "loss": 2.4688, "step": 7060 }, { "epoch": 0.85, "learning_rate": 6.293045014651028e-07, "loss": 2.7096, "step": 7061 }, { "epoch": 0.85, "learning_rate": 6.283297803109234e-07, "loss": 2.6595, "step": 7062 }, { "epoch": 0.85, "learning_rate": 6.273557639949695e-07, "loss": 2.3241, "step": 7063 }, { "epoch": 0.85, "learning_rate": 6.263824526742807e-07, "loss": 2.5094, "step": 7064 }, { "epoch": 0.85, "learning_rate": 6.254098465057834e-07, "loss": 2.5791, "step": 7065 }, { "epoch": 0.85, "learning_rate": 6.244379456462873e-07, "loss": 2.4879, "step": 7066 }, { "epoch": 0.85, "learning_rate": 6.234667502524915e-07, "loss": 2.5054, "step": 7067 }, { "epoch": 0.85, "learning_rate": 6.22496260480982e-07, "loss": 2.4852, "step": 7068 }, { "epoch": 0.85, "learning_rate": 6.215264764882273e-07, "loss": 2.5027, "step": 7069 }, { "epoch": 0.85, "learning_rate": 6.205573984305857e-07, "loss": 2.461, "step": 7070 }, { "epoch": 0.85, "learning_rate": 6.195890264642995e-07, "loss": 2.5505, "step": 7071 }, { "epoch": 0.85, "learning_rate": 6.186213607454977e-07, "loss": 2.6249, "step": 7072 }, { "epoch": 0.85, "learning_rate": 6.176544014301978e-07, "loss": 2.6036, "step": 7073 }, { "epoch": 0.85, "learning_rate": 6.16688148674297e-07, "loss": 2.3603, "step": 7074 }, { "epoch": 0.85, "learning_rate": 6.157226026335883e-07, "loss": 2.4026, "step": 7075 }, { "epoch": 0.85, "learning_rate": 6.147577634637413e-07, "loss": 2.5778, "step": 7076 }, { "epoch": 0.85, "learning_rate": 6.13793631320318e-07, "loss": 2.4887, "step": 7077 }, { "epoch": 0.85, "learning_rate": 6.128302063587622e-07, "loss": 2.4981, "step": 7078 }, { "epoch": 0.85, "learning_rate": 6.118674887344062e-07, "loss": 2.4814, "step": 7079 }, { "epoch": 0.85, "learning_rate": 6.109054786024692e-07, "loss": 2.5769, "step": 7080 }, { "epoch": 0.85, "learning_rate": 6.099441761180519e-07, "loss": 2.5252, "step": 7081 }, { "epoch": 0.85, "learning_rate": 6.089835814361461e-07, "loss": 2.4056, "step": 7082 }, { "epoch": 0.85, "learning_rate": 6.080236947116259e-07, "loss": 2.3448, "step": 7083 }, { "epoch": 0.85, "learning_rate": 6.070645160992523e-07, "loss": 2.5033, "step": 7084 }, { "epoch": 0.85, "learning_rate": 6.061060457536727e-07, "loss": 2.5494, "step": 7085 }, { "epoch": 0.85, "learning_rate": 6.051482838294203e-07, "loss": 2.5221, "step": 7086 }, { "epoch": 0.85, "learning_rate": 6.041912304809139e-07, "loss": 2.7329, "step": 7087 }, { "epoch": 0.85, "learning_rate": 6.03234885862457e-07, "loss": 2.5862, "step": 7088 }, { "epoch": 0.85, "learning_rate": 6.022792501282409e-07, "loss": 2.5092, "step": 7089 }, { "epoch": 0.85, "learning_rate": 6.013243234323396e-07, "loss": 2.6358, "step": 7090 }, { "epoch": 0.85, "learning_rate": 6.003701059287159e-07, "loss": 2.4988, "step": 7091 }, { "epoch": 0.85, "learning_rate": 5.994165977712175e-07, "loss": 2.7039, "step": 7092 }, { "epoch": 0.85, "learning_rate": 5.98463799113575e-07, "loss": 2.3833, "step": 7093 }, { "epoch": 0.85, "learning_rate": 5.975117101094091e-07, "loss": 2.5777, "step": 7094 }, { "epoch": 0.85, "learning_rate": 5.965603309122215e-07, "loss": 2.5442, "step": 7095 }, { "epoch": 0.85, "learning_rate": 5.956096616754037e-07, "loss": 2.5086, "step": 7096 }, { "epoch": 0.85, "learning_rate": 5.946597025522294e-07, "loss": 2.577, "step": 7097 }, { "epoch": 0.85, "learning_rate": 5.937104536958598e-07, "loss": 2.5645, "step": 7098 }, { "epoch": 0.85, "learning_rate": 5.927619152593428e-07, "loss": 2.4049, "step": 7099 }, { "epoch": 0.85, "learning_rate": 5.918140873956063e-07, "loss": 2.6013, "step": 7100 }, { "epoch": 0.85, "learning_rate": 5.908669702574705e-07, "loss": 2.6227, "step": 7101 }, { "epoch": 0.85, "learning_rate": 5.899205639976347e-07, "loss": 2.577, "step": 7102 }, { "epoch": 0.85, "learning_rate": 5.889748687686886e-07, "loss": 2.5048, "step": 7103 }, { "epoch": 0.85, "learning_rate": 5.880298847231059e-07, "loss": 2.6582, "step": 7104 }, { "epoch": 0.85, "learning_rate": 5.870856120132434e-07, "loss": 2.4305, "step": 7105 }, { "epoch": 0.85, "learning_rate": 5.861420507913462e-07, "loss": 2.6511, "step": 7106 }, { "epoch": 0.85, "learning_rate": 5.851992012095414e-07, "loss": 2.3853, "step": 7107 }, { "epoch": 0.85, "learning_rate": 5.842570634198453e-07, "loss": 2.6996, "step": 7108 }, { "epoch": 0.85, "learning_rate": 5.833156375741561e-07, "loss": 2.5249, "step": 7109 }, { "epoch": 0.85, "learning_rate": 5.823749238242593e-07, "loss": 2.4923, "step": 7110 }, { "epoch": 0.85, "learning_rate": 5.814349223218263e-07, "loss": 2.515, "step": 7111 }, { "epoch": 0.85, "learning_rate": 5.804956332184092e-07, "loss": 2.5192, "step": 7112 }, { "epoch": 0.85, "learning_rate": 5.795570566654507e-07, "loss": 2.4299, "step": 7113 }, { "epoch": 0.85, "learning_rate": 5.786191928142748e-07, "loss": 2.6531, "step": 7114 }, { "epoch": 0.85, "learning_rate": 5.776820418160916e-07, "loss": 2.5931, "step": 7115 }, { "epoch": 0.85, "learning_rate": 5.767456038219987e-07, "loss": 2.5592, "step": 7116 }, { "epoch": 0.85, "learning_rate": 5.758098789829746e-07, "loss": 2.3397, "step": 7117 }, { "epoch": 0.86, "learning_rate": 5.748748674498855e-07, "loss": 2.6578, "step": 7118 }, { "epoch": 0.86, "learning_rate": 5.739405693734823e-07, "loss": 2.4699, "step": 7119 }, { "epoch": 0.86, "learning_rate": 5.730069849044007e-07, "loss": 2.5224, "step": 7120 }, { "epoch": 0.86, "learning_rate": 5.720741141931613e-07, "loss": 2.6142, "step": 7121 }, { "epoch": 0.86, "learning_rate": 5.711419573901683e-07, "loss": 2.521, "step": 7122 }, { "epoch": 0.86, "learning_rate": 5.702105146457143e-07, "loss": 2.4117, "step": 7123 }, { "epoch": 0.86, "learning_rate": 5.692797861099719e-07, "loss": 2.4403, "step": 7124 }, { "epoch": 0.86, "learning_rate": 5.683497719330022e-07, "loss": 2.4956, "step": 7125 }, { "epoch": 0.86, "learning_rate": 5.674204722647514e-07, "loss": 2.5664, "step": 7126 }, { "epoch": 0.86, "learning_rate": 5.664918872550468e-07, "loss": 2.4348, "step": 7127 }, { "epoch": 0.86, "learning_rate": 5.655640170536053e-07, "loss": 2.6201, "step": 7128 }, { "epoch": 0.86, "learning_rate": 5.64636861810024e-07, "loss": 2.6298, "step": 7129 }, { "epoch": 0.86, "learning_rate": 5.637104216737871e-07, "loss": 2.3339, "step": 7130 }, { "epoch": 0.86, "learning_rate": 5.627846967942646e-07, "loss": 2.445, "step": 7131 }, { "epoch": 0.86, "learning_rate": 5.618596873207083e-07, "loss": 2.5413, "step": 7132 }, { "epoch": 0.86, "learning_rate": 5.609353934022582e-07, "loss": 2.544, "step": 7133 }, { "epoch": 0.86, "learning_rate": 5.600118151879347e-07, "loss": 2.5083, "step": 7134 }, { "epoch": 0.86, "learning_rate": 5.590889528266469e-07, "loss": 2.4732, "step": 7135 }, { "epoch": 0.86, "learning_rate": 5.581668064671847e-07, "loss": 2.489, "step": 7136 }, { "epoch": 0.86, "learning_rate": 5.572453762582253e-07, "loss": 2.3155, "step": 7137 }, { "epoch": 0.86, "learning_rate": 5.563246623483309e-07, "loss": 2.4213, "step": 7138 }, { "epoch": 0.86, "learning_rate": 5.554046648859446e-07, "loss": 2.3451, "step": 7139 }, { "epoch": 0.86, "learning_rate": 5.544853840193981e-07, "loss": 2.4915, "step": 7140 }, { "epoch": 0.86, "learning_rate": 5.53566819896903e-07, "loss": 2.4581, "step": 7141 }, { "epoch": 0.86, "learning_rate": 5.526489726665624e-07, "loss": 2.5923, "step": 7142 }, { "epoch": 0.86, "learning_rate": 5.517318424763562e-07, "loss": 2.4803, "step": 7143 }, { "epoch": 0.86, "learning_rate": 5.50815429474153e-07, "loss": 2.5425, "step": 7144 }, { "epoch": 0.86, "learning_rate": 5.498997338077062e-07, "loss": 2.5374, "step": 7145 }, { "epoch": 0.86, "learning_rate": 5.489847556246491e-07, "loss": 2.5923, "step": 7146 }, { "epoch": 0.86, "learning_rate": 5.480704950725057e-07, "loss": 2.504, "step": 7147 }, { "epoch": 0.86, "learning_rate": 5.471569522986775e-07, "loss": 2.2859, "step": 7148 }, { "epoch": 0.86, "learning_rate": 5.46244127450456e-07, "loss": 2.4843, "step": 7149 }, { "epoch": 0.86, "learning_rate": 5.453320206750152e-07, "loss": 2.2894, "step": 7150 }, { "epoch": 0.86, "learning_rate": 5.444206321194101e-07, "loss": 2.5239, "step": 7151 }, { "epoch": 0.86, "learning_rate": 5.43509961930585e-07, "loss": 2.4396, "step": 7152 }, { "epoch": 0.86, "learning_rate": 5.426000102553647e-07, "loss": 2.3656, "step": 7153 }, { "epoch": 0.86, "learning_rate": 5.416907772404606e-07, "loss": 2.4234, "step": 7154 }, { "epoch": 0.86, "learning_rate": 5.40782263032466e-07, "loss": 2.3908, "step": 7155 }, { "epoch": 0.86, "learning_rate": 5.398744677778595e-07, "loss": 2.3035, "step": 7156 }, { "epoch": 0.86, "learning_rate": 5.389673916230048e-07, "loss": 2.499, "step": 7157 }, { "epoch": 0.86, "learning_rate": 5.380610347141463e-07, "loss": 2.3504, "step": 7158 }, { "epoch": 0.86, "learning_rate": 5.371553971974169e-07, "loss": 2.4321, "step": 7159 }, { "epoch": 0.86, "learning_rate": 5.3625047921883e-07, "loss": 2.5038, "step": 7160 }, { "epoch": 0.86, "learning_rate": 5.353462809242838e-07, "loss": 2.5523, "step": 7161 }, { "epoch": 0.86, "learning_rate": 5.344428024595633e-07, "loss": 2.5417, "step": 7162 }, { "epoch": 0.86, "learning_rate": 5.335400439703309e-07, "loss": 2.588, "step": 7163 }, { "epoch": 0.86, "learning_rate": 5.326380056021419e-07, "loss": 2.3856, "step": 7164 }, { "epoch": 0.86, "learning_rate": 5.317366875004271e-07, "loss": 2.6528, "step": 7165 }, { "epoch": 0.86, "learning_rate": 5.30836089810507e-07, "loss": 2.5672, "step": 7166 }, { "epoch": 0.86, "learning_rate": 5.299362126775814e-07, "loss": 2.4255, "step": 7167 }, { "epoch": 0.86, "learning_rate": 5.290370562467378e-07, "loss": 2.5477, "step": 7168 }, { "epoch": 0.86, "learning_rate": 5.281386206629468e-07, "loss": 2.5759, "step": 7169 }, { "epoch": 0.86, "learning_rate": 5.272409060710598e-07, "loss": 2.5212, "step": 7170 }, { "epoch": 0.86, "learning_rate": 5.263439126158149e-07, "loss": 2.4678, "step": 7171 }, { "epoch": 0.86, "learning_rate": 5.254476404418341e-07, "loss": 2.5561, "step": 7172 }, { "epoch": 0.86, "learning_rate": 5.245520896936208e-07, "loss": 2.513, "step": 7173 }, { "epoch": 0.86, "learning_rate": 5.236572605155632e-07, "loss": 2.4108, "step": 7174 }, { "epoch": 0.86, "learning_rate": 5.227631530519339e-07, "loss": 2.6567, "step": 7175 }, { "epoch": 0.86, "learning_rate": 5.218697674468898e-07, "loss": 2.6726, "step": 7176 }, { "epoch": 0.86, "learning_rate": 5.209771038444677e-07, "loss": 2.5279, "step": 7177 }, { "epoch": 0.86, "learning_rate": 5.200851623885922e-07, "loss": 2.5512, "step": 7178 }, { "epoch": 0.86, "learning_rate": 5.191939432230702e-07, "loss": 2.5547, "step": 7179 }, { "epoch": 0.86, "learning_rate": 5.183034464915898e-07, "loss": 2.4334, "step": 7180 }, { "epoch": 0.86, "learning_rate": 5.174136723377266e-07, "loss": 2.4235, "step": 7181 }, { "epoch": 0.86, "learning_rate": 5.165246209049357e-07, "loss": 2.3993, "step": 7182 }, { "epoch": 0.86, "learning_rate": 5.156362923365587e-07, "loss": 2.5758, "step": 7183 }, { "epoch": 0.86, "learning_rate": 5.147486867758201e-07, "loss": 2.3624, "step": 7184 }, { "epoch": 0.86, "learning_rate": 5.13861804365825e-07, "loss": 2.4513, "step": 7185 }, { "epoch": 0.86, "learning_rate": 5.129756452495676e-07, "loss": 2.4197, "step": 7186 }, { "epoch": 0.86, "learning_rate": 5.120902095699193e-07, "loss": 2.5422, "step": 7187 }, { "epoch": 0.86, "learning_rate": 5.112054974696395e-07, "loss": 2.476, "step": 7188 }, { "epoch": 0.86, "learning_rate": 5.103215090913676e-07, "loss": 2.4772, "step": 7189 }, { "epoch": 0.86, "learning_rate": 5.094382445776281e-07, "loss": 2.5008, "step": 7190 }, { "epoch": 0.86, "learning_rate": 5.0855570407083e-07, "loss": 2.5613, "step": 7191 }, { "epoch": 0.86, "learning_rate": 5.076738877132614e-07, "loss": 2.6242, "step": 7192 }, { "epoch": 0.86, "learning_rate": 5.067927956470992e-07, "loss": 2.506, "step": 7193 }, { "epoch": 0.86, "learning_rate": 5.059124280143985e-07, "loss": 2.4647, "step": 7194 }, { "epoch": 0.86, "learning_rate": 5.050327849571002e-07, "loss": 2.3254, "step": 7195 }, { "epoch": 0.86, "learning_rate": 5.041538666170282e-07, "loss": 2.3558, "step": 7196 }, { "epoch": 0.86, "learning_rate": 5.03275673135889e-07, "loss": 2.4896, "step": 7197 }, { "epoch": 0.86, "learning_rate": 5.023982046552739e-07, "loss": 2.502, "step": 7198 }, { "epoch": 0.86, "learning_rate": 5.015214613166535e-07, "loss": 2.5853, "step": 7199 }, { "epoch": 0.86, "learning_rate": 5.006454432613867e-07, "loss": 2.5238, "step": 7200 }, { "epoch": 0.87, "learning_rate": 4.997701506307095e-07, "loss": 2.5531, "step": 7201 }, { "epoch": 0.87, "learning_rate": 4.988955835657456e-07, "loss": 2.4281, "step": 7202 }, { "epoch": 0.87, "learning_rate": 4.980217422075018e-07, "loss": 2.5282, "step": 7203 }, { "epoch": 0.87, "learning_rate": 4.971486266968634e-07, "loss": 2.4562, "step": 7204 }, { "epoch": 0.87, "learning_rate": 4.962762371746038e-07, "loss": 2.5405, "step": 7205 }, { "epoch": 0.87, "learning_rate": 4.954045737813762e-07, "loss": 2.4427, "step": 7206 }, { "epoch": 0.87, "learning_rate": 4.945336366577169e-07, "loss": 2.5608, "step": 7207 }, { "epoch": 0.87, "learning_rate": 4.93663425944047e-07, "loss": 2.5373, "step": 7208 }, { "epoch": 0.87, "learning_rate": 4.927939417806693e-07, "loss": 2.6382, "step": 7209 }, { "epoch": 0.87, "learning_rate": 4.919251843077699e-07, "loss": 2.5288, "step": 7210 }, { "epoch": 0.87, "learning_rate": 4.910571536654163e-07, "loss": 2.2957, "step": 7211 }, { "epoch": 0.87, "learning_rate": 4.901898499935609e-07, "loss": 2.5172, "step": 7212 }, { "epoch": 0.87, "learning_rate": 4.893232734320358e-07, "loss": 2.4648, "step": 7213 }, { "epoch": 0.87, "learning_rate": 4.884574241205603e-07, "loss": 2.653, "step": 7214 }, { "epoch": 0.87, "learning_rate": 4.875923021987333e-07, "loss": 2.6679, "step": 7215 }, { "epoch": 0.87, "learning_rate": 4.867279078060366e-07, "loss": 2.5117, "step": 7216 }, { "epoch": 0.87, "learning_rate": 4.858642410818354e-07, "loss": 2.5194, "step": 7217 }, { "epoch": 0.87, "learning_rate": 4.850013021653788e-07, "loss": 2.5305, "step": 7218 }, { "epoch": 0.87, "learning_rate": 4.841390911957939e-07, "loss": 2.5615, "step": 7219 }, { "epoch": 0.87, "learning_rate": 4.832776083120983e-07, "loss": 2.6335, "step": 7220 }, { "epoch": 0.87, "learning_rate": 4.824168536531848e-07, "loss": 2.5592, "step": 7221 }, { "epoch": 0.87, "learning_rate": 4.815568273578325e-07, "loss": 2.4856, "step": 7222 }, { "epoch": 0.87, "learning_rate": 4.806975295647015e-07, "loss": 2.2908, "step": 7223 }, { "epoch": 0.87, "learning_rate": 4.798389604123355e-07, "loss": 2.3066, "step": 7224 }, { "epoch": 0.87, "learning_rate": 4.789811200391619e-07, "loss": 2.2988, "step": 7225 }, { "epoch": 0.87, "learning_rate": 4.781240085834865e-07, "loss": 2.5438, "step": 7226 }, { "epoch": 0.87, "learning_rate": 4.772676261835024e-07, "loss": 2.5536, "step": 7227 }, { "epoch": 0.87, "learning_rate": 4.764119729772809e-07, "loss": 2.5195, "step": 7228 }, { "epoch": 0.87, "learning_rate": 4.7555704910277887e-07, "loss": 2.568, "step": 7229 }, { "epoch": 0.87, "learning_rate": 4.7470285469783493e-07, "loss": 2.4764, "step": 7230 }, { "epoch": 0.87, "learning_rate": 4.7384938990016836e-07, "loss": 2.6047, "step": 7231 }, { "epoch": 0.87, "learning_rate": 4.729966548473841e-07, "loss": 2.5623, "step": 7232 }, { "epoch": 0.87, "learning_rate": 4.721446496769655e-07, "loss": 2.5745, "step": 7233 }, { "epoch": 0.87, "learning_rate": 4.712933745262815e-07, "loss": 2.4777, "step": 7234 }, { "epoch": 0.87, "learning_rate": 4.704428295325808e-07, "loss": 2.5396, "step": 7235 }, { "epoch": 0.87, "learning_rate": 4.695930148329958e-07, "loss": 2.5459, "step": 7236 }, { "epoch": 0.87, "learning_rate": 4.687439305645419e-07, "loss": 2.4172, "step": 7237 }, { "epoch": 0.87, "learning_rate": 4.678955768641147e-07, "loss": 2.5723, "step": 7238 }, { "epoch": 0.87, "learning_rate": 4.670479538684941e-07, "loss": 2.5921, "step": 7239 }, { "epoch": 0.87, "learning_rate": 4.662010617143392e-07, "loss": 2.3685, "step": 7240 }, { "epoch": 0.87, "learning_rate": 4.653549005381952e-07, "loss": 2.4473, "step": 7241 }, { "epoch": 0.87, "learning_rate": 4.645094704764863e-07, "loss": 2.471, "step": 7242 }, { "epoch": 0.87, "learning_rate": 4.6366477166552073e-07, "loss": 2.4685, "step": 7243 }, { "epoch": 0.87, "learning_rate": 4.628208042414889e-07, "loss": 2.5505, "step": 7244 }, { "epoch": 0.87, "learning_rate": 4.6197756834046037e-07, "loss": 2.4189, "step": 7245 }, { "epoch": 0.87, "learning_rate": 4.6113506409839135e-07, "loss": 2.5042, "step": 7246 }, { "epoch": 0.87, "learning_rate": 4.602932916511149e-07, "loss": 2.6627, "step": 7247 }, { "epoch": 0.87, "learning_rate": 4.5945225113435024e-07, "loss": 2.5217, "step": 7248 }, { "epoch": 0.87, "learning_rate": 4.586119426836977e-07, "loss": 2.3901, "step": 7249 }, { "epoch": 0.87, "learning_rate": 4.5777236643463787e-07, "loss": 2.5806, "step": 7250 }, { "epoch": 0.87, "learning_rate": 4.5693352252253576e-07, "loss": 2.6154, "step": 7251 }, { "epoch": 0.87, "learning_rate": 4.5609541108263377e-07, "loss": 2.38, "step": 7252 }, { "epoch": 0.87, "learning_rate": 4.5525803225006437e-07, "loss": 2.3915, "step": 7253 }, { "epoch": 0.87, "learning_rate": 4.5442138615983344e-07, "loss": 2.6117, "step": 7254 }, { "epoch": 0.87, "learning_rate": 4.535854729468331e-07, "loss": 2.5032, "step": 7255 }, { "epoch": 0.87, "learning_rate": 4.5275029274583715e-07, "loss": 2.6501, "step": 7256 }, { "epoch": 0.87, "learning_rate": 4.519158456914996e-07, "loss": 2.5988, "step": 7257 }, { "epoch": 0.87, "learning_rate": 4.5108213191835835e-07, "loss": 2.5965, "step": 7258 }, { "epoch": 0.87, "learning_rate": 4.502491515608298e-07, "loss": 2.5541, "step": 7259 }, { "epoch": 0.87, "learning_rate": 4.494169047532154e-07, "loss": 2.5433, "step": 7260 }, { "epoch": 0.87, "learning_rate": 4.4858539162969894e-07, "loss": 2.4509, "step": 7261 }, { "epoch": 0.87, "learning_rate": 4.477546123243409e-07, "loss": 2.6333, "step": 7262 }, { "epoch": 0.87, "learning_rate": 4.469245669710881e-07, "loss": 2.4801, "step": 7263 }, { "epoch": 0.87, "learning_rate": 4.4609525570376786e-07, "loss": 2.485, "step": 7264 }, { "epoch": 0.87, "learning_rate": 4.452666786560894e-07, "loss": 2.518, "step": 7265 }, { "epoch": 0.87, "learning_rate": 4.4443883596164083e-07, "loss": 2.7408, "step": 7266 }, { "epoch": 0.87, "learning_rate": 4.4361172775389596e-07, "loss": 2.5248, "step": 7267 }, { "epoch": 0.87, "learning_rate": 4.4278535416620914e-07, "loss": 2.5354, "step": 7268 }, { "epoch": 0.87, "learning_rate": 4.4195971533181223e-07, "loss": 2.5358, "step": 7269 }, { "epoch": 0.87, "learning_rate": 4.411348113838243e-07, "loss": 2.6381, "step": 7270 }, { "epoch": 0.87, "learning_rate": 4.403106424552439e-07, "loss": 2.5136, "step": 7271 }, { "epoch": 0.87, "learning_rate": 4.394872086789481e-07, "loss": 2.3875, "step": 7272 }, { "epoch": 0.87, "learning_rate": 4.3866451018770074e-07, "loss": 2.5735, "step": 7273 }, { "epoch": 0.87, "learning_rate": 4.3784254711414064e-07, "loss": 2.559, "step": 7274 }, { "epoch": 0.87, "learning_rate": 4.370213195907963e-07, "loss": 2.6276, "step": 7275 }, { "epoch": 0.87, "learning_rate": 4.362008277500701e-07, "loss": 2.4778, "step": 7276 }, { "epoch": 0.87, "learning_rate": 4.353810717242496e-07, "loss": 2.5268, "step": 7277 }, { "epoch": 0.87, "learning_rate": 4.3456205164550345e-07, "loss": 2.5978, "step": 7278 }, { "epoch": 0.87, "learning_rate": 4.3374376764588e-07, "loss": 2.5567, "step": 7279 }, { "epoch": 0.87, "learning_rate": 4.329262198573109e-07, "loss": 2.4766, "step": 7280 }, { "epoch": 0.87, "learning_rate": 4.321094084116073e-07, "loss": 2.3987, "step": 7281 }, { "epoch": 0.87, "learning_rate": 4.3129333344046345e-07, "loss": 2.3892, "step": 7282 }, { "epoch": 0.87, "learning_rate": 4.3047799507545397e-07, "loss": 2.4345, "step": 7283 }, { "epoch": 0.88, "learning_rate": 4.2966339344803376e-07, "loss": 2.5241, "step": 7284 }, { "epoch": 0.88, "learning_rate": 4.288495286895405e-07, "loss": 2.3935, "step": 7285 }, { "epoch": 0.88, "learning_rate": 4.280364009311927e-07, "loss": 2.4291, "step": 7286 }, { "epoch": 0.88, "learning_rate": 4.272240103040903e-07, "loss": 2.6228, "step": 7287 }, { "epoch": 0.88, "learning_rate": 4.2641235693921257e-07, "loss": 2.5014, "step": 7288 }, { "epoch": 0.88, "learning_rate": 4.256014409674214e-07, "loss": 2.5744, "step": 7289 }, { "epoch": 0.88, "learning_rate": 4.247912625194611e-07, "loss": 2.4496, "step": 7290 }, { "epoch": 0.88, "learning_rate": 4.2398182172595393e-07, "loss": 2.3382, "step": 7291 }, { "epoch": 0.88, "learning_rate": 4.231731187174065e-07, "loss": 2.5298, "step": 7292 }, { "epoch": 0.88, "learning_rate": 4.223651536242029e-07, "loss": 2.47, "step": 7293 }, { "epoch": 0.88, "learning_rate": 4.2155792657661066e-07, "loss": 2.4589, "step": 7294 }, { "epoch": 0.88, "learning_rate": 4.2075143770478e-07, "loss": 2.4062, "step": 7295 }, { "epoch": 0.88, "learning_rate": 4.199456871387364e-07, "loss": 2.4248, "step": 7296 }, { "epoch": 0.88, "learning_rate": 4.191406750083937e-07, "loss": 2.5215, "step": 7297 }, { "epoch": 0.88, "learning_rate": 4.183364014435398e-07, "loss": 2.4307, "step": 7298 }, { "epoch": 0.88, "learning_rate": 4.175328665738487e-07, "loss": 2.4109, "step": 7299 }, { "epoch": 0.88, "learning_rate": 4.167300705288718e-07, "loss": 2.4653, "step": 7300 }, { "epoch": 0.88, "learning_rate": 4.1592801343804334e-07, "loss": 2.5132, "step": 7301 }, { "epoch": 0.88, "learning_rate": 4.1512669543067873e-07, "loss": 2.4861, "step": 7302 }, { "epoch": 0.88, "learning_rate": 4.143261166359713e-07, "loss": 2.4211, "step": 7303 }, { "epoch": 0.88, "learning_rate": 4.1352627718299953e-07, "loss": 2.4667, "step": 7304 }, { "epoch": 0.88, "learning_rate": 4.1272717720071795e-07, "loss": 2.398, "step": 7305 }, { "epoch": 0.88, "learning_rate": 4.119288168179658e-07, "loss": 2.3611, "step": 7306 }, { "epoch": 0.88, "learning_rate": 4.111311961634623e-07, "loss": 2.7293, "step": 7307 }, { "epoch": 0.88, "learning_rate": 4.10334315365804e-07, "loss": 2.4768, "step": 7308 }, { "epoch": 0.88, "learning_rate": 4.095381745534749e-07, "loss": 2.4837, "step": 7309 }, { "epoch": 0.88, "learning_rate": 4.087427738548322e-07, "loss": 2.4832, "step": 7310 }, { "epoch": 0.88, "learning_rate": 4.079481133981189e-07, "loss": 2.5513, "step": 7311 }, { "epoch": 0.88, "learning_rate": 4.0715419331145646e-07, "loss": 2.458, "step": 7312 }, { "epoch": 0.88, "learning_rate": 4.063610137228474e-07, "loss": 2.5604, "step": 7313 }, { "epoch": 0.88, "learning_rate": 4.0556857476017566e-07, "loss": 2.6307, "step": 7314 }, { "epoch": 0.88, "learning_rate": 4.047768765512039e-07, "loss": 2.5499, "step": 7315 }, { "epoch": 0.88, "learning_rate": 4.0398591922357787e-07, "loss": 2.26, "step": 7316 }, { "epoch": 0.88, "learning_rate": 4.031957029048211e-07, "loss": 2.4035, "step": 7317 }, { "epoch": 0.88, "learning_rate": 4.0240622772234005e-07, "loss": 2.4886, "step": 7318 }, { "epoch": 0.88, "learning_rate": 4.016174938034201e-07, "loss": 2.6167, "step": 7319 }, { "epoch": 0.88, "learning_rate": 4.008295012752278e-07, "loss": 2.5344, "step": 7320 }, { "epoch": 0.88, "learning_rate": 4.000422502648116e-07, "loss": 2.6365, "step": 7321 }, { "epoch": 0.88, "learning_rate": 3.9925574089909603e-07, "loss": 2.5785, "step": 7322 }, { "epoch": 0.88, "learning_rate": 3.984699733048908e-07, "loss": 2.4383, "step": 7323 }, { "epoch": 0.88, "learning_rate": 3.9768494760888455e-07, "loss": 2.5733, "step": 7324 }, { "epoch": 0.88, "learning_rate": 3.969006639376444e-07, "loss": 2.5851, "step": 7325 }, { "epoch": 0.88, "learning_rate": 3.9611712241762024e-07, "loss": 2.4319, "step": 7326 }, { "epoch": 0.88, "learning_rate": 3.953343231751405e-07, "loss": 2.5397, "step": 7327 }, { "epoch": 0.88, "learning_rate": 3.945522663364154e-07, "loss": 2.4683, "step": 7328 }, { "epoch": 0.88, "learning_rate": 3.937709520275351e-07, "loss": 2.5308, "step": 7329 }, { "epoch": 0.88, "learning_rate": 3.9299038037446837e-07, "loss": 2.4036, "step": 7330 }, { "epoch": 0.88, "learning_rate": 3.922105515030683e-07, "loss": 2.5268, "step": 7331 }, { "epoch": 0.88, "learning_rate": 3.914314655390633e-07, "loss": 2.5696, "step": 7332 }, { "epoch": 0.88, "learning_rate": 3.9065312260806623e-07, "loss": 2.3478, "step": 7333 }, { "epoch": 0.88, "learning_rate": 3.898755228355661e-07, "loss": 2.4529, "step": 7334 }, { "epoch": 0.88, "learning_rate": 3.8909866634693484e-07, "loss": 2.3545, "step": 7335 }, { "epoch": 0.88, "learning_rate": 3.8832255326742563e-07, "loss": 2.519, "step": 7336 }, { "epoch": 0.88, "learning_rate": 3.875471837221678e-07, "loss": 2.5441, "step": 7337 }, { "epoch": 0.88, "learning_rate": 3.8677255783617475e-07, "loss": 2.4038, "step": 7338 }, { "epoch": 0.88, "learning_rate": 3.85998675734337e-07, "loss": 2.5866, "step": 7339 }, { "epoch": 0.88, "learning_rate": 3.852255375414271e-07, "loss": 2.4925, "step": 7340 }, { "epoch": 0.88, "learning_rate": 3.8445314338209693e-07, "loss": 2.5016, "step": 7341 }, { "epoch": 0.88, "learning_rate": 3.8368149338087855e-07, "loss": 2.6007, "step": 7342 }, { "epoch": 0.88, "learning_rate": 3.8291058766218526e-07, "loss": 2.4856, "step": 7343 }, { "epoch": 0.88, "learning_rate": 3.821404263503065e-07, "loss": 2.4805, "step": 7344 }, { "epoch": 0.88, "learning_rate": 3.813710095694168e-07, "loss": 2.5351, "step": 7345 }, { "epoch": 0.88, "learning_rate": 3.8060233744356634e-07, "loss": 2.5091, "step": 7346 }, { "epoch": 0.88, "learning_rate": 3.7983441009668774e-07, "loss": 2.2845, "step": 7347 }, { "epoch": 0.88, "learning_rate": 3.7906722765259364e-07, "loss": 2.5157, "step": 7348 }, { "epoch": 0.88, "learning_rate": 3.7830079023497393e-07, "loss": 2.4045, "step": 7349 }, { "epoch": 0.88, "learning_rate": 3.775350979674025e-07, "loss": 2.5561, "step": 7350 }, { "epoch": 0.88, "learning_rate": 3.767701509733285e-07, "loss": 2.5471, "step": 7351 }, { "epoch": 0.88, "learning_rate": 3.760059493760848e-07, "loss": 2.5303, "step": 7352 }, { "epoch": 0.88, "learning_rate": 3.7524249329888183e-07, "loss": 2.6072, "step": 7353 }, { "epoch": 0.88, "learning_rate": 3.744797828648111e-07, "loss": 2.4956, "step": 7354 }, { "epoch": 0.88, "learning_rate": 3.737178181968437e-07, "loss": 2.4836, "step": 7355 }, { "epoch": 0.88, "learning_rate": 3.7295659941782856e-07, "loss": 2.2705, "step": 7356 }, { "epoch": 0.88, "learning_rate": 3.721961266504975e-07, "loss": 2.3644, "step": 7357 }, { "epoch": 0.88, "learning_rate": 3.7143640001745916e-07, "loss": 2.5015, "step": 7358 }, { "epoch": 0.88, "learning_rate": 3.706774196412044e-07, "loss": 2.4285, "step": 7359 }, { "epoch": 0.88, "learning_rate": 3.69919185644102e-07, "loss": 2.6323, "step": 7360 }, { "epoch": 0.88, "learning_rate": 3.691616981484009e-07, "loss": 2.6013, "step": 7361 }, { "epoch": 0.88, "learning_rate": 3.684049572762299e-07, "loss": 2.4026, "step": 7362 }, { "epoch": 0.88, "learning_rate": 3.6764896314959606e-07, "loss": 2.5333, "step": 7363 }, { "epoch": 0.88, "learning_rate": 3.6689371589039013e-07, "loss": 2.4805, "step": 7364 }, { "epoch": 0.88, "learning_rate": 3.6613921562037633e-07, "loss": 2.492, "step": 7365 }, { "epoch": 0.88, "learning_rate": 3.6538546246120353e-07, "loss": 2.3869, "step": 7366 }, { "epoch": 0.89, "learning_rate": 3.6463245653439893e-07, "loss": 2.5174, "step": 7367 }, { "epoch": 0.89, "learning_rate": 3.6388019796136654e-07, "loss": 2.5276, "step": 7368 }, { "epoch": 0.89, "learning_rate": 3.6312868686339375e-07, "loss": 2.3055, "step": 7369 }, { "epoch": 0.89, "learning_rate": 3.6237792336164424e-07, "loss": 2.6116, "step": 7370 }, { "epoch": 0.89, "learning_rate": 3.616279075771628e-07, "loss": 2.504, "step": 7371 }, { "epoch": 0.89, "learning_rate": 3.60878639630875e-07, "loss": 2.4892, "step": 7372 }, { "epoch": 0.89, "learning_rate": 3.601301196435819e-07, "loss": 2.4271, "step": 7373 }, { "epoch": 0.89, "learning_rate": 3.593823477359676e-07, "loss": 2.5548, "step": 7374 }, { "epoch": 0.89, "learning_rate": 3.586353240285945e-07, "loss": 2.5003, "step": 7375 }, { "epoch": 0.89, "learning_rate": 3.5788904864190346e-07, "loss": 2.4124, "step": 7376 }, { "epoch": 0.89, "learning_rate": 3.5714352169621656e-07, "loss": 2.3785, "step": 7377 }, { "epoch": 0.89, "learning_rate": 3.563987433117327e-07, "loss": 2.5888, "step": 7378 }, { "epoch": 0.89, "learning_rate": 3.556547136085331e-07, "loss": 2.2479, "step": 7379 }, { "epoch": 0.89, "learning_rate": 3.5491143270657445e-07, "loss": 2.3572, "step": 7380 }, { "epoch": 0.89, "learning_rate": 3.541689007256965e-07, "loss": 2.5052, "step": 7381 }, { "epoch": 0.89, "learning_rate": 3.534271177856163e-07, "loss": 2.5544, "step": 7382 }, { "epoch": 0.89, "learning_rate": 3.5268608400592987e-07, "loss": 2.5853, "step": 7383 }, { "epoch": 0.89, "learning_rate": 3.519457995061143e-07, "loss": 2.6683, "step": 7384 }, { "epoch": 0.89, "learning_rate": 3.51206264405522e-07, "loss": 2.6758, "step": 7385 }, { "epoch": 0.89, "learning_rate": 3.504674788233908e-07, "loss": 2.4982, "step": 7386 }, { "epoch": 0.89, "learning_rate": 3.497294428788317e-07, "loss": 2.3822, "step": 7387 }, { "epoch": 0.89, "learning_rate": 3.489921566908372e-07, "loss": 2.667, "step": 7388 }, { "epoch": 0.89, "learning_rate": 3.4825562037828054e-07, "loss": 2.5653, "step": 7389 }, { "epoch": 0.89, "learning_rate": 3.4751983405991007e-07, "loss": 2.5551, "step": 7390 }, { "epoch": 0.89, "learning_rate": 3.4678479785435816e-07, "loss": 2.5126, "step": 7391 }, { "epoch": 0.89, "learning_rate": 3.460505118801316e-07, "loss": 2.5487, "step": 7392 }, { "epoch": 0.89, "learning_rate": 3.4531697625561857e-07, "loss": 2.4059, "step": 7393 }, { "epoch": 0.89, "learning_rate": 3.445841910990877e-07, "loss": 2.4765, "step": 7394 }, { "epoch": 0.89, "learning_rate": 3.438521565286823e-07, "loss": 2.642, "step": 7395 }, { "epoch": 0.89, "learning_rate": 3.4312087266242964e-07, "loss": 2.4736, "step": 7396 }, { "epoch": 0.89, "learning_rate": 3.42390339618231e-07, "loss": 2.4759, "step": 7397 }, { "epoch": 0.89, "learning_rate": 3.416605575138726e-07, "loss": 2.5898, "step": 7398 }, { "epoch": 0.89, "learning_rate": 3.409315264670132e-07, "loss": 2.5504, "step": 7399 }, { "epoch": 0.89, "learning_rate": 3.4020324659519487e-07, "loss": 2.5619, "step": 7400 }, { "epoch": 0.89, "learning_rate": 3.3947571801583756e-07, "loss": 2.4192, "step": 7401 }, { "epoch": 0.89, "learning_rate": 3.38748940846238e-07, "loss": 2.5985, "step": 7402 }, { "epoch": 0.89, "learning_rate": 3.380229152035758e-07, "loss": 2.3326, "step": 7403 }, { "epoch": 0.89, "learning_rate": 3.3729764120490447e-07, "loss": 2.4205, "step": 7404 }, { "epoch": 0.89, "learning_rate": 3.3657311896716004e-07, "loss": 2.4164, "step": 7405 }, { "epoch": 0.89, "learning_rate": 3.358493486071568e-07, "loss": 2.6297, "step": 7406 }, { "epoch": 0.89, "learning_rate": 3.351263302415864e-07, "loss": 2.5179, "step": 7407 }, { "epoch": 0.89, "learning_rate": 3.3440406398702055e-07, "loss": 2.4233, "step": 7408 }, { "epoch": 0.89, "learning_rate": 3.336825499599089e-07, "loss": 2.3842, "step": 7409 }, { "epoch": 0.89, "learning_rate": 3.329617882765807e-07, "loss": 2.3199, "step": 7410 }, { "epoch": 0.89, "learning_rate": 3.322417790532423e-07, "loss": 2.4857, "step": 7411 }, { "epoch": 0.89, "learning_rate": 3.315225224059809e-07, "loss": 2.6377, "step": 7412 }, { "epoch": 0.89, "learning_rate": 3.3080401845076106e-07, "loss": 2.6067, "step": 7413 }, { "epoch": 0.89, "learning_rate": 3.3008626730342496e-07, "loss": 2.4915, "step": 7414 }, { "epoch": 0.89, "learning_rate": 3.293692690796968e-07, "loss": 2.4119, "step": 7415 }, { "epoch": 0.89, "learning_rate": 3.286530238951746e-07, "loss": 2.4619, "step": 7416 }, { "epoch": 0.89, "learning_rate": 3.279375318653388e-07, "loss": 2.5698, "step": 7417 }, { "epoch": 0.89, "learning_rate": 3.2722279310554825e-07, "loss": 2.4443, "step": 7418 }, { "epoch": 0.89, "learning_rate": 3.2650880773103686e-07, "loss": 2.4182, "step": 7419 }, { "epoch": 0.89, "learning_rate": 3.25795575856922e-07, "loss": 2.4719, "step": 7420 }, { "epoch": 0.89, "learning_rate": 3.250830975981956e-07, "loss": 2.4857, "step": 7421 }, { "epoch": 0.89, "learning_rate": 3.243713730697301e-07, "loss": 2.4766, "step": 7422 }, { "epoch": 0.89, "learning_rate": 3.2366040238627493e-07, "loss": 2.48, "step": 7423 }, { "epoch": 0.89, "learning_rate": 3.2295018566246007e-07, "loss": 2.503, "step": 7424 }, { "epoch": 0.89, "learning_rate": 3.222407230127922e-07, "loss": 2.4238, "step": 7425 }, { "epoch": 0.89, "learning_rate": 3.215320145516565e-07, "loss": 2.5642, "step": 7426 }, { "epoch": 0.89, "learning_rate": 3.208240603933177e-07, "loss": 2.4594, "step": 7427 }, { "epoch": 0.89, "learning_rate": 3.2011686065191894e-07, "loss": 2.4236, "step": 7428 }, { "epoch": 0.89, "learning_rate": 3.1941041544147897e-07, "loss": 2.587, "step": 7429 }, { "epoch": 0.89, "learning_rate": 3.1870472487589845e-07, "loss": 2.4274, "step": 7430 }, { "epoch": 0.89, "learning_rate": 3.1799978906895456e-07, "loss": 2.5842, "step": 7431 }, { "epoch": 0.89, "learning_rate": 3.172956081343043e-07, "loss": 2.601, "step": 7432 }, { "epoch": 0.89, "learning_rate": 3.165921821854795e-07, "loss": 2.5265, "step": 7433 }, { "epoch": 0.89, "learning_rate": 3.158895113358934e-07, "loss": 2.4854, "step": 7434 }, { "epoch": 0.89, "learning_rate": 3.1518759569883814e-07, "loss": 2.3677, "step": 7435 }, { "epoch": 0.89, "learning_rate": 3.1448643538748045e-07, "loss": 2.5613, "step": 7436 }, { "epoch": 0.89, "learning_rate": 3.1378603051486877e-07, "loss": 2.1597, "step": 7437 }, { "epoch": 0.89, "learning_rate": 3.130863811939272e-07, "loss": 2.4903, "step": 7438 }, { "epoch": 0.89, "learning_rate": 3.1238748753746e-07, "loss": 2.4745, "step": 7439 }, { "epoch": 0.89, "learning_rate": 3.1168934965814966e-07, "loss": 2.5619, "step": 7440 }, { "epoch": 0.89, "learning_rate": 3.1099196766855357e-07, "loss": 2.5186, "step": 7441 }, { "epoch": 0.89, "learning_rate": 3.1029534168111217e-07, "loss": 2.4908, "step": 7442 }, { "epoch": 0.89, "learning_rate": 3.095994718081402e-07, "loss": 2.6297, "step": 7443 }, { "epoch": 0.89, "learning_rate": 3.0890435816183226e-07, "loss": 2.6244, "step": 7444 }, { "epoch": 0.89, "learning_rate": 3.082100008542599e-07, "loss": 2.6643, "step": 7445 }, { "epoch": 0.89, "learning_rate": 3.0751639999737346e-07, "loss": 2.4812, "step": 7446 }, { "epoch": 0.89, "learning_rate": 3.0682355570300306e-07, "loss": 2.636, "step": 7447 }, { "epoch": 0.89, "learning_rate": 3.06131468082852e-07, "loss": 2.4256, "step": 7448 }, { "epoch": 0.89, "learning_rate": 3.0544013724850664e-07, "loss": 2.2894, "step": 7449 }, { "epoch": 0.9, "learning_rate": 3.0474956331142837e-07, "loss": 2.6668, "step": 7450 }, { "epoch": 0.9, "learning_rate": 3.040597463829581e-07, "loss": 2.5251, "step": 7451 }, { "epoch": 0.9, "learning_rate": 3.03370686574313e-07, "loss": 2.5542, "step": 7452 }, { "epoch": 0.9, "learning_rate": 3.0268238399659035e-07, "loss": 2.5387, "step": 7453 }, { "epoch": 0.9, "learning_rate": 3.0199483876076465e-07, "loss": 2.404, "step": 7454 }, { "epoch": 0.9, "learning_rate": 3.013080509776861e-07, "loss": 2.5297, "step": 7455 }, { "epoch": 0.9, "learning_rate": 3.006220207580862e-07, "loss": 2.4893, "step": 7456 }, { "epoch": 0.9, "learning_rate": 2.999367482125709e-07, "loss": 2.5595, "step": 7457 }, { "epoch": 0.9, "learning_rate": 2.992522334516268e-07, "loss": 2.6839, "step": 7458 }, { "epoch": 0.9, "learning_rate": 2.985684765856184e-07, "loss": 2.4838, "step": 7459 }, { "epoch": 0.9, "learning_rate": 2.9788547772478416e-07, "loss": 2.5541, "step": 7460 }, { "epoch": 0.9, "learning_rate": 2.9720323697924545e-07, "loss": 2.5761, "step": 7461 }, { "epoch": 0.9, "learning_rate": 2.965217544589971e-07, "loss": 2.5328, "step": 7462 }, { "epoch": 0.9, "learning_rate": 2.9584103027391453e-07, "loss": 2.5022, "step": 7463 }, { "epoch": 0.9, "learning_rate": 2.951610645337499e-07, "loss": 2.5085, "step": 7464 }, { "epoch": 0.9, "learning_rate": 2.944818573481334e-07, "loss": 2.5811, "step": 7465 }, { "epoch": 0.9, "learning_rate": 2.938034088265723e-07, "loss": 2.6842, "step": 7466 }, { "epoch": 0.9, "learning_rate": 2.93125719078452e-07, "loss": 2.511, "step": 7467 }, { "epoch": 0.9, "learning_rate": 2.9244878821303556e-07, "loss": 2.5078, "step": 7468 }, { "epoch": 0.9, "learning_rate": 2.9177261633946294e-07, "loss": 2.3229, "step": 7469 }, { "epoch": 0.9, "learning_rate": 2.910972035667531e-07, "loss": 2.6174, "step": 7470 }, { "epoch": 0.9, "learning_rate": 2.9042255000380213e-07, "loss": 2.4438, "step": 7471 }, { "epoch": 0.9, "learning_rate": 2.897486557593826e-07, "loss": 2.4391, "step": 7472 }, { "epoch": 0.9, "learning_rate": 2.8907552094214643e-07, "loss": 2.6034, "step": 7473 }, { "epoch": 0.9, "learning_rate": 2.884031456606201e-07, "loss": 2.4423, "step": 7474 }, { "epoch": 0.9, "learning_rate": 2.877315300232131e-07, "loss": 2.4917, "step": 7475 }, { "epoch": 0.9, "learning_rate": 2.870606741382059e-07, "loss": 2.5672, "step": 7476 }, { "epoch": 0.9, "learning_rate": 2.863905781137616e-07, "loss": 2.5695, "step": 7477 }, { "epoch": 0.9, "learning_rate": 2.8572124205791916e-07, "loss": 2.567, "step": 7478 }, { "epoch": 0.9, "learning_rate": 2.8505266607859297e-07, "loss": 2.58, "step": 7479 }, { "epoch": 0.9, "learning_rate": 2.843848502835772e-07, "loss": 2.6181, "step": 7480 }, { "epoch": 0.9, "learning_rate": 2.837177947805442e-07, "loss": 2.5806, "step": 7481 }, { "epoch": 0.9, "learning_rate": 2.8305149967704e-07, "loss": 2.5277, "step": 7482 }, { "epoch": 0.9, "learning_rate": 2.8238596508049275e-07, "loss": 2.6321, "step": 7483 }, { "epoch": 0.9, "learning_rate": 2.817211910982037e-07, "loss": 2.5709, "step": 7484 }, { "epoch": 0.9, "learning_rate": 2.81057177837355e-07, "loss": 2.5485, "step": 7485 }, { "epoch": 0.9, "learning_rate": 2.803939254050031e-07, "loss": 2.5134, "step": 7486 }, { "epoch": 0.9, "learning_rate": 2.797314339080842e-07, "loss": 2.6694, "step": 7487 }, { "epoch": 0.9, "learning_rate": 2.7906970345341177e-07, "loss": 2.4697, "step": 7488 }, { "epoch": 0.9, "learning_rate": 2.7840873414767377e-07, "loss": 2.3712, "step": 7489 }, { "epoch": 0.9, "learning_rate": 2.7774852609743887e-07, "loss": 2.5892, "step": 7490 }, { "epoch": 0.9, "learning_rate": 2.770890794091502e-07, "loss": 2.5274, "step": 7491 }, { "epoch": 0.9, "learning_rate": 2.7643039418912996e-07, "loss": 2.453, "step": 7492 }, { "epoch": 0.9, "learning_rate": 2.757724705435777e-07, "loss": 2.416, "step": 7493 }, { "epoch": 0.9, "learning_rate": 2.7511530857856794e-07, "loss": 2.4695, "step": 7494 }, { "epoch": 0.9, "learning_rate": 2.744589084000565e-07, "loss": 2.4957, "step": 7495 }, { "epoch": 0.9, "learning_rate": 2.7380327011387096e-07, "loss": 2.4016, "step": 7496 }, { "epoch": 0.9, "learning_rate": 2.7314839382572067e-07, "loss": 2.5278, "step": 7497 }, { "epoch": 0.9, "learning_rate": 2.7249427964119e-07, "loss": 2.6148, "step": 7498 }, { "epoch": 0.9, "learning_rate": 2.718409276657408e-07, "loss": 2.5561, "step": 7499 }, { "epoch": 0.9, "learning_rate": 2.711883380047131e-07, "loss": 2.4227, "step": 7500 }, { "epoch": 0.9, "learning_rate": 2.705365107633212e-07, "loss": 2.4384, "step": 7501 }, { "epoch": 0.9, "learning_rate": 2.698854460466599e-07, "loss": 2.4844, "step": 7502 }, { "epoch": 0.9, "learning_rate": 2.692351439596985e-07, "loss": 2.6736, "step": 7503 }, { "epoch": 0.9, "learning_rate": 2.6858560460728433e-07, "loss": 2.4976, "step": 7504 }, { "epoch": 0.9, "learning_rate": 2.6793682809414245e-07, "loss": 2.6499, "step": 7505 }, { "epoch": 0.9, "learning_rate": 2.672888145248731e-07, "loss": 2.4516, "step": 7506 }, { "epoch": 0.9, "learning_rate": 2.6664156400395545e-07, "loss": 2.5231, "step": 7507 }, { "epoch": 0.9, "learning_rate": 2.6599507663574387e-07, "loss": 2.6003, "step": 7508 }, { "epoch": 0.9, "learning_rate": 2.653493525244721e-07, "loss": 2.4628, "step": 7509 }, { "epoch": 0.9, "learning_rate": 2.6470439177424754e-07, "loss": 2.5134, "step": 7510 }, { "epoch": 0.9, "learning_rate": 2.640601944890575e-07, "loss": 2.532, "step": 7511 }, { "epoch": 0.9, "learning_rate": 2.634167607727656e-07, "loss": 2.5282, "step": 7512 }, { "epoch": 0.9, "learning_rate": 2.6277409072910984e-07, "loss": 2.5174, "step": 7513 }, { "epoch": 0.9, "learning_rate": 2.621321844617092e-07, "loss": 2.4503, "step": 7514 }, { "epoch": 0.9, "learning_rate": 2.6149104207405515e-07, "loss": 2.5001, "step": 7515 }, { "epoch": 0.9, "learning_rate": 2.6085066366951907e-07, "loss": 2.5748, "step": 7516 }, { "epoch": 0.9, "learning_rate": 2.6021104935134934e-07, "loss": 2.4817, "step": 7517 }, { "epoch": 0.9, "learning_rate": 2.5957219922266794e-07, "loss": 2.5297, "step": 7518 }, { "epoch": 0.9, "learning_rate": 2.5893411338647757e-07, "loss": 2.4065, "step": 7519 }, { "epoch": 0.9, "learning_rate": 2.582967919456547e-07, "loss": 2.3784, "step": 7520 }, { "epoch": 0.9, "learning_rate": 2.5766023500295503e-07, "loss": 2.6452, "step": 7521 }, { "epoch": 0.9, "learning_rate": 2.5702444266100913e-07, "loss": 2.5534, "step": 7522 }, { "epoch": 0.9, "learning_rate": 2.5638941502232395e-07, "loss": 2.6655, "step": 7523 }, { "epoch": 0.9, "learning_rate": 2.557551521892859e-07, "loss": 2.4299, "step": 7524 }, { "epoch": 0.9, "learning_rate": 2.5512165426415494e-07, "loss": 2.5942, "step": 7525 }, { "epoch": 0.9, "learning_rate": 2.544889213490698e-07, "loss": 2.5404, "step": 7526 }, { "epoch": 0.9, "learning_rate": 2.53856953546045e-07, "loss": 2.5293, "step": 7527 }, { "epoch": 0.9, "learning_rate": 2.5322575095697077e-07, "loss": 2.4715, "step": 7528 }, { "epoch": 0.9, "learning_rate": 2.525953136836168e-07, "loss": 2.6186, "step": 7529 }, { "epoch": 0.9, "learning_rate": 2.5196564182762506e-07, "loss": 2.6049, "step": 7530 }, { "epoch": 0.9, "learning_rate": 2.5133673549051994e-07, "loss": 2.5306, "step": 7531 }, { "epoch": 0.9, "learning_rate": 2.5070859477369645e-07, "loss": 2.4617, "step": 7532 }, { "epoch": 0.9, "learning_rate": 2.500812197784297e-07, "loss": 2.4174, "step": 7533 }, { "epoch": 0.91, "learning_rate": 2.494546106058715e-07, "loss": 2.4929, "step": 7534 }, { "epoch": 0.91, "learning_rate": 2.4882876735704775e-07, "loss": 2.5337, "step": 7535 }, { "epoch": 0.91, "learning_rate": 2.4820369013286326e-07, "loss": 2.4312, "step": 7536 }, { "epoch": 0.91, "learning_rate": 2.475793790340969e-07, "loss": 2.4037, "step": 7537 }, { "epoch": 0.91, "learning_rate": 2.46955834161407e-07, "loss": 2.6468, "step": 7538 }, { "epoch": 0.91, "learning_rate": 2.463330556153265e-07, "loss": 2.4074, "step": 7539 }, { "epoch": 0.91, "learning_rate": 2.457110434962645e-07, "loss": 2.3817, "step": 7540 }, { "epoch": 0.91, "learning_rate": 2.450897979045069e-07, "loss": 2.5595, "step": 7541 }, { "epoch": 0.91, "learning_rate": 2.444693189402175e-07, "loss": 2.5788, "step": 7542 }, { "epoch": 0.91, "learning_rate": 2.4384960670343514e-07, "loss": 2.538, "step": 7543 }, { "epoch": 0.91, "learning_rate": 2.432306612940738e-07, "loss": 2.4828, "step": 7544 }, { "epoch": 0.91, "learning_rate": 2.4261248281192584e-07, "loss": 2.3047, "step": 7545 }, { "epoch": 0.91, "learning_rate": 2.4199507135666046e-07, "loss": 2.5859, "step": 7546 }, { "epoch": 0.91, "learning_rate": 2.4137842702782023e-07, "loss": 2.4836, "step": 7547 }, { "epoch": 0.91, "learning_rate": 2.407625499248273e-07, "loss": 2.6588, "step": 7548 }, { "epoch": 0.91, "learning_rate": 2.4014744014697723e-07, "loss": 2.6479, "step": 7549 }, { "epoch": 0.91, "learning_rate": 2.39533097793444e-07, "loss": 2.4312, "step": 7550 }, { "epoch": 0.91, "learning_rate": 2.3891952296327846e-07, "loss": 2.4688, "step": 7551 }, { "epoch": 0.91, "learning_rate": 2.3830671575540308e-07, "loss": 2.5428, "step": 7552 }, { "epoch": 0.91, "learning_rate": 2.3769467626862385e-07, "loss": 2.5049, "step": 7553 }, { "epoch": 0.91, "learning_rate": 2.3708340460161628e-07, "loss": 2.5956, "step": 7554 }, { "epoch": 0.91, "learning_rate": 2.3647290085293707e-07, "loss": 2.5924, "step": 7555 }, { "epoch": 0.91, "learning_rate": 2.3586316512101416e-07, "loss": 2.6818, "step": 7556 }, { "epoch": 0.91, "learning_rate": 2.3525419750415612e-07, "loss": 2.5844, "step": 7557 }, { "epoch": 0.91, "learning_rate": 2.346459981005461e-07, "loss": 2.4585, "step": 7558 }, { "epoch": 0.91, "learning_rate": 2.3403856700824236e-07, "loss": 2.5234, "step": 7559 }, { "epoch": 0.91, "learning_rate": 2.3343190432518092e-07, "loss": 2.4789, "step": 7560 }, { "epoch": 0.91, "learning_rate": 2.3282601014917193e-07, "loss": 2.4733, "step": 7561 }, { "epoch": 0.91, "learning_rate": 2.3222088457790448e-07, "loss": 2.4107, "step": 7562 }, { "epoch": 0.91, "learning_rate": 2.3161652770894048e-07, "loss": 2.3885, "step": 7563 }, { "epoch": 0.91, "learning_rate": 2.3101293963972094e-07, "loss": 2.5325, "step": 7564 }, { "epoch": 0.91, "learning_rate": 2.3041012046756128e-07, "loss": 2.615, "step": 7565 }, { "epoch": 0.91, "learning_rate": 2.2980807028965213e-07, "loss": 2.5826, "step": 7566 }, { "epoch": 0.91, "learning_rate": 2.2920678920306304e-07, "loss": 2.4776, "step": 7567 }, { "epoch": 0.91, "learning_rate": 2.286062773047354e-07, "loss": 2.556, "step": 7568 }, { "epoch": 0.91, "learning_rate": 2.2800653469149058e-07, "loss": 2.4157, "step": 7569 }, { "epoch": 0.91, "learning_rate": 2.2740756146002409e-07, "loss": 2.5058, "step": 7570 }, { "epoch": 0.91, "learning_rate": 2.2680935770690694e-07, "loss": 2.5982, "step": 7571 }, { "epoch": 0.91, "learning_rate": 2.2621192352858702e-07, "loss": 2.4008, "step": 7572 }, { "epoch": 0.91, "learning_rate": 2.2561525902138725e-07, "loss": 2.3623, "step": 7573 }, { "epoch": 0.91, "learning_rate": 2.2501936428150794e-07, "loss": 2.4943, "step": 7574 }, { "epoch": 0.91, "learning_rate": 2.2442423940502333e-07, "loss": 2.2234, "step": 7575 }, { "epoch": 0.91, "learning_rate": 2.2382988448788557e-07, "loss": 2.4438, "step": 7576 }, { "epoch": 0.91, "learning_rate": 2.232362996259213e-07, "loss": 2.5758, "step": 7577 }, { "epoch": 0.91, "learning_rate": 2.226434849148329e-07, "loss": 2.6327, "step": 7578 }, { "epoch": 0.91, "learning_rate": 2.2205144045019943e-07, "loss": 2.6428, "step": 7579 }, { "epoch": 0.91, "learning_rate": 2.2146016632747624e-07, "loss": 2.504, "step": 7580 }, { "epoch": 0.91, "learning_rate": 2.2086966264199206e-07, "loss": 2.5781, "step": 7581 }, { "epoch": 0.91, "learning_rate": 2.202799294889546e-07, "loss": 2.4054, "step": 7582 }, { "epoch": 0.91, "learning_rate": 2.196909669634434e-07, "loss": 2.6063, "step": 7583 }, { "epoch": 0.91, "learning_rate": 2.19102775160418e-07, "loss": 2.5317, "step": 7584 }, { "epoch": 0.91, "learning_rate": 2.1851535417471093e-07, "loss": 2.6552, "step": 7585 }, { "epoch": 0.91, "learning_rate": 2.1792870410103195e-07, "loss": 2.58, "step": 7586 }, { "epoch": 0.91, "learning_rate": 2.1734282503396543e-07, "loss": 2.5128, "step": 7587 }, { "epoch": 0.91, "learning_rate": 2.1675771706797132e-07, "loss": 2.4231, "step": 7588 }, { "epoch": 0.91, "learning_rate": 2.1617338029738698e-07, "loss": 2.6604, "step": 7589 }, { "epoch": 0.91, "learning_rate": 2.155898148164226e-07, "loss": 2.4688, "step": 7590 }, { "epoch": 0.91, "learning_rate": 2.150070207191668e-07, "loss": 2.5273, "step": 7591 }, { "epoch": 0.91, "learning_rate": 2.1442499809958273e-07, "loss": 2.3634, "step": 7592 }, { "epoch": 0.91, "learning_rate": 2.1384374705150813e-07, "loss": 2.5199, "step": 7593 }, { "epoch": 0.91, "learning_rate": 2.13263267668658e-07, "loss": 2.5234, "step": 7594 }, { "epoch": 0.91, "learning_rate": 2.1268356004462198e-07, "loss": 2.5142, "step": 7595 }, { "epoch": 0.91, "learning_rate": 2.1210462427286528e-07, "loss": 2.7263, "step": 7596 }, { "epoch": 0.91, "learning_rate": 2.1152646044672876e-07, "loss": 2.6416, "step": 7597 }, { "epoch": 0.91, "learning_rate": 2.109490686594301e-07, "loss": 2.4821, "step": 7598 }, { "epoch": 0.91, "learning_rate": 2.103724490040604e-07, "loss": 2.5278, "step": 7599 }, { "epoch": 0.91, "learning_rate": 2.097966015735875e-07, "loss": 2.4321, "step": 7600 }, { "epoch": 0.91, "learning_rate": 2.0922152646085492e-07, "loss": 2.4793, "step": 7601 }, { "epoch": 0.91, "learning_rate": 2.0864722375858015e-07, "loss": 2.5183, "step": 7602 }, { "epoch": 0.91, "learning_rate": 2.0807369355935746e-07, "loss": 2.4297, "step": 7603 }, { "epoch": 0.91, "learning_rate": 2.0750093595565735e-07, "loss": 2.4949, "step": 7604 }, { "epoch": 0.91, "learning_rate": 2.069289510398237e-07, "loss": 2.5981, "step": 7605 }, { "epoch": 0.91, "learning_rate": 2.0635773890407718e-07, "loss": 2.5156, "step": 7606 }, { "epoch": 0.91, "learning_rate": 2.0578729964051357e-07, "loss": 2.4259, "step": 7607 }, { "epoch": 0.91, "learning_rate": 2.0521763334110324e-07, "loss": 2.537, "step": 7608 }, { "epoch": 0.91, "learning_rate": 2.0464874009769377e-07, "loss": 2.4241, "step": 7609 }, { "epoch": 0.91, "learning_rate": 2.0408062000200623e-07, "loss": 2.3109, "step": 7610 }, { "epoch": 0.91, "learning_rate": 2.0351327314563907e-07, "loss": 2.4229, "step": 7611 }, { "epoch": 0.91, "learning_rate": 2.0294669962006352e-07, "loss": 2.5782, "step": 7612 }, { "epoch": 0.91, "learning_rate": 2.0238089951662765e-07, "loss": 2.2915, "step": 7613 }, { "epoch": 0.91, "learning_rate": 2.0181587292655512e-07, "loss": 2.5249, "step": 7614 }, { "epoch": 0.91, "learning_rate": 2.0125161994094312e-07, "loss": 2.5208, "step": 7615 }, { "epoch": 0.91, "learning_rate": 2.006881406507677e-07, "loss": 2.6225, "step": 7616 }, { "epoch": 0.92, "learning_rate": 2.0012543514687566e-07, "loss": 2.5495, "step": 7617 }, { "epoch": 0.92, "learning_rate": 1.995635035199922e-07, "loss": 2.5515, "step": 7618 }, { "epoch": 0.92, "learning_rate": 1.9900234586071542e-07, "loss": 2.5095, "step": 7619 }, { "epoch": 0.92, "learning_rate": 1.984419622595224e-07, "loss": 2.6258, "step": 7620 }, { "epoch": 0.92, "learning_rate": 1.9788235280676138e-07, "loss": 2.3513, "step": 7621 }, { "epoch": 0.92, "learning_rate": 1.9732351759265743e-07, "loss": 2.5115, "step": 7622 }, { "epoch": 0.92, "learning_rate": 1.9676545670731128e-07, "loss": 2.4361, "step": 7623 }, { "epoch": 0.92, "learning_rate": 1.9620817024069816e-07, "loss": 2.5774, "step": 7624 }, { "epoch": 0.92, "learning_rate": 1.9565165828266896e-07, "loss": 2.6376, "step": 7625 }, { "epoch": 0.92, "learning_rate": 1.9509592092294805e-07, "loss": 2.5592, "step": 7626 }, { "epoch": 0.92, "learning_rate": 1.9454095825113706e-07, "loss": 2.3954, "step": 7627 }, { "epoch": 0.92, "learning_rate": 1.9398677035671222e-07, "loss": 2.5003, "step": 7628 }, { "epoch": 0.92, "learning_rate": 1.9343335732902313e-07, "loss": 2.5519, "step": 7629 }, { "epoch": 0.92, "learning_rate": 1.9288071925729735e-07, "loss": 2.5303, "step": 7630 }, { "epoch": 0.92, "learning_rate": 1.923288562306347e-07, "loss": 2.4354, "step": 7631 }, { "epoch": 0.92, "learning_rate": 1.9177776833801233e-07, "loss": 2.4906, "step": 7632 }, { "epoch": 0.92, "learning_rate": 1.912274556682814e-07, "loss": 2.5275, "step": 7633 }, { "epoch": 0.92, "learning_rate": 1.9067791831016647e-07, "loss": 2.4508, "step": 7634 }, { "epoch": 0.92, "learning_rate": 1.9012915635227058e-07, "loss": 2.4331, "step": 7635 }, { "epoch": 0.92, "learning_rate": 1.8958116988306852e-07, "loss": 2.5353, "step": 7636 }, { "epoch": 0.92, "learning_rate": 1.8903395899091182e-07, "loss": 2.7129, "step": 7637 }, { "epoch": 0.92, "learning_rate": 1.8848752376402658e-07, "loss": 2.5556, "step": 7638 }, { "epoch": 0.92, "learning_rate": 1.8794186429051397e-07, "loss": 2.4212, "step": 7639 }, { "epoch": 0.92, "learning_rate": 1.8739698065834977e-07, "loss": 2.3587, "step": 7640 }, { "epoch": 0.92, "learning_rate": 1.8685287295538368e-07, "loss": 2.5139, "step": 7641 }, { "epoch": 0.92, "learning_rate": 1.863095412693433e-07, "loss": 2.5936, "step": 7642 }, { "epoch": 0.92, "learning_rate": 1.8576698568782802e-07, "loss": 2.5167, "step": 7643 }, { "epoch": 0.92, "learning_rate": 1.8522520629831396e-07, "loss": 2.4825, "step": 7644 }, { "epoch": 0.92, "learning_rate": 1.8468420318815128e-07, "loss": 2.4161, "step": 7645 }, { "epoch": 0.92, "learning_rate": 1.841439764445646e-07, "loss": 2.4846, "step": 7646 }, { "epoch": 0.92, "learning_rate": 1.8360452615465486e-07, "loss": 2.4969, "step": 7647 }, { "epoch": 0.92, "learning_rate": 1.8306585240539576e-07, "loss": 2.4819, "step": 7648 }, { "epoch": 0.92, "learning_rate": 1.8252795528363732e-07, "loss": 2.4894, "step": 7649 }, { "epoch": 0.92, "learning_rate": 1.8199083487610514e-07, "loss": 2.6562, "step": 7650 }, { "epoch": 0.92, "learning_rate": 1.8145449126939662e-07, "loss": 2.5424, "step": 7651 }, { "epoch": 0.92, "learning_rate": 1.8091892454998595e-07, "loss": 2.4792, "step": 7652 }, { "epoch": 0.92, "learning_rate": 1.803841348042229e-07, "loss": 2.4824, "step": 7653 }, { "epoch": 0.92, "learning_rate": 1.798501221183302e-07, "loss": 2.5073, "step": 7654 }, { "epoch": 0.92, "learning_rate": 1.7931688657840563e-07, "loss": 2.6783, "step": 7655 }, { "epoch": 0.92, "learning_rate": 1.7878442827042264e-07, "loss": 2.5077, "step": 7656 }, { "epoch": 0.92, "learning_rate": 1.7825274728022868e-07, "loss": 2.5522, "step": 7657 }, { "epoch": 0.92, "learning_rate": 1.7772184369354517e-07, "loss": 2.4323, "step": 7658 }, { "epoch": 0.92, "learning_rate": 1.771917175959703e-07, "loss": 2.2891, "step": 7659 }, { "epoch": 0.92, "learning_rate": 1.7666236907297407e-07, "loss": 2.513, "step": 7660 }, { "epoch": 0.92, "learning_rate": 1.7613379820990317e-07, "loss": 2.3849, "step": 7661 }, { "epoch": 0.92, "learning_rate": 1.756060050919789e-07, "loss": 2.4031, "step": 7662 }, { "epoch": 0.92, "learning_rate": 1.7507898980429539e-07, "loss": 2.3924, "step": 7663 }, { "epoch": 0.92, "learning_rate": 1.7455275243182413e-07, "loss": 2.577, "step": 7664 }, { "epoch": 0.92, "learning_rate": 1.7402729305940835e-07, "loss": 2.5801, "step": 7665 }, { "epoch": 0.92, "learning_rate": 1.7350261177176807e-07, "loss": 2.5976, "step": 7666 }, { "epoch": 0.92, "learning_rate": 1.7297870865349564e-07, "loss": 2.6736, "step": 7667 }, { "epoch": 0.92, "learning_rate": 1.7245558378906012e-07, "loss": 2.3839, "step": 7668 }, { "epoch": 0.92, "learning_rate": 1.719332372628052e-07, "loss": 2.5803, "step": 7669 }, { "epoch": 0.92, "learning_rate": 1.714116691589457e-07, "loss": 2.4605, "step": 7670 }, { "epoch": 0.92, "learning_rate": 1.7089087956157546e-07, "loss": 2.5767, "step": 7671 }, { "epoch": 0.92, "learning_rate": 1.7037086855465902e-07, "loss": 2.6585, "step": 7672 }, { "epoch": 0.92, "learning_rate": 1.698516362220376e-07, "loss": 2.3702, "step": 7673 }, { "epoch": 0.92, "learning_rate": 1.6933318264742648e-07, "loss": 2.4733, "step": 7674 }, { "epoch": 0.92, "learning_rate": 1.6881550791441548e-07, "loss": 2.567, "step": 7675 }, { "epoch": 0.92, "learning_rate": 1.682986121064689e-07, "loss": 2.4837, "step": 7676 }, { "epoch": 0.92, "learning_rate": 1.6778249530692348e-07, "loss": 2.4458, "step": 7677 }, { "epoch": 0.92, "learning_rate": 1.672671575989937e-07, "loss": 2.526, "step": 7678 }, { "epoch": 0.92, "learning_rate": 1.667525990657659e-07, "loss": 2.4089, "step": 7679 }, { "epoch": 0.92, "learning_rate": 1.662388197902015e-07, "loss": 2.4471, "step": 7680 }, { "epoch": 0.92, "learning_rate": 1.6572581985513703e-07, "loss": 2.4027, "step": 7681 }, { "epoch": 0.92, "learning_rate": 1.6521359934328185e-07, "loss": 2.4196, "step": 7682 }, { "epoch": 0.92, "learning_rate": 1.6470215833722103e-07, "loss": 2.4775, "step": 7683 }, { "epoch": 0.92, "learning_rate": 1.641914969194147e-07, "loss": 2.5306, "step": 7684 }, { "epoch": 0.92, "learning_rate": 1.6368161517219317e-07, "loss": 2.4456, "step": 7685 }, { "epoch": 0.92, "learning_rate": 1.6317251317776673e-07, "loss": 2.5982, "step": 7686 }, { "epoch": 0.92, "learning_rate": 1.626641910182164e-07, "loss": 2.5303, "step": 7687 }, { "epoch": 0.92, "learning_rate": 1.6215664877549774e-07, "loss": 2.4269, "step": 7688 }, { "epoch": 0.92, "learning_rate": 1.6164988653144086e-07, "loss": 2.4469, "step": 7689 }, { "epoch": 0.92, "learning_rate": 1.6114390436775095e-07, "loss": 2.432, "step": 7690 }, { "epoch": 0.92, "learning_rate": 1.6063870236600777e-07, "loss": 2.4317, "step": 7691 }, { "epoch": 0.92, "learning_rate": 1.6013428060766168e-07, "loss": 2.5498, "step": 7692 }, { "epoch": 0.92, "learning_rate": 1.5963063917404263e-07, "loss": 2.3484, "step": 7693 }, { "epoch": 0.92, "learning_rate": 1.5912777814635018e-07, "loss": 2.389, "step": 7694 }, { "epoch": 0.92, "learning_rate": 1.5862569760565994e-07, "loss": 2.4911, "step": 7695 }, { "epoch": 0.92, "learning_rate": 1.581243976329233e-07, "loss": 2.4631, "step": 7696 }, { "epoch": 0.92, "learning_rate": 1.5762387830896174e-07, "loss": 2.5091, "step": 7697 }, { "epoch": 0.92, "learning_rate": 1.571241397144757e-07, "loss": 2.4213, "step": 7698 }, { "epoch": 0.92, "learning_rate": 1.5662518193003628e-07, "loss": 2.4258, "step": 7699 }, { "epoch": 0.93, "learning_rate": 1.561270050360897e-07, "loss": 2.6934, "step": 7700 }, { "epoch": 0.93, "learning_rate": 1.5562960911295556e-07, "loss": 2.5769, "step": 7701 }, { "epoch": 0.93, "learning_rate": 1.5513299424082973e-07, "loss": 2.464, "step": 7702 }, { "epoch": 0.93, "learning_rate": 1.546371604997804e-07, "loss": 2.5145, "step": 7703 }, { "epoch": 0.93, "learning_rate": 1.541421079697486e-07, "loss": 2.5964, "step": 7704 }, { "epoch": 0.93, "learning_rate": 1.5364783673055328e-07, "loss": 2.5034, "step": 7705 }, { "epoch": 0.93, "learning_rate": 1.5315434686188345e-07, "loss": 2.4922, "step": 7706 }, { "epoch": 0.93, "learning_rate": 1.5266163844330439e-07, "loss": 2.5152, "step": 7707 }, { "epoch": 0.93, "learning_rate": 1.5216971155425474e-07, "loss": 2.562, "step": 7708 }, { "epoch": 0.93, "learning_rate": 1.5167856627404664e-07, "loss": 2.4872, "step": 7709 }, { "epoch": 0.93, "learning_rate": 1.511882026818684e-07, "loss": 2.5838, "step": 7710 }, { "epoch": 0.93, "learning_rate": 1.5069862085677845e-07, "loss": 2.5677, "step": 7711 }, { "epoch": 0.93, "learning_rate": 1.5020982087771362e-07, "loss": 2.5326, "step": 7712 }, { "epoch": 0.93, "learning_rate": 1.497218028234798e-07, "loss": 2.3291, "step": 7713 }, { "epoch": 0.93, "learning_rate": 1.4923456677276183e-07, "loss": 2.5942, "step": 7714 }, { "epoch": 0.93, "learning_rate": 1.4874811280411518e-07, "loss": 2.3984, "step": 7715 }, { "epoch": 0.93, "learning_rate": 1.4826244099596986e-07, "loss": 2.3906, "step": 7716 }, { "epoch": 0.93, "learning_rate": 1.4777755142663054e-07, "loss": 2.5648, "step": 7717 }, { "epoch": 0.93, "learning_rate": 1.472934441742746e-07, "loss": 2.5364, "step": 7718 }, { "epoch": 0.93, "learning_rate": 1.4681011931695466e-07, "loss": 2.6065, "step": 7719 }, { "epoch": 0.93, "learning_rate": 1.4632757693259615e-07, "loss": 2.4225, "step": 7720 }, { "epoch": 0.93, "learning_rate": 1.4584581709899848e-07, "loss": 2.3998, "step": 7721 }, { "epoch": 0.93, "learning_rate": 1.4536483989383676e-07, "loss": 2.5006, "step": 7722 }, { "epoch": 0.93, "learning_rate": 1.4488464539465563e-07, "loss": 2.593, "step": 7723 }, { "epoch": 0.93, "learning_rate": 1.444052336788787e-07, "loss": 2.5751, "step": 7724 }, { "epoch": 0.93, "learning_rate": 1.439266048237986e-07, "loss": 2.6022, "step": 7725 }, { "epoch": 0.93, "learning_rate": 1.4344875890658526e-07, "loss": 2.5078, "step": 7726 }, { "epoch": 0.93, "learning_rate": 1.4297169600428096e-07, "loss": 2.48, "step": 7727 }, { "epoch": 0.93, "learning_rate": 1.424954161938019e-07, "loss": 2.456, "step": 7728 }, { "epoch": 0.93, "learning_rate": 1.420199195519384e-07, "loss": 2.4964, "step": 7729 }, { "epoch": 0.93, "learning_rate": 1.4154520615535185e-07, "loss": 2.4319, "step": 7730 }, { "epoch": 0.93, "learning_rate": 1.4107127608058325e-07, "loss": 2.5435, "step": 7731 }, { "epoch": 0.93, "learning_rate": 1.4059812940404093e-07, "loss": 2.4659, "step": 7732 }, { "epoch": 0.93, "learning_rate": 1.4012576620201057e-07, "loss": 2.584, "step": 7733 }, { "epoch": 0.93, "learning_rate": 1.3965418655065122e-07, "loss": 2.5757, "step": 7734 }, { "epoch": 0.93, "learning_rate": 1.3918339052599372e-07, "loss": 2.6635, "step": 7735 }, { "epoch": 0.93, "learning_rate": 1.3871337820394404e-07, "loss": 2.3891, "step": 7736 }, { "epoch": 0.93, "learning_rate": 1.3824414966028321e-07, "loss": 2.2799, "step": 7737 }, { "epoch": 0.93, "learning_rate": 1.377757049706624e-07, "loss": 2.5217, "step": 7738 }, { "epoch": 0.93, "learning_rate": 1.3730804421061006e-07, "loss": 2.4137, "step": 7739 }, { "epoch": 0.93, "learning_rate": 1.3684116745552423e-07, "loss": 2.4882, "step": 7740 }, { "epoch": 0.93, "learning_rate": 1.3637507478068023e-07, "loss": 2.4651, "step": 7741 }, { "epoch": 0.93, "learning_rate": 1.359097662612252e-07, "loss": 2.4582, "step": 7742 }, { "epoch": 0.93, "learning_rate": 1.3544524197218078e-07, "loss": 2.5012, "step": 7743 }, { "epoch": 0.93, "learning_rate": 1.3498150198844094e-07, "loss": 2.6082, "step": 7744 }, { "epoch": 0.93, "learning_rate": 1.3451854638477367e-07, "loss": 2.5283, "step": 7745 }, { "epoch": 0.93, "learning_rate": 1.340563752358215e-07, "loss": 2.4916, "step": 7746 }, { "epoch": 0.93, "learning_rate": 1.3359498861609866e-07, "loss": 2.4254, "step": 7747 }, { "epoch": 0.93, "learning_rate": 1.33134386599994e-07, "loss": 2.4628, "step": 7748 }, { "epoch": 0.93, "learning_rate": 1.3267456926177091e-07, "loss": 2.5108, "step": 7749 }, { "epoch": 0.93, "learning_rate": 1.3221553667556342e-07, "loss": 2.4836, "step": 7750 }, { "epoch": 0.93, "learning_rate": 1.3175728891538175e-07, "loss": 2.5129, "step": 7751 }, { "epoch": 0.93, "learning_rate": 1.3129982605510738e-07, "loss": 2.5184, "step": 7752 }, { "epoch": 0.93, "learning_rate": 1.3084314816849853e-07, "loss": 2.5712, "step": 7753 }, { "epoch": 0.93, "learning_rate": 1.303872553291824e-07, "loss": 2.3172, "step": 7754 }, { "epoch": 0.93, "learning_rate": 1.2993214761066354e-07, "loss": 2.4905, "step": 7755 }, { "epoch": 0.93, "learning_rate": 1.2947782508631823e-07, "loss": 2.4209, "step": 7756 }, { "epoch": 0.93, "learning_rate": 1.2902428782939514e-07, "loss": 2.574, "step": 7757 }, { "epoch": 0.93, "learning_rate": 1.2857153591301907e-07, "loss": 2.5354, "step": 7758 }, { "epoch": 0.93, "learning_rate": 1.28119569410185e-07, "loss": 2.3728, "step": 7759 }, { "epoch": 0.93, "learning_rate": 1.2766838839376294e-07, "loss": 2.5698, "step": 7760 }, { "epoch": 0.93, "learning_rate": 1.2721799293649807e-07, "loss": 2.4668, "step": 7761 }, { "epoch": 0.93, "learning_rate": 1.267683831110045e-07, "loss": 2.4992, "step": 7762 }, { "epoch": 0.93, "learning_rate": 1.2631955898977366e-07, "loss": 2.3982, "step": 7763 }, { "epoch": 0.93, "learning_rate": 1.2587152064516828e-07, "loss": 2.4879, "step": 7764 }, { "epoch": 0.93, "learning_rate": 1.254242681494261e-07, "loss": 2.5005, "step": 7765 }, { "epoch": 0.93, "learning_rate": 1.24977801574655e-07, "loss": 2.5777, "step": 7766 }, { "epoch": 0.93, "learning_rate": 1.2453212099283962e-07, "loss": 2.487, "step": 7767 }, { "epoch": 0.93, "learning_rate": 1.2408722647583692e-07, "loss": 2.451, "step": 7768 }, { "epoch": 0.93, "learning_rate": 1.2364311809537456e-07, "loss": 2.2638, "step": 7769 }, { "epoch": 0.93, "learning_rate": 1.2319979592305798e-07, "loss": 2.3659, "step": 7770 }, { "epoch": 0.93, "learning_rate": 1.2275726003036114e-07, "loss": 2.5344, "step": 7771 }, { "epoch": 0.93, "learning_rate": 1.2231551048863421e-07, "loss": 2.5267, "step": 7772 }, { "epoch": 0.93, "learning_rate": 1.2187454736910077e-07, "loss": 2.3894, "step": 7773 }, { "epoch": 0.93, "learning_rate": 1.2143437074285503e-07, "loss": 2.6083, "step": 7774 }, { "epoch": 0.93, "learning_rate": 1.2099498068086802e-07, "loss": 2.4971, "step": 7775 }, { "epoch": 0.93, "learning_rate": 1.205563772539803e-07, "loss": 2.4029, "step": 7776 }, { "epoch": 0.93, "learning_rate": 1.201185605329086e-07, "loss": 2.4083, "step": 7777 }, { "epoch": 0.93, "learning_rate": 1.196815305882404e-07, "loss": 2.5014, "step": 7778 }, { "epoch": 0.93, "learning_rate": 1.1924528749043818e-07, "loss": 2.4891, "step": 7779 }, { "epoch": 0.93, "learning_rate": 1.1880983130983626e-07, "loss": 2.3971, "step": 7780 }, { "epoch": 0.93, "learning_rate": 1.183751621166429e-07, "loss": 2.2928, "step": 7781 }, { "epoch": 0.93, "learning_rate": 1.1794127998093929e-07, "loss": 2.5015, "step": 7782 }, { "epoch": 0.94, "learning_rate": 1.1750818497267946e-07, "loss": 2.3475, "step": 7783 }, { "epoch": 0.94, "learning_rate": 1.1707587716169033e-07, "loss": 2.505, "step": 7784 }, { "epoch": 0.94, "learning_rate": 1.1664435661767281e-07, "loss": 2.431, "step": 7785 }, { "epoch": 0.94, "learning_rate": 1.1621362341020014e-07, "loss": 2.5514, "step": 7786 }, { "epoch": 0.94, "learning_rate": 1.1578367760871956e-07, "loss": 2.4214, "step": 7787 }, { "epoch": 0.94, "learning_rate": 1.1535451928254948e-07, "loss": 2.3808, "step": 7788 }, { "epoch": 0.94, "learning_rate": 1.149261485008829e-07, "loss": 2.5442, "step": 7789 }, { "epoch": 0.94, "learning_rate": 1.1449856533278624e-07, "loss": 2.5828, "step": 7790 }, { "epoch": 0.94, "learning_rate": 1.1407176984719658e-07, "loss": 2.435, "step": 7791 }, { "epoch": 0.94, "learning_rate": 1.1364576211292722e-07, "loss": 2.3238, "step": 7792 }, { "epoch": 0.94, "learning_rate": 1.1322054219866096e-07, "loss": 2.4528, "step": 7793 }, { "epoch": 0.94, "learning_rate": 1.1279611017295689e-07, "loss": 2.562, "step": 7794 }, { "epoch": 0.94, "learning_rate": 1.1237246610424579e-07, "loss": 2.4713, "step": 7795 }, { "epoch": 0.94, "learning_rate": 1.1194961006082972e-07, "loss": 2.4013, "step": 7796 }, { "epoch": 0.94, "learning_rate": 1.115275421108858e-07, "loss": 2.3863, "step": 7797 }, { "epoch": 0.94, "learning_rate": 1.1110626232246347e-07, "loss": 2.5661, "step": 7798 }, { "epoch": 0.94, "learning_rate": 1.1068577076348619e-07, "loss": 2.6861, "step": 7799 }, { "epoch": 0.94, "learning_rate": 1.102660675017475e-07, "loss": 2.4688, "step": 7800 }, { "epoch": 0.94, "learning_rate": 1.0984715260491663e-07, "loss": 2.3044, "step": 7801 }, { "epoch": 0.94, "learning_rate": 1.0942902614053453e-07, "loss": 2.5173, "step": 7802 }, { "epoch": 0.94, "learning_rate": 1.0901168817601448e-07, "loss": 2.6059, "step": 7803 }, { "epoch": 0.94, "learning_rate": 1.0859513877864381e-07, "loss": 2.4244, "step": 7804 }, { "epoch": 0.94, "learning_rate": 1.081793780155821e-07, "loss": 2.512, "step": 7805 }, { "epoch": 0.94, "learning_rate": 1.0776440595386184e-07, "loss": 2.4523, "step": 7806 }, { "epoch": 0.94, "learning_rate": 1.0735022266038898e-07, "loss": 2.5974, "step": 7807 }, { "epoch": 0.94, "learning_rate": 1.0693682820194062e-07, "loss": 2.4321, "step": 7808 }, { "epoch": 0.94, "learning_rate": 1.0652422264516848e-07, "loss": 2.5084, "step": 7809 }, { "epoch": 0.94, "learning_rate": 1.0611240605659601e-07, "loss": 2.4907, "step": 7810 }, { "epoch": 0.94, "learning_rate": 1.0570137850262064e-07, "loss": 2.4921, "step": 7811 }, { "epoch": 0.94, "learning_rate": 1.0529114004951047e-07, "loss": 2.7171, "step": 7812 }, { "epoch": 0.94, "learning_rate": 1.048816907634087e-07, "loss": 2.4455, "step": 7813 }, { "epoch": 0.94, "learning_rate": 1.0447303071032977e-07, "loss": 2.5449, "step": 7814 }, { "epoch": 0.94, "learning_rate": 1.0406515995616152e-07, "loss": 2.5396, "step": 7815 }, { "epoch": 0.94, "learning_rate": 1.0365807856666465e-07, "loss": 2.3989, "step": 7816 }, { "epoch": 0.94, "learning_rate": 1.0325178660747171e-07, "loss": 2.5713, "step": 7817 }, { "epoch": 0.94, "learning_rate": 1.028462841440886e-07, "loss": 2.541, "step": 7818 }, { "epoch": 0.94, "learning_rate": 1.024415712418947e-07, "loss": 2.5355, "step": 7819 }, { "epoch": 0.94, "learning_rate": 1.0203764796614057e-07, "loss": 2.3239, "step": 7820 }, { "epoch": 0.94, "learning_rate": 1.0163451438195083e-07, "loss": 2.4575, "step": 7821 }, { "epoch": 0.94, "learning_rate": 1.0123217055432121e-07, "loss": 2.493, "step": 7822 }, { "epoch": 0.94, "learning_rate": 1.0083061654812154e-07, "loss": 2.617, "step": 7823 }, { "epoch": 0.94, "learning_rate": 1.0042985242809389e-07, "loss": 2.6842, "step": 7824 }, { "epoch": 0.94, "learning_rate": 1.0002987825885324e-07, "loss": 2.339, "step": 7825 }, { "epoch": 0.94, "learning_rate": 9.963069410488635e-08, "loss": 2.532, "step": 7826 }, { "epoch": 0.94, "learning_rate": 9.923230003055284e-08, "loss": 2.4053, "step": 7827 }, { "epoch": 0.94, "learning_rate": 9.883469610008578e-08, "loss": 2.5451, "step": 7828 }, { "epoch": 0.94, "learning_rate": 9.843788237759e-08, "loss": 2.4263, "step": 7829 }, { "epoch": 0.94, "learning_rate": 9.804185892704376e-08, "loss": 2.5106, "step": 7830 }, { "epoch": 0.94, "learning_rate": 9.7646625812296e-08, "loss": 2.4816, "step": 7831 }, { "epoch": 0.94, "learning_rate": 9.725218309707129e-08, "loss": 2.6836, "step": 7832 }, { "epoch": 0.94, "learning_rate": 9.685853084496433e-08, "loss": 2.4785, "step": 7833 }, { "epoch": 0.94, "learning_rate": 9.646566911944266e-08, "loss": 2.4941, "step": 7834 }, { "epoch": 0.94, "learning_rate": 9.607359798384785e-08, "loss": 2.4946, "step": 7835 }, { "epoch": 0.94, "learning_rate": 9.568231750139212e-08, "loss": 2.6624, "step": 7836 }, { "epoch": 0.94, "learning_rate": 9.52918277351611e-08, "loss": 2.4036, "step": 7837 }, { "epoch": 0.94, "learning_rate": 9.490212874811388e-08, "loss": 2.4882, "step": 7838 }, { "epoch": 0.94, "learning_rate": 9.451322060307966e-08, "loss": 2.639, "step": 7839 }, { "epoch": 0.94, "learning_rate": 9.412510336276214e-08, "loss": 2.5369, "step": 7840 }, { "epoch": 0.94, "learning_rate": 9.373777708973741e-08, "loss": 2.6328, "step": 7841 }, { "epoch": 0.94, "learning_rate": 9.335124184645272e-08, "loss": 2.4092, "step": 7842 }, { "epoch": 0.94, "learning_rate": 9.296549769522933e-08, "loss": 2.5696, "step": 7843 }, { "epoch": 0.94, "learning_rate": 9.258054469825972e-08, "loss": 2.5333, "step": 7844 }, { "epoch": 0.94, "learning_rate": 9.219638291761035e-08, "loss": 2.5723, "step": 7845 }, { "epoch": 0.94, "learning_rate": 9.181301241521723e-08, "loss": 2.3422, "step": 7846 }, { "epoch": 0.94, "learning_rate": 9.143043325289202e-08, "loss": 2.4904, "step": 7847 }, { "epoch": 0.94, "learning_rate": 9.104864549231706e-08, "loss": 2.5112, "step": 7848 }, { "epoch": 0.94, "learning_rate": 9.066764919504756e-08, "loss": 2.5179, "step": 7849 }, { "epoch": 0.94, "learning_rate": 9.028744442251103e-08, "loss": 2.4185, "step": 7850 }, { "epoch": 0.94, "learning_rate": 8.990803123600677e-08, "loss": 2.6487, "step": 7851 }, { "epoch": 0.94, "learning_rate": 8.952940969670809e-08, "loss": 2.6766, "step": 7852 }, { "epoch": 0.94, "learning_rate": 8.915157986565837e-08, "loss": 2.4392, "step": 7853 }, { "epoch": 0.94, "learning_rate": 8.877454180377553e-08, "loss": 2.4316, "step": 7854 }, { "epoch": 0.94, "learning_rate": 8.839829557184876e-08, "loss": 2.4406, "step": 7855 }, { "epoch": 0.94, "learning_rate": 8.802284123053894e-08, "loss": 2.5106, "step": 7856 }, { "epoch": 0.94, "learning_rate": 8.764817884038157e-08, "loss": 2.4984, "step": 7857 }, { "epoch": 0.94, "learning_rate": 8.727430846178109e-08, "loss": 2.5036, "step": 7858 }, { "epoch": 0.94, "learning_rate": 8.690123015501705e-08, "loss": 2.5099, "step": 7859 }, { "epoch": 0.94, "learning_rate": 8.652894398024137e-08, "loss": 2.5362, "step": 7860 }, { "epoch": 0.94, "learning_rate": 8.615744999747489e-08, "loss": 2.6241, "step": 7861 }, { "epoch": 0.94, "learning_rate": 8.578674826661527e-08, "loss": 2.3797, "step": 7862 }, { "epoch": 0.94, "learning_rate": 8.541683884742802e-08, "loss": 2.5823, "step": 7863 }, { "epoch": 0.94, "learning_rate": 8.504772179955546e-08, "loss": 2.1053, "step": 7864 }, { "epoch": 0.94, "learning_rate": 8.467939718250828e-08, "loss": 2.5822, "step": 7865 }, { "epoch": 0.94, "learning_rate": 8.431186505567179e-08, "loss": 2.4693, "step": 7866 }, { "epoch": 0.95, "learning_rate": 8.394512547830191e-08, "loss": 2.251, "step": 7867 }, { "epoch": 0.95, "learning_rate": 8.357917850952802e-08, "loss": 2.6286, "step": 7868 }, { "epoch": 0.95, "learning_rate": 8.321402420835123e-08, "loss": 2.5579, "step": 7869 }, { "epoch": 0.95, "learning_rate": 8.284966263364447e-08, "loss": 2.4881, "step": 7870 }, { "epoch": 0.95, "learning_rate": 8.248609384415352e-08, "loss": 2.4689, "step": 7871 }, { "epoch": 0.95, "learning_rate": 8.212331789849648e-08, "loss": 2.6223, "step": 7872 }, { "epoch": 0.95, "learning_rate": 8.176133485516213e-08, "loss": 2.5208, "step": 7873 }, { "epoch": 0.95, "learning_rate": 8.140014477251379e-08, "loss": 2.5481, "step": 7874 }, { "epoch": 0.95, "learning_rate": 8.10397477087843e-08, "loss": 2.4135, "step": 7875 }, { "epoch": 0.95, "learning_rate": 8.06801437220811e-08, "loss": 2.49, "step": 7876 }, { "epoch": 0.95, "learning_rate": 8.032133287038224e-08, "loss": 2.3021, "step": 7877 }, { "epoch": 0.95, "learning_rate": 7.99633152115381e-08, "loss": 2.6466, "step": 7878 }, { "epoch": 0.95, "learning_rate": 7.960609080327141e-08, "loss": 2.5567, "step": 7879 }, { "epoch": 0.95, "learning_rate": 7.924965970317722e-08, "loss": 2.4246, "step": 7880 }, { "epoch": 0.95, "learning_rate": 7.889402196872231e-08, "loss": 2.7354, "step": 7881 }, { "epoch": 0.95, "learning_rate": 7.853917765724528e-08, "loss": 2.7613, "step": 7882 }, { "epoch": 0.95, "learning_rate": 7.818512682595702e-08, "loss": 2.548, "step": 7883 }, { "epoch": 0.95, "learning_rate": 7.783186953194189e-08, "loss": 2.4719, "step": 7884 }, { "epoch": 0.95, "learning_rate": 7.74794058321543e-08, "loss": 2.4591, "step": 7885 }, { "epoch": 0.95, "learning_rate": 7.712773578342047e-08, "loss": 2.5747, "step": 7886 }, { "epoch": 0.95, "learning_rate": 7.677685944244118e-08, "loss": 2.5344, "step": 7887 }, { "epoch": 0.95, "learning_rate": 7.642677686578726e-08, "loss": 2.4681, "step": 7888 }, { "epoch": 0.95, "learning_rate": 7.607748810990246e-08, "loss": 2.4397, "step": 7889 }, { "epoch": 0.95, "learning_rate": 7.572899323110116e-08, "loss": 2.3186, "step": 7890 }, { "epoch": 0.95, "learning_rate": 7.538129228557123e-08, "loss": 2.5402, "step": 7891 }, { "epoch": 0.95, "learning_rate": 7.503438532937169e-08, "loss": 2.6091, "step": 7892 }, { "epoch": 0.95, "learning_rate": 7.46882724184339e-08, "loss": 2.5396, "step": 7893 }, { "epoch": 0.95, "learning_rate": 7.434295360856214e-08, "loss": 2.4622, "step": 7894 }, { "epoch": 0.95, "learning_rate": 7.399842895543019e-08, "loss": 2.6297, "step": 7895 }, { "epoch": 0.95, "learning_rate": 7.36546985145864e-08, "loss": 2.7383, "step": 7896 }, { "epoch": 0.95, "learning_rate": 7.331176234144921e-08, "loss": 2.4209, "step": 7897 }, { "epoch": 0.95, "learning_rate": 7.296962049131051e-08, "loss": 2.5079, "step": 7898 }, { "epoch": 0.95, "learning_rate": 7.262827301933229e-08, "loss": 2.4959, "step": 7899 }, { "epoch": 0.95, "learning_rate": 7.228771998054995e-08, "loss": 2.5505, "step": 7900 }, { "epoch": 0.95, "learning_rate": 7.194796142987127e-08, "loss": 2.465, "step": 7901 }, { "epoch": 0.95, "learning_rate": 7.160899742207406e-08, "loss": 2.5698, "step": 7902 }, { "epoch": 0.95, "learning_rate": 7.127082801180907e-08, "loss": 2.4795, "step": 7903 }, { "epoch": 0.95, "learning_rate": 7.093345325359935e-08, "loss": 2.4868, "step": 7904 }, { "epoch": 0.95, "learning_rate": 7.059687320183862e-08, "loss": 2.4002, "step": 7905 }, { "epoch": 0.95, "learning_rate": 7.0261087910794e-08, "loss": 2.6033, "step": 7906 }, { "epoch": 0.95, "learning_rate": 6.992609743460332e-08, "loss": 2.5269, "step": 7907 }, { "epoch": 0.95, "learning_rate": 6.959190182727616e-08, "loss": 2.5741, "step": 7908 }, { "epoch": 0.95, "learning_rate": 6.925850114269494e-08, "loss": 2.505, "step": 7909 }, { "epoch": 0.95, "learning_rate": 6.892589543461392e-08, "loss": 2.5686, "step": 7910 }, { "epoch": 0.95, "learning_rate": 6.859408475665796e-08, "loss": 2.5264, "step": 7911 }, { "epoch": 0.95, "learning_rate": 6.826306916232428e-08, "loss": 2.6221, "step": 7912 }, { "epoch": 0.95, "learning_rate": 6.79328487049824e-08, "loss": 2.4873, "step": 7913 }, { "epoch": 0.95, "learning_rate": 6.760342343787307e-08, "loss": 2.3416, "step": 7914 }, { "epoch": 0.95, "learning_rate": 6.727479341410937e-08, "loss": 2.4067, "step": 7915 }, { "epoch": 0.95, "learning_rate": 6.694695868667556e-08, "loss": 2.641, "step": 7916 }, { "epoch": 0.95, "learning_rate": 6.661991930842826e-08, "loss": 2.4694, "step": 7917 }, { "epoch": 0.95, "learning_rate": 6.629367533209529e-08, "loss": 2.5393, "step": 7918 }, { "epoch": 0.95, "learning_rate": 6.596822681027626e-08, "loss": 2.5646, "step": 7919 }, { "epoch": 0.95, "learning_rate": 6.564357379544361e-08, "loss": 2.4901, "step": 7920 }, { "epoch": 0.95, "learning_rate": 6.531971633993994e-08, "loss": 2.4935, "step": 7921 }, { "epoch": 0.95, "learning_rate": 6.49966544959807e-08, "loss": 2.37, "step": 7922 }, { "epoch": 0.95, "learning_rate": 6.467438831565254e-08, "loss": 2.5289, "step": 7923 }, { "epoch": 0.95, "learning_rate": 6.43529178509139e-08, "loss": 2.4308, "step": 7924 }, { "epoch": 0.95, "learning_rate": 6.403224315359558e-08, "loss": 2.5588, "step": 7925 }, { "epoch": 0.95, "learning_rate": 6.371236427539895e-08, "loss": 2.4023, "step": 7926 }, { "epoch": 0.95, "learning_rate": 6.339328126789778e-08, "loss": 2.4589, "step": 7927 }, { "epoch": 0.95, "learning_rate": 6.307499418253705e-08, "loss": 2.542, "step": 7928 }, { "epoch": 0.95, "learning_rate": 6.2757503070634e-08, "loss": 2.5726, "step": 7929 }, { "epoch": 0.95, "learning_rate": 6.244080798337715e-08, "loss": 2.5009, "step": 7930 }, { "epoch": 0.95, "learning_rate": 6.212490897182732e-08, "loss": 2.3909, "step": 7931 }, { "epoch": 0.95, "learning_rate": 6.180980608691656e-08, "loss": 2.5154, "step": 7932 }, { "epoch": 0.95, "learning_rate": 6.149549937944698e-08, "loss": 2.4099, "step": 7933 }, { "epoch": 0.95, "learning_rate": 6.118198890009586e-08, "loss": 2.5711, "step": 7934 }, { "epoch": 0.95, "learning_rate": 6.086927469940829e-08, "loss": 2.4319, "step": 7935 }, { "epoch": 0.95, "learning_rate": 6.055735682780395e-08, "loss": 2.5646, "step": 7936 }, { "epoch": 0.95, "learning_rate": 6.024623533557206e-08, "loss": 2.3425, "step": 7937 }, { "epoch": 0.95, "learning_rate": 5.993591027287471e-08, "loss": 2.4871, "step": 7938 }, { "epoch": 0.95, "learning_rate": 5.962638168974522e-08, "loss": 2.4894, "step": 7939 }, { "epoch": 0.95, "learning_rate": 5.9317649636088656e-08, "loss": 2.4981, "step": 7940 }, { "epoch": 0.95, "learning_rate": 5.9009714161680774e-08, "loss": 2.6045, "step": 7941 }, { "epoch": 0.95, "learning_rate": 5.870257531617019e-08, "loss": 2.5136, "step": 7942 }, { "epoch": 0.95, "learning_rate": 5.8396233149076165e-08, "loss": 2.4809, "step": 7943 }, { "epoch": 0.95, "learning_rate": 5.809068770979032e-08, "loss": 2.4325, "step": 7944 }, { "epoch": 0.95, "learning_rate": 5.778593904757435e-08, "loss": 2.5616, "step": 7945 }, { "epoch": 0.95, "learning_rate": 5.748198721156284e-08, "loss": 2.4539, "step": 7946 }, { "epoch": 0.95, "learning_rate": 5.717883225076215e-08, "loss": 2.5822, "step": 7947 }, { "epoch": 0.95, "learning_rate": 5.687647421404874e-08, "loss": 2.4633, "step": 7948 }, { "epoch": 0.95, "learning_rate": 5.657491315017194e-08, "loss": 2.5609, "step": 7949 }, { "epoch": 0.96, "learning_rate": 5.627414910775175e-08, "loss": 2.594, "step": 7950 }, { "epoch": 0.96, "learning_rate": 5.597418213527939e-08, "loss": 2.3858, "step": 7951 }, { "epoch": 0.96, "learning_rate": 5.5675012281119486e-08, "loss": 2.4699, "step": 7952 }, { "epoch": 0.96, "learning_rate": 5.537663959350514e-08, "loss": 2.3078, "step": 7953 }, { "epoch": 0.96, "learning_rate": 5.507906412054398e-08, "loss": 2.553, "step": 7954 }, { "epoch": 0.96, "learning_rate": 5.478228591021262e-08, "loss": 2.5887, "step": 7955 }, { "epoch": 0.96, "learning_rate": 5.4486305010361116e-08, "loss": 2.4975, "step": 7956 }, { "epoch": 0.96, "learning_rate": 5.419112146870964e-08, "loss": 2.4709, "step": 7957 }, { "epoch": 0.96, "learning_rate": 5.389673533284956e-08, "loss": 2.5744, "step": 7958 }, { "epoch": 0.96, "learning_rate": 5.360314665024513e-08, "loss": 2.3592, "step": 7959 }, { "epoch": 0.96, "learning_rate": 5.3310355468231266e-08, "loss": 2.5321, "step": 7960 }, { "epoch": 0.96, "learning_rate": 5.3018361834014095e-08, "loss": 2.4584, "step": 7961 }, { "epoch": 0.96, "learning_rate": 5.272716579467097e-08, "loss": 2.5314, "step": 7962 }, { "epoch": 0.96, "learning_rate": 5.243676739715153e-08, "loss": 2.4053, "step": 7963 }, { "epoch": 0.96, "learning_rate": 5.214716668827558e-08, "loss": 2.6091, "step": 7964 }, { "epoch": 0.96, "learning_rate": 5.1858363714736294e-08, "loss": 2.4558, "step": 7965 }, { "epoch": 0.96, "learning_rate": 5.157035852309589e-08, "loss": 2.3415, "step": 7966 }, { "epoch": 0.96, "learning_rate": 5.128315115978943e-08, "loss": 2.5186, "step": 7967 }, { "epoch": 0.96, "learning_rate": 5.0996741671123226e-08, "loss": 2.4359, "step": 7968 }, { "epoch": 0.96, "learning_rate": 5.071113010327366e-08, "loss": 2.5279, "step": 7969 }, { "epoch": 0.96, "learning_rate": 5.042631650229057e-08, "loss": 2.4521, "step": 7970 }, { "epoch": 0.96, "learning_rate": 5.014230091409389e-08, "loss": 2.6516, "step": 7971 }, { "epoch": 0.96, "learning_rate": 4.985908338447476e-08, "loss": 2.2857, "step": 7972 }, { "epoch": 0.96, "learning_rate": 4.9576663959096104e-08, "loss": 2.5611, "step": 7973 }, { "epoch": 0.96, "learning_rate": 4.929504268349095e-08, "loss": 2.4419, "step": 7974 }, { "epoch": 0.96, "learning_rate": 4.901421960306685e-08, "loss": 2.45, "step": 7975 }, { "epoch": 0.96, "learning_rate": 4.8734194763098706e-08, "loss": 2.5355, "step": 7976 }, { "epoch": 0.96, "learning_rate": 4.845496820873541e-08, "loss": 2.4989, "step": 7977 }, { "epoch": 0.96, "learning_rate": 4.817653998499594e-08, "loss": 2.5958, "step": 7978 }, { "epoch": 0.96, "learning_rate": 4.7898910136770505e-08, "loss": 2.4397, "step": 7979 }, { "epoch": 0.96, "learning_rate": 4.7622078708822184e-08, "loss": 2.4935, "step": 7980 }, { "epoch": 0.96, "learning_rate": 4.734604574578305e-08, "loss": 2.4365, "step": 7981 }, { "epoch": 0.96, "learning_rate": 4.7070811292157513e-08, "loss": 2.6389, "step": 7982 }, { "epoch": 0.96, "learning_rate": 4.6796375392321734e-08, "loss": 2.5946, "step": 7983 }, { "epoch": 0.96, "learning_rate": 4.6522738090522545e-08, "loss": 2.5094, "step": 7984 }, { "epoch": 0.96, "learning_rate": 4.624989943087799e-08, "loss": 2.6543, "step": 7985 }, { "epoch": 0.96, "learning_rate": 4.597785945737732e-08, "loss": 2.5055, "step": 7986 }, { "epoch": 0.96, "learning_rate": 4.5706618213881005e-08, "loss": 2.4786, "step": 7987 }, { "epoch": 0.96, "learning_rate": 4.543617574412185e-08, "loss": 2.6198, "step": 7988 }, { "epoch": 0.96, "learning_rate": 4.516653209170163e-08, "loss": 2.4092, "step": 7989 }, { "epoch": 0.96, "learning_rate": 4.489768730009558e-08, "loss": 2.5965, "step": 7990 }, { "epoch": 0.96, "learning_rate": 4.462964141264847e-08, "loss": 2.4933, "step": 7991 }, { "epoch": 0.96, "learning_rate": 4.43623944725774e-08, "loss": 2.5014, "step": 7992 }, { "epoch": 0.96, "learning_rate": 4.4095946522970664e-08, "loss": 2.445, "step": 7993 }, { "epoch": 0.96, "learning_rate": 4.383029760678614e-08, "loss": 2.4396, "step": 7994 }, { "epoch": 0.96, "learning_rate": 4.356544776685456e-08, "loss": 2.7581, "step": 7995 }, { "epoch": 0.96, "learning_rate": 4.330139704587788e-08, "loss": 2.6582, "step": 7996 }, { "epoch": 0.96, "learning_rate": 4.30381454864276e-08, "loss": 2.6077, "step": 7997 }, { "epoch": 0.96, "learning_rate": 4.2775693130948094e-08, "loss": 2.4998, "step": 7998 }, { "epoch": 0.96, "learning_rate": 4.2514040021753856e-08, "loss": 2.5785, "step": 7999 }, { "epoch": 0.96, "learning_rate": 4.2253186201031135e-08, "loss": 2.6848, "step": 8000 }, { "epoch": 0.96, "learning_rate": 4.1993131710836855e-08, "loss": 2.5215, "step": 8001 }, { "epoch": 0.96, "learning_rate": 4.173387659309913e-08, "loss": 2.4724, "step": 8002 }, { "epoch": 0.96, "learning_rate": 4.147542088961787e-08, "loss": 2.4318, "step": 8003 }, { "epoch": 0.96, "learning_rate": 4.1217764642062505e-08, "loss": 2.5185, "step": 8004 }, { "epoch": 0.96, "learning_rate": 4.0960907891975376e-08, "loss": 2.5431, "step": 8005 }, { "epoch": 0.96, "learning_rate": 4.07048506807689e-08, "loss": 2.3466, "step": 8006 }, { "epoch": 0.96, "learning_rate": 4.044959304972673e-08, "loss": 2.4217, "step": 8007 }, { "epoch": 0.96, "learning_rate": 4.019513504000372e-08, "loss": 2.4986, "step": 8008 }, { "epoch": 0.96, "learning_rate": 3.994147669262649e-08, "loss": 2.5625, "step": 8009 }, { "epoch": 0.96, "learning_rate": 3.968861804849067e-08, "loss": 2.5648, "step": 8010 }, { "epoch": 0.96, "learning_rate": 3.9436559148365304e-08, "loss": 2.4397, "step": 8011 }, { "epoch": 0.96, "learning_rate": 3.9185300032889005e-08, "loss": 2.411, "step": 8012 }, { "epoch": 0.96, "learning_rate": 3.8934840742572145e-08, "loss": 2.3682, "step": 8013 }, { "epoch": 0.96, "learning_rate": 3.8685181317796306e-08, "loss": 2.5185, "step": 8014 }, { "epoch": 0.96, "learning_rate": 3.843632179881318e-08, "loss": 2.4517, "step": 8015 }, { "epoch": 0.96, "learning_rate": 3.818826222574568e-08, "loss": 2.5366, "step": 8016 }, { "epoch": 0.96, "learning_rate": 3.7941002638589577e-08, "loss": 2.5976, "step": 8017 }, { "epoch": 0.96, "learning_rate": 3.7694543077208546e-08, "loss": 2.5096, "step": 8018 }, { "epoch": 0.96, "learning_rate": 3.744888358133913e-08, "loss": 2.3945, "step": 8019 }, { "epoch": 0.96, "learning_rate": 3.720402419058966e-08, "loss": 2.5915, "step": 8020 }, { "epoch": 0.96, "learning_rate": 3.695996494443799e-08, "loss": 2.5585, "step": 8021 }, { "epoch": 0.96, "learning_rate": 3.6716705882233194e-08, "loss": 2.5558, "step": 8022 }, { "epoch": 0.96, "learning_rate": 3.647424704319558e-08, "loss": 2.4261, "step": 8023 }, { "epoch": 0.96, "learning_rate": 3.6232588466417195e-08, "loss": 2.5114, "step": 8024 }, { "epoch": 0.96, "learning_rate": 3.5991730190859666e-08, "loss": 2.555, "step": 8025 }, { "epoch": 0.96, "learning_rate": 3.5751672255355806e-08, "loss": 2.5462, "step": 8026 }, { "epoch": 0.96, "learning_rate": 3.551241469861077e-08, "loss": 2.4342, "step": 8027 }, { "epoch": 0.96, "learning_rate": 3.5273957559199265e-08, "loss": 2.3793, "step": 8028 }, { "epoch": 0.96, "learning_rate": 3.50363008755672e-08, "loss": 2.4913, "step": 8029 }, { "epoch": 0.96, "learning_rate": 3.479944468603169e-08, "loss": 2.4706, "step": 8030 }, { "epoch": 0.96, "learning_rate": 3.456338902878109e-08, "loss": 2.4413, "step": 8031 }, { "epoch": 0.96, "learning_rate": 3.4328133941873844e-08, "loss": 2.5269, "step": 8032 }, { "epoch": 0.97, "learning_rate": 3.409367946324071e-08, "loss": 2.726, "step": 8033 }, { "epoch": 0.97, "learning_rate": 3.386002563068147e-08, "loss": 2.4281, "step": 8034 }, { "epoch": 0.97, "learning_rate": 3.362717248186764e-08, "loss": 2.5992, "step": 8035 }, { "epoch": 0.97, "learning_rate": 3.339512005434309e-08, "loss": 2.3747, "step": 8036 }, { "epoch": 0.97, "learning_rate": 3.316386838552011e-08, "loss": 2.5118, "step": 8037 }, { "epoch": 0.97, "learning_rate": 3.293341751268386e-08, "loss": 2.5261, "step": 8038 }, { "epoch": 0.97, "learning_rate": 3.270376747298853e-08, "loss": 2.4839, "step": 8039 }, { "epoch": 0.97, "learning_rate": 3.2474918303461165e-08, "loss": 2.3934, "step": 8040 }, { "epoch": 0.97, "learning_rate": 3.224687004099891e-08, "loss": 2.5952, "step": 8041 }, { "epoch": 0.97, "learning_rate": 3.2019622722369024e-08, "loss": 2.5002, "step": 8042 }, { "epoch": 0.97, "learning_rate": 3.179317638421109e-08, "loss": 2.492, "step": 8043 }, { "epoch": 0.97, "learning_rate": 3.156753106303367e-08, "loss": 2.425, "step": 8044 }, { "epoch": 0.97, "learning_rate": 3.134268679521824e-08, "loss": 2.5371, "step": 8045 }, { "epoch": 0.97, "learning_rate": 3.1118643617015775e-08, "loss": 2.4483, "step": 8046 }, { "epoch": 0.97, "learning_rate": 3.0895401564547954e-08, "loss": 2.4316, "step": 8047 }, { "epoch": 0.97, "learning_rate": 3.0672960673808205e-08, "loss": 2.5201, "step": 8048 }, { "epoch": 0.97, "learning_rate": 3.0451320980660615e-08, "loss": 2.4943, "step": 8049 }, { "epoch": 0.97, "learning_rate": 3.0230482520839376e-08, "loss": 2.4389, "step": 8050 }, { "epoch": 0.97, "learning_rate": 3.0010445329950456e-08, "loss": 2.4476, "step": 8051 }, { "epoch": 0.97, "learning_rate": 2.979120944346936e-08, "loss": 2.5211, "step": 8052 }, { "epoch": 0.97, "learning_rate": 2.9572774896743928e-08, "loss": 2.6114, "step": 8053 }, { "epoch": 0.97, "learning_rate": 2.93551417249921e-08, "loss": 2.5514, "step": 8054 }, { "epoch": 0.97, "learning_rate": 2.9138309963301913e-08, "loss": 2.4543, "step": 8055 }, { "epoch": 0.97, "learning_rate": 2.892227964663319e-08, "loss": 2.4639, "step": 8056 }, { "epoch": 0.97, "learning_rate": 2.8707050809816394e-08, "loss": 2.2849, "step": 8057 }, { "epoch": 0.97, "learning_rate": 2.8492623487552106e-08, "loss": 2.4419, "step": 8058 }, { "epoch": 0.97, "learning_rate": 2.827899771441267e-08, "loss": 2.7205, "step": 8059 }, { "epoch": 0.97, "learning_rate": 2.8066173524839978e-08, "loss": 2.2535, "step": 8060 }, { "epoch": 0.97, "learning_rate": 2.7854150953148253e-08, "loss": 2.3218, "step": 8061 }, { "epoch": 0.97, "learning_rate": 2.76429300335207e-08, "loss": 2.4108, "step": 8062 }, { "epoch": 0.97, "learning_rate": 2.7432510800012855e-08, "loss": 2.4714, "step": 8063 }, { "epoch": 0.97, "learning_rate": 2.722289328654981e-08, "loss": 2.4038, "step": 8064 }, { "epoch": 0.97, "learning_rate": 2.7014077526928418e-08, "loss": 2.6233, "step": 8065 }, { "epoch": 0.97, "learning_rate": 2.6806063554815632e-08, "loss": 2.4373, "step": 8066 }, { "epoch": 0.97, "learning_rate": 2.659885140374907e-08, "loss": 2.593, "step": 8067 }, { "epoch": 0.97, "learning_rate": 2.6392441107137013e-08, "loss": 2.4281, "step": 8068 }, { "epoch": 0.97, "learning_rate": 2.6186832698258946e-08, "loss": 2.4735, "step": 8069 }, { "epoch": 0.97, "learning_rate": 2.5982026210265575e-08, "loss": 2.4899, "step": 8070 }, { "epoch": 0.97, "learning_rate": 2.5778021676176047e-08, "loss": 2.4278, "step": 8071 }, { "epoch": 0.97, "learning_rate": 2.5574819128882933e-08, "loss": 2.4526, "step": 8072 }, { "epoch": 0.97, "learning_rate": 2.5372418601147807e-08, "loss": 2.6938, "step": 8073 }, { "epoch": 0.97, "learning_rate": 2.5170820125602902e-08, "loss": 2.3191, "step": 8074 }, { "epoch": 0.97, "learning_rate": 2.497002373475277e-08, "loss": 2.5696, "step": 8075 }, { "epoch": 0.97, "learning_rate": 2.4770029460970956e-08, "loss": 2.4943, "step": 8076 }, { "epoch": 0.97, "learning_rate": 2.4570837336502784e-08, "loss": 2.475, "step": 8077 }, { "epoch": 0.97, "learning_rate": 2.4372447393462562e-08, "loss": 2.5633, "step": 8078 }, { "epoch": 0.97, "learning_rate": 2.417485966383748e-08, "loss": 2.4631, "step": 8079 }, { "epoch": 0.97, "learning_rate": 2.3978074179483722e-08, "loss": 2.5786, "step": 8080 }, { "epoch": 0.97, "learning_rate": 2.3782090972129244e-08, "loss": 2.5463, "step": 8081 }, { "epoch": 0.97, "learning_rate": 2.3586910073371548e-08, "loss": 2.6023, "step": 8082 }, { "epoch": 0.97, "learning_rate": 2.3392531514679906e-08, "loss": 2.4445, "step": 8083 }, { "epoch": 0.97, "learning_rate": 2.319895532739369e-08, "loss": 2.6117, "step": 8084 }, { "epoch": 0.97, "learning_rate": 2.3006181542722384e-08, "loss": 2.4663, "step": 8085 }, { "epoch": 0.97, "learning_rate": 2.281421019174668e-08, "loss": 2.3659, "step": 8086 }, { "epoch": 0.97, "learning_rate": 2.262304130541848e-08, "loss": 2.2293, "step": 8087 }, { "epoch": 0.97, "learning_rate": 2.243267491455925e-08, "loss": 2.4403, "step": 8088 }, { "epoch": 0.97, "learning_rate": 2.2243111049861655e-08, "loss": 2.4967, "step": 8089 }, { "epoch": 0.97, "learning_rate": 2.205434974188847e-08, "loss": 2.3527, "step": 8090 }, { "epoch": 0.97, "learning_rate": 2.186639102107424e-08, "loss": 2.4984, "step": 8091 }, { "epoch": 0.97, "learning_rate": 2.1679234917721946e-08, "loss": 2.4879, "step": 8092 }, { "epoch": 0.97, "learning_rate": 2.1492881462007452e-08, "loss": 2.602, "step": 8093 }, { "epoch": 0.97, "learning_rate": 2.1307330683976722e-08, "loss": 2.4107, "step": 8094 }, { "epoch": 0.97, "learning_rate": 2.1122582613544718e-08, "loss": 2.468, "step": 8095 }, { "epoch": 0.97, "learning_rate": 2.093863728049872e-08, "loss": 2.3734, "step": 8096 }, { "epoch": 0.97, "learning_rate": 2.075549471449556e-08, "loss": 2.4779, "step": 8097 }, { "epoch": 0.97, "learning_rate": 2.057315494506329e-08, "loss": 2.5257, "step": 8098 }, { "epoch": 0.97, "learning_rate": 2.039161800160061e-08, "loss": 2.501, "step": 8099 }, { "epoch": 0.97, "learning_rate": 2.0210883913376334e-08, "loss": 2.5441, "step": 8100 }, { "epoch": 0.97, "learning_rate": 2.0030952709529927e-08, "loss": 2.5297, "step": 8101 }, { "epoch": 0.97, "learning_rate": 1.9851824419070965e-08, "loss": 2.513, "step": 8102 }, { "epoch": 0.97, "learning_rate": 1.967349907088023e-08, "loss": 2.5316, "step": 8103 }, { "epoch": 0.97, "learning_rate": 1.9495976693709727e-08, "loss": 2.4145, "step": 8104 }, { "epoch": 0.97, "learning_rate": 1.9319257316179894e-08, "loss": 2.3765, "step": 8105 }, { "epoch": 0.97, "learning_rate": 1.914334096678405e-08, "loss": 2.4922, "step": 8106 }, { "epoch": 0.97, "learning_rate": 1.8968227673883956e-08, "loss": 2.5679, "step": 8107 }, { "epoch": 0.97, "learning_rate": 1.8793917465713686e-08, "loss": 2.4788, "step": 8108 }, { "epoch": 0.97, "learning_rate": 1.8620410370376875e-08, "loss": 2.5197, "step": 8109 }, { "epoch": 0.97, "learning_rate": 1.8447706415847255e-08, "loss": 2.5933, "step": 8110 }, { "epoch": 0.97, "learning_rate": 1.8275805629969778e-08, "loss": 2.5009, "step": 8111 }, { "epoch": 0.97, "learning_rate": 1.8104708040460605e-08, "loss": 2.4543, "step": 8112 }, { "epoch": 0.97, "learning_rate": 1.7934413674904894e-08, "loss": 2.4384, "step": 8113 }, { "epoch": 0.97, "learning_rate": 1.7764922560759014e-08, "loss": 2.4955, "step": 8114 }, { "epoch": 0.97, "learning_rate": 1.7596234725349437e-08, "loss": 2.4736, "step": 8115 }, { "epoch": 0.98, "learning_rate": 1.742835019587441e-08, "loss": 2.4556, "step": 8116 }, { "epoch": 0.98, "learning_rate": 1.7261268999400616e-08, "loss": 2.4773, "step": 8117 }, { "epoch": 0.98, "learning_rate": 1.7094991162867057e-08, "loss": 2.4661, "step": 8118 }, { "epoch": 0.98, "learning_rate": 1.6929516713082295e-08, "loss": 2.3319, "step": 8119 }, { "epoch": 0.98, "learning_rate": 1.676484567672554e-08, "loss": 2.5926, "step": 8120 }, { "epoch": 0.98, "learning_rate": 1.6600978080346108e-08, "loss": 2.398, "step": 8121 }, { "epoch": 0.98, "learning_rate": 1.6437913950364538e-08, "loss": 2.4773, "step": 8122 }, { "epoch": 0.98, "learning_rate": 1.6275653313072015e-08, "loss": 2.6735, "step": 8123 }, { "epoch": 0.98, "learning_rate": 1.6114196194628174e-08, "loss": 2.4705, "step": 8124 }, { "epoch": 0.98, "learning_rate": 1.5953542621066075e-08, "loss": 2.5295, "step": 8125 }, { "epoch": 0.98, "learning_rate": 1.5793692618286115e-08, "loss": 2.5514, "step": 8126 }, { "epoch": 0.98, "learning_rate": 1.563464621206212e-08, "loss": 2.4929, "step": 8127 }, { "epoch": 0.98, "learning_rate": 1.5476403428035803e-08, "loss": 2.3954, "step": 8128 }, { "epoch": 0.98, "learning_rate": 1.5318964291721196e-08, "loss": 2.6618, "step": 8129 }, { "epoch": 0.98, "learning_rate": 1.5162328828501328e-08, "loss": 2.6144, "step": 8130 }, { "epoch": 0.98, "learning_rate": 1.5006497063631e-08, "loss": 2.7542, "step": 8131 }, { "epoch": 0.98, "learning_rate": 1.4851469022234e-08, "loss": 2.2789, "step": 8132 }, { "epoch": 0.98, "learning_rate": 1.4697244729305894e-08, "loss": 2.5679, "step": 8133 }, { "epoch": 0.98, "learning_rate": 1.4543824209711788e-08, "loss": 2.3904, "step": 8134 }, { "epoch": 0.98, "learning_rate": 1.4391207488187453e-08, "loss": 2.5307, "step": 8135 }, { "epoch": 0.98, "learning_rate": 1.4239394589339317e-08, "loss": 2.3717, "step": 8136 }, { "epoch": 0.98, "learning_rate": 1.4088385537643912e-08, "loss": 2.4622, "step": 8137 }, { "epoch": 0.98, "learning_rate": 1.3938180357447318e-08, "loss": 2.5982, "step": 8138 }, { "epoch": 0.98, "learning_rate": 1.3788779072968495e-08, "loss": 2.5639, "step": 8139 }, { "epoch": 0.98, "learning_rate": 1.3640181708293731e-08, "loss": 2.7357, "step": 8140 }, { "epoch": 0.98, "learning_rate": 1.3492388287382196e-08, "loss": 2.3608, "step": 8141 }, { "epoch": 0.98, "learning_rate": 1.3345398834062051e-08, "loss": 2.3723, "step": 8142 }, { "epoch": 0.98, "learning_rate": 1.3199213372031561e-08, "loss": 2.4542, "step": 8143 }, { "epoch": 0.98, "learning_rate": 1.3053831924861315e-08, "loss": 2.3731, "step": 8144 }, { "epoch": 0.98, "learning_rate": 1.2909254515989788e-08, "loss": 2.5814, "step": 8145 }, { "epoch": 0.98, "learning_rate": 1.2765481168727779e-08, "loss": 2.649, "step": 8146 }, { "epoch": 0.98, "learning_rate": 1.2622511906255075e-08, "loss": 2.5635, "step": 8147 }, { "epoch": 0.98, "learning_rate": 1.2480346751622686e-08, "loss": 2.4383, "step": 8148 }, { "epoch": 0.98, "learning_rate": 1.2338985727751719e-08, "loss": 2.5835, "step": 8149 }, { "epoch": 0.98, "learning_rate": 1.2198428857433941e-08, "loss": 2.5639, "step": 8150 }, { "epoch": 0.98, "learning_rate": 1.2058676163330119e-08, "loss": 2.5097, "step": 8151 }, { "epoch": 0.98, "learning_rate": 1.1919727667973335e-08, "loss": 2.6043, "step": 8152 }, { "epoch": 0.98, "learning_rate": 1.1781583393765673e-08, "loss": 2.6138, "step": 8153 }, { "epoch": 0.98, "learning_rate": 1.1644243362980423e-08, "loss": 2.4462, "step": 8154 }, { "epoch": 0.98, "learning_rate": 1.1507707597759876e-08, "loss": 2.5627, "step": 8155 }, { "epoch": 0.98, "learning_rate": 1.137197612011809e-08, "loss": 2.4642, "step": 8156 }, { "epoch": 0.98, "learning_rate": 1.1237048951938666e-08, "loss": 2.563, "step": 8157 }, { "epoch": 0.98, "learning_rate": 1.1102926114975877e-08, "loss": 2.4635, "step": 8158 }, { "epoch": 0.98, "learning_rate": 1.0969607630854084e-08, "loss": 2.4442, "step": 8159 }, { "epoch": 0.98, "learning_rate": 1.0837093521067765e-08, "loss": 2.5965, "step": 8160 }, { "epoch": 0.98, "learning_rate": 1.0705383806982606e-08, "loss": 2.5469, "step": 8161 }, { "epoch": 0.98, "learning_rate": 1.0574478509833286e-08, "loss": 2.5637, "step": 8162 }, { "epoch": 0.98, "learning_rate": 1.0444377650725702e-08, "loss": 2.5458, "step": 8163 }, { "epoch": 0.98, "learning_rate": 1.0315081250636405e-08, "loss": 2.4314, "step": 8164 }, { "epoch": 0.98, "learning_rate": 1.0186589330410945e-08, "loss": 2.5568, "step": 8165 }, { "epoch": 0.98, "learning_rate": 1.0058901910766083e-08, "loss": 2.5783, "step": 8166 }, { "epoch": 0.98, "learning_rate": 9.932019012288685e-09, "loss": 2.55, "step": 8167 }, { "epoch": 0.98, "learning_rate": 9.805940655436274e-09, "loss": 2.3963, "step": 8168 }, { "epoch": 0.98, "learning_rate": 9.68066686053537e-09, "loss": 2.482, "step": 8169 }, { "epoch": 0.98, "learning_rate": 9.556197647784814e-09, "loss": 2.4012, "step": 8170 }, { "epoch": 0.98, "learning_rate": 9.43253303725189e-09, "loss": 2.465, "step": 8171 }, { "epoch": 0.98, "learning_rate": 9.30967304887509e-09, "loss": 2.5418, "step": 8172 }, { "epoch": 0.98, "learning_rate": 9.187617702463014e-09, "loss": 2.5482, "step": 8173 }, { "epoch": 0.98, "learning_rate": 9.066367017694366e-09, "loss": 2.381, "step": 8174 }, { "epoch": 0.98, "learning_rate": 8.945921014117954e-09, "loss": 2.5039, "step": 8175 }, { "epoch": 0.98, "learning_rate": 8.826279711153795e-09, "loss": 2.5449, "step": 8176 }, { "epoch": 0.98, "learning_rate": 8.707443128090908e-09, "loss": 2.5104, "step": 8177 }, { "epoch": 0.98, "learning_rate": 8.589411284089522e-09, "loss": 2.6798, "step": 8178 }, { "epoch": 0.98, "learning_rate": 8.472184198179412e-09, "loss": 2.4502, "step": 8179 }, { "epoch": 0.98, "learning_rate": 8.35576188926046e-09, "loss": 2.4924, "step": 8180 }, { "epoch": 0.98, "learning_rate": 8.240144376104876e-09, "loss": 2.5149, "step": 8181 }, { "epoch": 0.98, "learning_rate": 8.125331677352188e-09, "loss": 2.3395, "step": 8182 }, { "epoch": 0.98, "learning_rate": 8.011323811513704e-09, "loss": 2.4903, "step": 8183 }, { "epoch": 0.98, "learning_rate": 7.898120796970831e-09, "loss": 2.6128, "step": 8184 }, { "epoch": 0.98, "learning_rate": 7.78572265197508e-09, "loss": 2.5722, "step": 8185 }, { "epoch": 0.98, "learning_rate": 7.674129394648623e-09, "loss": 2.4804, "step": 8186 }, { "epoch": 0.98, "learning_rate": 7.563341042983174e-09, "loss": 2.4066, "step": 8187 }, { "epoch": 0.98, "learning_rate": 7.453357614841116e-09, "loss": 2.401, "step": 8188 }, { "epoch": 0.98, "learning_rate": 7.344179127954376e-09, "loss": 2.5883, "step": 8189 }, { "epoch": 0.98, "learning_rate": 7.235805599926093e-09, "loss": 2.5615, "step": 8190 }, { "epoch": 0.98, "learning_rate": 7.128237048229514e-09, "loss": 2.4466, "step": 8191 }, { "epoch": 0.98, "learning_rate": 7.0214734902074314e-09, "loss": 2.4612, "step": 8192 }, { "epoch": 0.98, "learning_rate": 6.9155149430732985e-09, "loss": 2.4596, "step": 8193 }, { "epoch": 0.98, "learning_rate": 6.810361423910117e-09, "loss": 2.5326, "step": 8194 }, { "epoch": 0.98, "learning_rate": 6.706012949672103e-09, "loss": 2.3822, "step": 8195 }, { "epoch": 0.98, "learning_rate": 6.60246953718302e-09, "loss": 2.5622, "step": 8196 }, { "epoch": 0.98, "learning_rate": 6.499731203137294e-09, "loss": 2.6148, "step": 8197 }, { "epoch": 0.98, "learning_rate": 6.3977979640994504e-09, "loss": 2.4227, "step": 8198 }, { "epoch": 0.98, "learning_rate": 6.296669836503566e-09, "loss": 2.3367, "step": 8199 }, { "epoch": 0.99, "learning_rate": 6.196346836654932e-09, "loss": 2.571, "step": 8200 }, { "epoch": 0.99, "learning_rate": 6.096828980727832e-09, "loss": 2.3922, "step": 8201 }, { "epoch": 0.99, "learning_rate": 5.9981162847672085e-09, "loss": 2.4372, "step": 8202 }, { "epoch": 0.99, "learning_rate": 5.900208764689774e-09, "loss": 2.6134, "step": 8203 }, { "epoch": 0.99, "learning_rate": 5.803106436279571e-09, "loss": 2.4157, "step": 8204 }, { "epoch": 0.99, "learning_rate": 5.706809315192963e-09, "loss": 2.5498, "step": 8205 }, { "epoch": 0.99, "learning_rate": 5.611317416955308e-09, "loss": 2.4451, "step": 8206 }, { "epoch": 0.99, "learning_rate": 5.516630756963182e-09, "loss": 2.3918, "step": 8207 }, { "epoch": 0.99, "learning_rate": 5.422749350482148e-09, "loss": 2.3648, "step": 8208 }, { "epoch": 0.99, "learning_rate": 5.329673212649544e-09, "loss": 2.4885, "step": 8209 }, { "epoch": 0.99, "learning_rate": 5.237402358471144e-09, "loss": 2.3634, "step": 8210 }, { "epoch": 0.99, "learning_rate": 5.145936802823937e-09, "loss": 2.4086, "step": 8211 }, { "epoch": 0.99, "learning_rate": 5.055276560454459e-09, "loss": 2.5217, "step": 8212 }, { "epoch": 0.99, "learning_rate": 4.965421645979907e-09, "loss": 2.4708, "step": 8213 }, { "epoch": 0.99, "learning_rate": 4.876372073887581e-09, "loss": 2.3934, "step": 8214 }, { "epoch": 0.99, "learning_rate": 4.788127858534886e-09, "loss": 2.4085, "step": 8215 }, { "epoch": 0.99, "learning_rate": 4.700689014149329e-09, "loss": 2.528, "step": 8216 }, { "epoch": 0.99, "learning_rate": 4.614055554827967e-09, "loss": 2.557, "step": 8217 }, { "epoch": 0.99, "learning_rate": 4.5282274945396276e-09, "loss": 2.497, "step": 8218 }, { "epoch": 0.99, "learning_rate": 4.443204847121019e-09, "loss": 2.5316, "step": 8219 }, { "epoch": 0.99, "learning_rate": 4.358987626281175e-09, "loss": 2.4091, "step": 8220 }, { "epoch": 0.99, "learning_rate": 4.275575845597568e-09, "loss": 2.4405, "step": 8221 }, { "epoch": 0.99, "learning_rate": 4.192969518519441e-09, "loss": 2.4955, "step": 8222 }, { "epoch": 0.99, "learning_rate": 4.111168658365028e-09, "loss": 2.4421, "step": 8223 }, { "epoch": 0.99, "learning_rate": 4.0301732783226685e-09, "loss": 2.4354, "step": 8224 }, { "epoch": 0.99, "learning_rate": 3.949983391450807e-09, "loss": 2.4029, "step": 8225 }, { "epoch": 0.99, "learning_rate": 3.870599010679099e-09, "loss": 2.6248, "step": 8226 }, { "epoch": 0.99, "learning_rate": 3.792020148806197e-09, "loss": 2.3476, "step": 8227 }, { "epoch": 0.99, "learning_rate": 3.71424681850141e-09, "loss": 2.462, "step": 8228 }, { "epoch": 0.99, "learning_rate": 3.637279032304153e-09, "loss": 2.5265, "step": 8229 }, { "epoch": 0.99, "learning_rate": 3.5611168026228326e-09, "loss": 2.6097, "step": 8230 }, { "epoch": 0.99, "learning_rate": 3.4857601417387365e-09, "loss": 2.4939, "step": 8231 }, { "epoch": 0.99, "learning_rate": 3.411209061799925e-09, "loss": 2.3645, "step": 8232 }, { "epoch": 0.99, "learning_rate": 3.3374635748267827e-09, "loss": 2.2656, "step": 8233 }, { "epoch": 0.99, "learning_rate": 3.2645236927092426e-09, "loss": 2.5451, "step": 8234 }, { "epoch": 0.99, "learning_rate": 3.192389427207343e-09, "loss": 2.5124, "step": 8235 }, { "epoch": 0.99, "learning_rate": 3.1210607899512244e-09, "loss": 2.6119, "step": 8236 }, { "epoch": 0.99, "learning_rate": 3.0505377924405778e-09, "loss": 2.428, "step": 8237 }, { "epoch": 0.99, "learning_rate": 2.9808204460463064e-09, "loss": 2.3868, "step": 8238 }, { "epoch": 0.99, "learning_rate": 2.911908762008864e-09, "loss": 2.4861, "step": 8239 }, { "epoch": 0.99, "learning_rate": 2.8438027514382517e-09, "loss": 2.5844, "step": 8240 }, { "epoch": 0.99, "learning_rate": 2.7765024253156856e-09, "loss": 2.6198, "step": 8241 }, { "epoch": 0.99, "learning_rate": 2.710007794491376e-09, "loss": 2.4432, "step": 8242 }, { "epoch": 0.99, "learning_rate": 2.6443188696867462e-09, "loss": 2.4262, "step": 8243 }, { "epoch": 0.99, "learning_rate": 2.579435661492213e-09, "loss": 2.5472, "step": 8244 }, { "epoch": 0.99, "learning_rate": 2.5153581803688544e-09, "loss": 2.5657, "step": 8245 }, { "epoch": 0.99, "learning_rate": 2.452086436648404e-09, "loss": 2.4245, "step": 8246 }, { "epoch": 0.99, "learning_rate": 2.3896204405310373e-09, "loss": 2.4933, "step": 8247 }, { "epoch": 0.99, "learning_rate": 2.3279602020892522e-09, "loss": 2.6031, "step": 8248 }, { "epoch": 0.99, "learning_rate": 2.2671057312634305e-09, "loss": 2.4978, "step": 8249 }, { "epoch": 0.99, "learning_rate": 2.207057037865168e-09, "loss": 2.4621, "step": 8250 }, { "epoch": 0.99, "learning_rate": 2.14781413157672e-09, "loss": 2.6318, "step": 8251 }, { "epoch": 0.99, "learning_rate": 2.0893770219493347e-09, "loss": 2.5875, "step": 8252 }, { "epoch": 0.99, "learning_rate": 2.0317457184043654e-09, "loss": 2.4807, "step": 8253 }, { "epoch": 0.99, "learning_rate": 1.9749202302343784e-09, "loss": 2.5129, "step": 8254 }, { "epoch": 0.99, "learning_rate": 1.918900566600379e-09, "loss": 2.5663, "step": 8255 }, { "epoch": 0.99, "learning_rate": 1.863686736535697e-09, "loss": 2.4534, "step": 8256 }, { "epoch": 0.99, "learning_rate": 1.8092787489404352e-09, "loss": 2.6267, "step": 8257 }, { "epoch": 0.99, "learning_rate": 1.755676612588686e-09, "loss": 2.3115, "step": 8258 }, { "epoch": 0.99, "learning_rate": 1.7028803361213152e-09, "loss": 2.4257, "step": 8259 }, { "epoch": 0.99, "learning_rate": 1.6508899280515134e-09, "loss": 2.5104, "step": 8260 }, { "epoch": 0.99, "learning_rate": 1.5997053967603538e-09, "loss": 2.5339, "step": 8261 }, { "epoch": 0.99, "learning_rate": 1.5493267505017895e-09, "loss": 2.3132, "step": 8262 }, { "epoch": 0.99, "learning_rate": 1.499753997397102e-09, "loss": 2.448, "step": 8263 }, { "epoch": 0.99, "learning_rate": 1.450987145439342e-09, "loss": 2.5244, "step": 8264 }, { "epoch": 0.99, "learning_rate": 1.403026202491109e-09, "loss": 2.355, "step": 8265 }, { "epoch": 0.99, "learning_rate": 1.3558711762851063e-09, "loss": 2.5497, "step": 8266 }, { "epoch": 0.99, "learning_rate": 1.309522074424141e-09, "loss": 2.4854, "step": 8267 }, { "epoch": 0.99, "learning_rate": 1.2639789043805695e-09, "loss": 2.4989, "step": 8268 }, { "epoch": 0.99, "learning_rate": 1.2192416734979617e-09, "loss": 2.3725, "step": 8269 }, { "epoch": 0.99, "learning_rate": 1.1753103889883267e-09, "loss": 2.5154, "step": 8270 }, { "epoch": 0.99, "learning_rate": 1.132185057935442e-09, "loss": 2.3742, "step": 8271 }, { "epoch": 0.99, "learning_rate": 1.0898656872920798e-09, "loss": 2.5806, "step": 8272 }, { "epoch": 0.99, "learning_rate": 1.0483522838811155e-09, "loss": 2.4613, "step": 8273 }, { "epoch": 0.99, "learning_rate": 1.0076448543960838e-09, "loss": 2.4708, "step": 8274 }, { "epoch": 0.99, "learning_rate": 9.677434053995127e-10, "loss": 2.4681, "step": 8275 }, { "epoch": 0.99, "learning_rate": 9.286479433257e-10, "loss": 2.5984, "step": 8276 }, { "epoch": 0.99, "learning_rate": 8.903584744768268e-10, "loss": 2.494, "step": 8277 }, { "epoch": 0.99, "learning_rate": 8.528750050273982e-10, "loss": 2.5161, "step": 8278 }, { "epoch": 0.99, "learning_rate": 8.161975410198031e-10, "loss": 2.3601, "step": 8279 }, { "epoch": 0.99, "learning_rate": 7.803260883681996e-10, "loss": 2.5558, "step": 8280 }, { "epoch": 0.99, "learning_rate": 7.452606528557393e-10, "loss": 2.5375, "step": 8281 }, { "epoch": 0.99, "learning_rate": 7.110012401362332e-10, "loss": 2.5502, "step": 8282 }, { "epoch": 1.0, "learning_rate": 6.775478557324855e-10, "loss": 2.6348, "step": 8283 }, { "epoch": 1.0, "learning_rate": 6.4490050503907e-10, "loss": 2.5907, "step": 8284 }, { "epoch": 1.0, "learning_rate": 6.13059193319554e-10, "loss": 2.5646, "step": 8285 }, { "epoch": 1.0, "learning_rate": 5.820239257070537e-10, "loss": 2.281, "step": 8286 }, { "epoch": 1.0, "learning_rate": 5.517947072064544e-10, "loss": 2.5137, "step": 8287 }, { "epoch": 1.0, "learning_rate": 5.2237154268997e-10, "loss": 2.714, "step": 8288 }, { "epoch": 1.0, "learning_rate": 4.937544369032488e-10, "loss": 2.6214, "step": 8289 }, { "epoch": 1.0, "learning_rate": 4.659433944587122e-10, "loss": 2.5226, "step": 8290 }, { "epoch": 1.0, "learning_rate": 4.389384198405511e-10, "loss": 2.6566, "step": 8291 }, { "epoch": 1.0, "learning_rate": 4.127395174036153e-10, "loss": 2.3989, "step": 8292 }, { "epoch": 1.0, "learning_rate": 3.8734669137119316e-10, "loss": 2.3277, "step": 8293 }, { "epoch": 1.0, "learning_rate": 3.627599458377873e-10, "loss": 2.5224, "step": 8294 }, { "epoch": 1.0, "learning_rate": 3.389792847668938e-10, "loss": 2.6145, "step": 8295 }, { "epoch": 1.0, "learning_rate": 3.1600471199322304e-10, "loss": 2.4101, "step": 8296 }, { "epoch": 1.0, "learning_rate": 2.938362312199239e-10, "loss": 2.4066, "step": 8297 }, { "epoch": 1.0, "learning_rate": 2.7247384602246964e-10, "loss": 2.3178, "step": 8298 }, { "epoch": 1.0, "learning_rate": 2.5191755984477204e-10, "loss": 2.4465, "step": 8299 }, { "epoch": 1.0, "learning_rate": 2.321673760002918e-10, "loss": 2.392, "step": 8300 }, { "epoch": 1.0, "learning_rate": 2.1322329767425875e-10, "loss": 2.497, "step": 8301 }, { "epoch": 1.0, "learning_rate": 1.950853279203413e-10, "loss": 2.365, "step": 8302 }, { "epoch": 1.0, "learning_rate": 1.77753469663422e-10, "loss": 2.5538, "step": 8303 }, { "epoch": 1.0, "learning_rate": 1.6122772569793221e-10, "loss": 2.5754, "step": 8304 }, { "epoch": 1.0, "learning_rate": 1.4550809868729698e-10, "loss": 2.3786, "step": 8305 }, { "epoch": 1.0, "learning_rate": 1.305945911672657e-10, "loss": 2.2847, "step": 8306 }, { "epoch": 1.0, "learning_rate": 1.164872055414712e-10, "loss": 2.3156, "step": 8307 }, { "epoch": 1.0, "learning_rate": 1.0318594408476045e-10, "loss": 2.5269, "step": 8308 }, { "epoch": 1.0, "learning_rate": 9.069080894152926e-11, "loss": 2.4647, "step": 8309 }, { "epoch": 1.0, "learning_rate": 7.90018021268324e-11, "loss": 2.339, "step": 8310 }, { "epoch": 1.0, "learning_rate": 6.811892552471832e-11, "loss": 2.3976, "step": 8311 }, { "epoch": 1.0, "learning_rate": 5.804218088933944e-11, "loss": 2.4379, "step": 8312 }, { "epoch": 1.0, "learning_rate": 4.877156984661735e-11, "loss": 2.5229, "step": 8313 }, { "epoch": 1.0, "learning_rate": 4.030709389035714e-11, "loss": 2.5463, "step": 8314 }, { "epoch": 1.0, "learning_rate": 3.264875438613313e-11, "loss": 2.5688, "step": 8315 }, { "epoch": 1.0, "learning_rate": 2.57965525674031e-11, "loss": 2.4653, "step": 8316 }, { "epoch": 1.0, "learning_rate": 1.975048953994918e-11, "loss": 2.4684, "step": 8317 }, { "epoch": 1.0, "learning_rate": 1.4510566277992077e-11, "loss": 2.5291, "step": 8318 }, { "epoch": 1.0, "learning_rate": 1.0076783626966625e-11, "loss": 2.4207, "step": 8319 }, { "epoch": 1.0, "learning_rate": 6.449142300746225e-12, "loss": 2.5677, "step": 8320 }, { "epoch": 1.0, "learning_rate": 3.6276428855286373e-12, "loss": 2.5879, "step": 8321 }, { "epoch": 1.0, "learning_rate": 1.6122858353950776e-12, "loss": 2.5597, "step": 8322 }, { "epoch": 1.0, "learning_rate": 4.030714750857811e-13, "loss": 2.5695, "step": 8323 }, { "epoch": 1.0, "learning_rate": 0.0, "loss": 2.521, "step": 8324 }, { "epoch": 1.0, "step": 8324, "total_flos": 1.0732074279370752e+18, "train_loss": 2.5607235752465, "train_runtime": 9425.8937, "train_samples_per_second": 56.515, "train_steps_per_second": 0.883 } ], "max_steps": 8324, "num_train_epochs": 1, "total_flos": 1.0732074279370752e+18, "trial_name": null, "trial_params": null }