diff --git "a/trainer_state.json" "b/trainer_state.json" new file mode 100644--- /dev/null +++ "b/trainer_state.json" @@ -0,0 +1,199195 @@ +{ + "best_metric": null, + "best_model_checkpoint": null, + "epoch": 1.0, + "global_step": 33195, + "is_hyper_param_search": false, + "is_local_process_zero": true, + "is_world_process_zero": true, + "log_history": [ + { + "epoch": 0.0, + "learning_rate": 5.02008032128514e-09, + "loss": 2.4155, + "step": 1 + }, + { + "epoch": 0.0, + "learning_rate": 1.004016064257028e-08, + "loss": 2.5479, + "step": 2 + }, + { + "epoch": 0.0, + "learning_rate": 1.5060240963855425e-08, + "loss": 2.5901, + "step": 3 + }, + { + "epoch": 0.0, + "learning_rate": 2.008032128514056e-08, + "loss": 2.7227, + "step": 4 + }, + { + "epoch": 0.0, + "learning_rate": 2.5100401606425703e-08, + "loss": 2.562, + "step": 5 + }, + { + "epoch": 0.0, + "learning_rate": 3.012048192771085e-08, + "loss": 2.8206, + "step": 6 + }, + { + "epoch": 0.0, + "learning_rate": 3.5140562248995985e-08, + "loss": 2.6187, + "step": 7 + }, + { + "epoch": 0.0, + "learning_rate": 4.016064257028112e-08, + "loss": 2.5796, + "step": 8 + }, + { + "epoch": 0.0, + "learning_rate": 4.5180722891566264e-08, + "loss": 2.5427, + "step": 9 + }, + { + "epoch": 0.0, + "learning_rate": 5.0200803212851406e-08, + "loss": 2.6848, + "step": 10 + }, + { + "epoch": 0.0, + "learning_rate": 5.522088353413655e-08, + "loss": 2.696, + "step": 11 + }, + { + "epoch": 0.0, + "learning_rate": 6.02409638554217e-08, + "loss": 2.8428, + "step": 12 + }, + { + "epoch": 0.0, + "learning_rate": 6.526104417670683e-08, + "loss": 2.7173, + "step": 13 + }, + { + "epoch": 0.0, + "learning_rate": 7.028112449799197e-08, + "loss": 2.4712, + "step": 14 + }, + { + "epoch": 0.0, + "learning_rate": 7.530120481927711e-08, + "loss": 2.3896, + "step": 15 + }, + { + "epoch": 0.0, + "learning_rate": 8.032128514056224e-08, + "loss": 2.5011, + "step": 16 + }, + { + "epoch": 0.0, + "learning_rate": 8.53413654618474e-08, + "loss": 2.7654, + "step": 17 + }, + { + "epoch": 0.0, + "learning_rate": 9.036144578313253e-08, + "loss": 2.8972, + "step": 18 + }, + { + "epoch": 0.0, + "learning_rate": 9.538152610441768e-08, + "loss": 2.7473, + "step": 19 + }, + { + "epoch": 0.0, + "learning_rate": 1.0040160642570281e-07, + "loss": 2.4688, + "step": 20 + }, + { + "epoch": 0.0, + "learning_rate": 1.0542168674698796e-07, + "loss": 2.4634, + "step": 21 + }, + { + "epoch": 0.0, + "learning_rate": 1.104417670682731e-07, + "loss": 2.5532, + "step": 22 + }, + { + "epoch": 0.0, + "learning_rate": 1.1546184738955824e-07, + "loss": 2.6824, + "step": 23 + }, + { + "epoch": 0.0, + "learning_rate": 1.204819277108434e-07, + "loss": 2.5073, + "step": 24 + }, + { + "epoch": 0.0, + "learning_rate": 1.2550200803212853e-07, + "loss": 2.9604, + "step": 25 + }, + { + "epoch": 0.0, + "learning_rate": 1.3052208835341366e-07, + "loss": 2.2404, + "step": 26 + }, + { + "epoch": 0.0, + "learning_rate": 1.355421686746988e-07, + "loss": 2.3335, + "step": 27 + }, + { + "epoch": 0.0, + "learning_rate": 1.4056224899598394e-07, + "loss": 2.2633, + "step": 28 + }, + { + "epoch": 0.0, + "learning_rate": 1.455823293172691e-07, + "loss": 2.1682, + "step": 29 + }, + { + "epoch": 0.0, + "learning_rate": 1.5060240963855423e-07, + "loss": 2.259, + "step": 30 + }, + { + "epoch": 0.0, + "learning_rate": 1.5562248995983936e-07, + "loss": 2.3323, + "step": 31 + }, + { + "epoch": 0.0, + "learning_rate": 1.6064257028112448e-07, + "loss": 2.1294, + "step": 32 + }, + { + "epoch": 0.0, + "learning_rate": 1.6566265060240967e-07, + "loss": 1.9897, + "step": 33 + }, + { + "epoch": 0.0, + "learning_rate": 1.706827309236948e-07, + "loss": 1.9979, + "step": 34 + }, + { + "epoch": 0.0, + "learning_rate": 1.7570281124497993e-07, + "loss": 2.1283, + "step": 35 + }, + { + "epoch": 0.0, + "learning_rate": 1.8072289156626505e-07, + "loss": 2.0967, + "step": 36 + }, + { + "epoch": 0.0, + "learning_rate": 1.857429718875502e-07, + "loss": 2.1406, + "step": 37 + }, + { + "epoch": 0.0, + "learning_rate": 1.9076305220883537e-07, + "loss": 2.1028, + "step": 38 + }, + { + "epoch": 0.0, + "learning_rate": 1.957831325301205e-07, + "loss": 1.8724, + "step": 39 + }, + { + "epoch": 0.0, + "learning_rate": 2.0080321285140563e-07, + "loss": 1.9177, + "step": 40 + }, + { + "epoch": 0.0, + "learning_rate": 2.0582329317269078e-07, + "loss": 1.9093, + "step": 41 + }, + { + "epoch": 0.0, + "learning_rate": 2.108433734939759e-07, + "loss": 1.8374, + "step": 42 + }, + { + "epoch": 0.0, + "learning_rate": 2.1586345381526107e-07, + "loss": 1.8722, + "step": 43 + }, + { + "epoch": 0.0, + "learning_rate": 2.208835341365462e-07, + "loss": 1.8756, + "step": 44 + }, + { + "epoch": 0.0, + "learning_rate": 2.2590361445783135e-07, + "loss": 1.7311, + "step": 45 + }, + { + "epoch": 0.0, + "learning_rate": 2.3092369477911648e-07, + "loss": 1.7499, + "step": 46 + }, + { + "epoch": 0.0, + "learning_rate": 2.359437751004016e-07, + "loss": 1.6642, + "step": 47 + }, + { + "epoch": 0.0, + "learning_rate": 2.409638554216868e-07, + "loss": 1.7401, + "step": 48 + }, + { + "epoch": 0.0, + "learning_rate": 2.459839357429719e-07, + "loss": 1.7141, + "step": 49 + }, + { + "epoch": 0.0, + "learning_rate": 2.5100401606425705e-07, + "loss": 1.8718, + "step": 50 + }, + { + "epoch": 0.0, + "learning_rate": 2.560240963855422e-07, + "loss": 1.6438, + "step": 51 + }, + { + "epoch": 0.0, + "learning_rate": 2.610441767068273e-07, + "loss": 1.5062, + "step": 52 + }, + { + "epoch": 0.0, + "learning_rate": 2.6606425702811247e-07, + "loss": 1.6093, + "step": 53 + }, + { + "epoch": 0.0, + "learning_rate": 2.710843373493976e-07, + "loss": 1.5728, + "step": 54 + }, + { + "epoch": 0.0, + "learning_rate": 2.761044176706828e-07, + "loss": 1.6921, + "step": 55 + }, + { + "epoch": 0.0, + "learning_rate": 2.811244979919679e-07, + "loss": 1.7946, + "step": 56 + }, + { + "epoch": 0.0, + "learning_rate": 2.8614457831325304e-07, + "loss": 1.604, + "step": 57 + }, + { + "epoch": 0.0, + "learning_rate": 2.911646586345382e-07, + "loss": 1.5355, + "step": 58 + }, + { + "epoch": 0.0, + "learning_rate": 2.9618473895582335e-07, + "loss": 1.5288, + "step": 59 + }, + { + "epoch": 0.0, + "learning_rate": 3.0120481927710845e-07, + "loss": 1.5636, + "step": 60 + }, + { + "epoch": 0.0, + "learning_rate": 3.062248995983936e-07, + "loss": 1.5856, + "step": 61 + }, + { + "epoch": 0.0, + "learning_rate": 3.112449799196787e-07, + "loss": 1.5604, + "step": 62 + }, + { + "epoch": 0.0, + "learning_rate": 3.1626506024096387e-07, + "loss": 1.537, + "step": 63 + }, + { + "epoch": 0.0, + "learning_rate": 3.2128514056224897e-07, + "loss": 1.5649, + "step": 64 + }, + { + "epoch": 0.0, + "learning_rate": 3.263052208835342e-07, + "loss": 1.5441, + "step": 65 + }, + { + "epoch": 0.0, + "learning_rate": 3.3132530120481933e-07, + "loss": 1.4779, + "step": 66 + }, + { + "epoch": 0.0, + "learning_rate": 3.363453815261045e-07, + "loss": 1.5302, + "step": 67 + }, + { + "epoch": 0.0, + "learning_rate": 3.413654618473896e-07, + "loss": 1.6504, + "step": 68 + }, + { + "epoch": 0.0, + "learning_rate": 3.4638554216867475e-07, + "loss": 1.5765, + "step": 69 + }, + { + "epoch": 0.0, + "learning_rate": 3.5140562248995985e-07, + "loss": 1.4261, + "step": 70 + }, + { + "epoch": 0.0, + "learning_rate": 3.56425702811245e-07, + "loss": 1.5109, + "step": 71 + }, + { + "epoch": 0.0, + "learning_rate": 3.614457831325301e-07, + "loss": 1.4829, + "step": 72 + }, + { + "epoch": 0.0, + "learning_rate": 3.6646586345381527e-07, + "loss": 1.3701, + "step": 73 + }, + { + "epoch": 0.0, + "learning_rate": 3.714859437751004e-07, + "loss": 1.5048, + "step": 74 + }, + { + "epoch": 0.0, + "learning_rate": 3.7650602409638563e-07, + "loss": 1.5005, + "step": 75 + }, + { + "epoch": 0.0, + "learning_rate": 3.8152610441767073e-07, + "loss": 1.4692, + "step": 76 + }, + { + "epoch": 0.0, + "learning_rate": 3.865461847389559e-07, + "loss": 1.4747, + "step": 77 + }, + { + "epoch": 0.0, + "learning_rate": 3.91566265060241e-07, + "loss": 1.478, + "step": 78 + }, + { + "epoch": 0.0, + "learning_rate": 3.9658634538152615e-07, + "loss": 1.4521, + "step": 79 + }, + { + "epoch": 0.0, + "learning_rate": 4.0160642570281125e-07, + "loss": 1.4882, + "step": 80 + }, + { + "epoch": 0.0, + "learning_rate": 4.066265060240964e-07, + "loss": 1.5562, + "step": 81 + }, + { + "epoch": 0.0, + "learning_rate": 4.1164658634538156e-07, + "loss": 1.458, + "step": 82 + }, + { + "epoch": 0.0, + "learning_rate": 4.1666666666666667e-07, + "loss": 1.4043, + "step": 83 + }, + { + "epoch": 0.0, + "learning_rate": 4.216867469879518e-07, + "loss": 1.3, + "step": 84 + }, + { + "epoch": 0.0, + "learning_rate": 4.2670682730923703e-07, + "loss": 1.4576, + "step": 85 + }, + { + "epoch": 0.0, + "learning_rate": 4.3172690763052213e-07, + "loss": 1.4498, + "step": 86 + }, + { + "epoch": 0.0, + "learning_rate": 4.367469879518073e-07, + "loss": 1.506, + "step": 87 + }, + { + "epoch": 0.0, + "learning_rate": 4.417670682730924e-07, + "loss": 1.3972, + "step": 88 + }, + { + "epoch": 0.0, + "learning_rate": 4.4678714859437755e-07, + "loss": 1.4575, + "step": 89 + }, + { + "epoch": 0.0, + "learning_rate": 4.518072289156627e-07, + "loss": 1.4003, + "step": 90 + }, + { + "epoch": 0.0, + "learning_rate": 4.568273092369478e-07, + "loss": 1.2924, + "step": 91 + }, + { + "epoch": 0.0, + "learning_rate": 4.6184738955823296e-07, + "loss": 1.3619, + "step": 92 + }, + { + "epoch": 0.0, + "learning_rate": 4.6686746987951807e-07, + "loss": 1.5461, + "step": 93 + }, + { + "epoch": 0.0, + "learning_rate": 4.718875502008032e-07, + "loss": 1.572, + "step": 94 + }, + { + "epoch": 0.0, + "learning_rate": 4.769076305220884e-07, + "loss": 1.3987, + "step": 95 + }, + { + "epoch": 0.0, + "learning_rate": 4.819277108433736e-07, + "loss": 1.4033, + "step": 96 + }, + { + "epoch": 0.0, + "learning_rate": 4.869477911646587e-07, + "loss": 1.3839, + "step": 97 + }, + { + "epoch": 0.0, + "learning_rate": 4.919678714859438e-07, + "loss": 1.3643, + "step": 98 + }, + { + "epoch": 0.0, + "learning_rate": 4.96987951807229e-07, + "loss": 1.2183, + "step": 99 + }, + { + "epoch": 0.0, + "learning_rate": 5.020080321285141e-07, + "loss": 1.577, + "step": 100 + }, + { + "epoch": 0.0, + "learning_rate": 5.070281124497993e-07, + "loss": 1.3492, + "step": 101 + }, + { + "epoch": 0.0, + "learning_rate": 5.120481927710844e-07, + "loss": 1.267, + "step": 102 + }, + { + "epoch": 0.0, + "learning_rate": 5.170682730923695e-07, + "loss": 1.3755, + "step": 103 + }, + { + "epoch": 0.0, + "learning_rate": 5.220883534136546e-07, + "loss": 1.3232, + "step": 104 + }, + { + "epoch": 0.0, + "learning_rate": 5.271084337349399e-07, + "loss": 1.2084, + "step": 105 + }, + { + "epoch": 0.0, + "learning_rate": 5.321285140562249e-07, + "loss": 1.4172, + "step": 106 + }, + { + "epoch": 0.0, + "learning_rate": 5.371485943775101e-07, + "loss": 1.3521, + "step": 107 + }, + { + "epoch": 0.0, + "learning_rate": 5.421686746987952e-07, + "loss": 1.4406, + "step": 108 + }, + { + "epoch": 0.0, + "learning_rate": 5.471887550200804e-07, + "loss": 1.3184, + "step": 109 + }, + { + "epoch": 0.0, + "learning_rate": 5.522088353413656e-07, + "loss": 1.204, + "step": 110 + }, + { + "epoch": 0.0, + "learning_rate": 5.572289156626506e-07, + "loss": 1.3633, + "step": 111 + }, + { + "epoch": 0.0, + "learning_rate": 5.622489959839358e-07, + "loss": 1.3525, + "step": 112 + }, + { + "epoch": 0.0, + "learning_rate": 5.672690763052209e-07, + "loss": 1.2325, + "step": 113 + }, + { + "epoch": 0.0, + "learning_rate": 5.722891566265061e-07, + "loss": 1.2248, + "step": 114 + }, + { + "epoch": 0.0, + "learning_rate": 5.773092369477912e-07, + "loss": 1.2024, + "step": 115 + }, + { + "epoch": 0.0, + "learning_rate": 5.823293172690764e-07, + "loss": 1.3489, + "step": 116 + }, + { + "epoch": 0.0, + "learning_rate": 5.873493975903615e-07, + "loss": 1.3716, + "step": 117 + }, + { + "epoch": 0.0, + "learning_rate": 5.923694779116467e-07, + "loss": 1.2109, + "step": 118 + }, + { + "epoch": 0.0, + "learning_rate": 5.973895582329317e-07, + "loss": 1.2858, + "step": 119 + }, + { + "epoch": 0.0, + "learning_rate": 6.024096385542169e-07, + "loss": 1.3219, + "step": 120 + }, + { + "epoch": 0.0, + "learning_rate": 6.074297188755021e-07, + "loss": 1.2228, + "step": 121 + }, + { + "epoch": 0.0, + "learning_rate": 6.124497991967872e-07, + "loss": 1.3014, + "step": 122 + }, + { + "epoch": 0.0, + "learning_rate": 6.174698795180723e-07, + "loss": 1.2285, + "step": 123 + }, + { + "epoch": 0.0, + "learning_rate": 6.224899598393574e-07, + "loss": 1.1723, + "step": 124 + }, + { + "epoch": 0.0, + "learning_rate": 6.275100401606427e-07, + "loss": 1.4469, + "step": 125 + }, + { + "epoch": 0.0, + "learning_rate": 6.325301204819277e-07, + "loss": 1.2423, + "step": 126 + }, + { + "epoch": 0.0, + "learning_rate": 6.375502008032129e-07, + "loss": 1.2848, + "step": 127 + }, + { + "epoch": 0.0, + "learning_rate": 6.425702811244979e-07, + "loss": 1.3463, + "step": 128 + }, + { + "epoch": 0.0, + "learning_rate": 6.475903614457832e-07, + "loss": 1.3191, + "step": 129 + }, + { + "epoch": 0.0, + "learning_rate": 6.526104417670684e-07, + "loss": 1.1904, + "step": 130 + }, + { + "epoch": 0.0, + "learning_rate": 6.576305220883534e-07, + "loss": 1.4174, + "step": 131 + }, + { + "epoch": 0.0, + "learning_rate": 6.626506024096387e-07, + "loss": 1.135, + "step": 132 + }, + { + "epoch": 0.0, + "learning_rate": 6.676706827309237e-07, + "loss": 1.2214, + "step": 133 + }, + { + "epoch": 0.0, + "learning_rate": 6.72690763052209e-07, + "loss": 1.22, + "step": 134 + }, + { + "epoch": 0.0, + "learning_rate": 6.77710843373494e-07, + "loss": 1.2402, + "step": 135 + }, + { + "epoch": 0.0, + "learning_rate": 6.827309236947792e-07, + "loss": 1.4093, + "step": 136 + }, + { + "epoch": 0.0, + "learning_rate": 6.877510040160642e-07, + "loss": 1.4006, + "step": 137 + }, + { + "epoch": 0.0, + "learning_rate": 6.927710843373495e-07, + "loss": 1.1896, + "step": 138 + }, + { + "epoch": 0.0, + "learning_rate": 6.977911646586345e-07, + "loss": 1.2017, + "step": 139 + }, + { + "epoch": 0.0, + "learning_rate": 7.028112449799197e-07, + "loss": 1.0653, + "step": 140 + }, + { + "epoch": 0.0, + "learning_rate": 7.07831325301205e-07, + "loss": 1.3293, + "step": 141 + }, + { + "epoch": 0.0, + "learning_rate": 7.1285140562249e-07, + "loss": 1.3657, + "step": 142 + }, + { + "epoch": 0.0, + "learning_rate": 7.178714859437752e-07, + "loss": 1.1977, + "step": 143 + }, + { + "epoch": 0.0, + "learning_rate": 7.228915662650602e-07, + "loss": 1.3591, + "step": 144 + }, + { + "epoch": 0.0, + "learning_rate": 7.279116465863455e-07, + "loss": 1.2922, + "step": 145 + }, + { + "epoch": 0.0, + "learning_rate": 7.329317269076305e-07, + "loss": 1.3021, + "step": 146 + }, + { + "epoch": 0.0, + "learning_rate": 7.379518072289157e-07, + "loss": 1.2247, + "step": 147 + }, + { + "epoch": 0.0, + "learning_rate": 7.429718875502008e-07, + "loss": 1.2728, + "step": 148 + }, + { + "epoch": 0.0, + "learning_rate": 7.47991967871486e-07, + "loss": 1.2058, + "step": 149 + }, + { + "epoch": 0.0, + "learning_rate": 7.530120481927713e-07, + "loss": 1.2694, + "step": 150 + }, + { + "epoch": 0.0, + "learning_rate": 7.580321285140563e-07, + "loss": 1.2841, + "step": 151 + }, + { + "epoch": 0.0, + "learning_rate": 7.630522088353415e-07, + "loss": 1.2338, + "step": 152 + }, + { + "epoch": 0.0, + "learning_rate": 7.680722891566265e-07, + "loss": 1.1969, + "step": 153 + }, + { + "epoch": 0.0, + "learning_rate": 7.730923694779118e-07, + "loss": 1.1537, + "step": 154 + }, + { + "epoch": 0.0, + "learning_rate": 7.781124497991968e-07, + "loss": 1.2491, + "step": 155 + }, + { + "epoch": 0.0, + "learning_rate": 7.83132530120482e-07, + "loss": 1.2469, + "step": 156 + }, + { + "epoch": 0.0, + "learning_rate": 7.88152610441767e-07, + "loss": 1.302, + "step": 157 + }, + { + "epoch": 0.0, + "learning_rate": 7.931726907630523e-07, + "loss": 1.1821, + "step": 158 + }, + { + "epoch": 0.0, + "learning_rate": 7.981927710843373e-07, + "loss": 1.1961, + "step": 159 + }, + { + "epoch": 0.0, + "learning_rate": 8.032128514056225e-07, + "loss": 1.2323, + "step": 160 + }, + { + "epoch": 0.0, + "learning_rate": 8.082329317269078e-07, + "loss": 1.1526, + "step": 161 + }, + { + "epoch": 0.0, + "learning_rate": 8.132530120481928e-07, + "loss": 1.2313, + "step": 162 + }, + { + "epoch": 0.0, + "learning_rate": 8.182730923694781e-07, + "loss": 1.2028, + "step": 163 + }, + { + "epoch": 0.0, + "learning_rate": 8.232931726907631e-07, + "loss": 1.4237, + "step": 164 + }, + { + "epoch": 0.0, + "learning_rate": 8.283132530120483e-07, + "loss": 1.1572, + "step": 165 + }, + { + "epoch": 0.01, + "learning_rate": 8.333333333333333e-07, + "loss": 1.2743, + "step": 166 + }, + { + "epoch": 0.01, + "learning_rate": 8.383534136546186e-07, + "loss": 1.1199, + "step": 167 + }, + { + "epoch": 0.01, + "learning_rate": 8.433734939759036e-07, + "loss": 1.2889, + "step": 168 + }, + { + "epoch": 0.01, + "learning_rate": 8.483935742971888e-07, + "loss": 1.281, + "step": 169 + }, + { + "epoch": 0.01, + "learning_rate": 8.534136546184741e-07, + "loss": 1.2972, + "step": 170 + }, + { + "epoch": 0.01, + "learning_rate": 8.584337349397591e-07, + "loss": 1.2623, + "step": 171 + }, + { + "epoch": 0.01, + "learning_rate": 8.634538152610443e-07, + "loss": 1.2565, + "step": 172 + }, + { + "epoch": 0.01, + "learning_rate": 8.684738955823293e-07, + "loss": 1.2812, + "step": 173 + }, + { + "epoch": 0.01, + "learning_rate": 8.734939759036146e-07, + "loss": 1.2247, + "step": 174 + }, + { + "epoch": 0.01, + "learning_rate": 8.785140562248996e-07, + "loss": 1.3257, + "step": 175 + }, + { + "epoch": 0.01, + "learning_rate": 8.835341365461848e-07, + "loss": 1.3358, + "step": 176 + }, + { + "epoch": 0.01, + "learning_rate": 8.885542168674699e-07, + "loss": 1.3177, + "step": 177 + }, + { + "epoch": 0.01, + "learning_rate": 8.935742971887551e-07, + "loss": 1.2667, + "step": 178 + }, + { + "epoch": 0.01, + "learning_rate": 8.985943775100401e-07, + "loss": 1.2096, + "step": 179 + }, + { + "epoch": 0.01, + "learning_rate": 9.036144578313254e-07, + "loss": 1.2301, + "step": 180 + }, + { + "epoch": 0.01, + "learning_rate": 9.086345381526106e-07, + "loss": 1.2493, + "step": 181 + }, + { + "epoch": 0.01, + "learning_rate": 9.136546184738956e-07, + "loss": 1.1779, + "step": 182 + }, + { + "epoch": 0.01, + "learning_rate": 9.186746987951809e-07, + "loss": 1.1583, + "step": 183 + }, + { + "epoch": 0.01, + "learning_rate": 9.236947791164659e-07, + "loss": 1.2643, + "step": 184 + }, + { + "epoch": 0.01, + "learning_rate": 9.287148594377511e-07, + "loss": 1.1299, + "step": 185 + }, + { + "epoch": 0.01, + "learning_rate": 9.337349397590361e-07, + "loss": 1.2518, + "step": 186 + }, + { + "epoch": 0.01, + "learning_rate": 9.387550200803214e-07, + "loss": 1.2502, + "step": 187 + }, + { + "epoch": 0.01, + "learning_rate": 9.437751004016064e-07, + "loss": 1.1628, + "step": 188 + }, + { + "epoch": 0.01, + "learning_rate": 9.487951807228916e-07, + "loss": 1.2582, + "step": 189 + }, + { + "epoch": 0.01, + "learning_rate": 9.538152610441769e-07, + "loss": 1.2424, + "step": 190 + }, + { + "epoch": 0.01, + "learning_rate": 9.58835341365462e-07, + "loss": 1.2504, + "step": 191 + }, + { + "epoch": 0.01, + "learning_rate": 9.638554216867472e-07, + "loss": 1.2153, + "step": 192 + }, + { + "epoch": 0.01, + "learning_rate": 9.688755020080322e-07, + "loss": 1.3019, + "step": 193 + }, + { + "epoch": 0.01, + "learning_rate": 9.738955823293175e-07, + "loss": 1.1819, + "step": 194 + }, + { + "epoch": 0.01, + "learning_rate": 9.789156626506025e-07, + "loss": 1.2485, + "step": 195 + }, + { + "epoch": 0.01, + "learning_rate": 9.839357429718876e-07, + "loss": 1.272, + "step": 196 + }, + { + "epoch": 0.01, + "learning_rate": 9.889558232931726e-07, + "loss": 1.257, + "step": 197 + }, + { + "epoch": 0.01, + "learning_rate": 9.93975903614458e-07, + "loss": 1.2561, + "step": 198 + }, + { + "epoch": 0.01, + "learning_rate": 9.98995983935743e-07, + "loss": 1.1905, + "step": 199 + }, + { + "epoch": 0.01, + "learning_rate": 1.0040160642570282e-06, + "loss": 1.1709, + "step": 200 + }, + { + "epoch": 0.01, + "learning_rate": 1.0090361445783135e-06, + "loss": 1.3597, + "step": 201 + }, + { + "epoch": 0.01, + "learning_rate": 1.0140562248995985e-06, + "loss": 1.1508, + "step": 202 + }, + { + "epoch": 0.01, + "learning_rate": 1.0190763052208836e-06, + "loss": 1.2331, + "step": 203 + }, + { + "epoch": 0.01, + "learning_rate": 1.0240963855421688e-06, + "loss": 1.2838, + "step": 204 + }, + { + "epoch": 0.01, + "learning_rate": 1.0291164658634539e-06, + "loss": 1.1999, + "step": 205 + }, + { + "epoch": 0.01, + "learning_rate": 1.034136546184739e-06, + "loss": 1.1559, + "step": 206 + }, + { + "epoch": 0.01, + "learning_rate": 1.0391566265060242e-06, + "loss": 1.2174, + "step": 207 + }, + { + "epoch": 0.01, + "learning_rate": 1.0441767068273092e-06, + "loss": 1.2364, + "step": 208 + }, + { + "epoch": 0.01, + "learning_rate": 1.0491967871485945e-06, + "loss": 1.1697, + "step": 209 + }, + { + "epoch": 0.01, + "learning_rate": 1.0542168674698798e-06, + "loss": 1.1979, + "step": 210 + }, + { + "epoch": 0.01, + "learning_rate": 1.0592369477911648e-06, + "loss": 1.1682, + "step": 211 + }, + { + "epoch": 0.01, + "learning_rate": 1.0642570281124499e-06, + "loss": 1.2386, + "step": 212 + }, + { + "epoch": 0.01, + "learning_rate": 1.069277108433735e-06, + "loss": 1.2647, + "step": 213 + }, + { + "epoch": 0.01, + "learning_rate": 1.0742971887550202e-06, + "loss": 1.2115, + "step": 214 + }, + { + "epoch": 0.01, + "learning_rate": 1.0793172690763052e-06, + "loss": 1.1761, + "step": 215 + }, + { + "epoch": 0.01, + "learning_rate": 1.0843373493975905e-06, + "loss": 1.1451, + "step": 216 + }, + { + "epoch": 0.01, + "learning_rate": 1.0893574297188755e-06, + "loss": 1.1812, + "step": 217 + }, + { + "epoch": 0.01, + "learning_rate": 1.0943775100401608e-06, + "loss": 1.2293, + "step": 218 + }, + { + "epoch": 0.01, + "learning_rate": 1.0993975903614459e-06, + "loss": 1.0367, + "step": 219 + }, + { + "epoch": 0.01, + "learning_rate": 1.1044176706827311e-06, + "loss": 1.2104, + "step": 220 + }, + { + "epoch": 0.01, + "learning_rate": 1.1094377510040162e-06, + "loss": 1.2677, + "step": 221 + }, + { + "epoch": 0.01, + "learning_rate": 1.1144578313253012e-06, + "loss": 1.2855, + "step": 222 + }, + { + "epoch": 0.01, + "learning_rate": 1.1194779116465865e-06, + "loss": 1.2546, + "step": 223 + }, + { + "epoch": 0.01, + "learning_rate": 1.1244979919678715e-06, + "loss": 1.2147, + "step": 224 + }, + { + "epoch": 0.01, + "learning_rate": 1.1295180722891568e-06, + "loss": 1.27, + "step": 225 + }, + { + "epoch": 0.01, + "learning_rate": 1.1345381526104418e-06, + "loss": 1.3188, + "step": 226 + }, + { + "epoch": 0.01, + "learning_rate": 1.139558232931727e-06, + "loss": 1.1672, + "step": 227 + }, + { + "epoch": 0.01, + "learning_rate": 1.1445783132530121e-06, + "loss": 1.2582, + "step": 228 + }, + { + "epoch": 0.01, + "learning_rate": 1.1495983935742972e-06, + "loss": 1.2856, + "step": 229 + }, + { + "epoch": 0.01, + "learning_rate": 1.1546184738955825e-06, + "loss": 1.1485, + "step": 230 + }, + { + "epoch": 0.01, + "learning_rate": 1.1596385542168675e-06, + "loss": 1.3519, + "step": 231 + }, + { + "epoch": 0.01, + "learning_rate": 1.1646586345381528e-06, + "loss": 1.1606, + "step": 232 + }, + { + "epoch": 0.01, + "learning_rate": 1.1696787148594378e-06, + "loss": 1.2258, + "step": 233 + }, + { + "epoch": 0.01, + "learning_rate": 1.174698795180723e-06, + "loss": 1.2924, + "step": 234 + }, + { + "epoch": 0.01, + "learning_rate": 1.1797188755020081e-06, + "loss": 1.1928, + "step": 235 + }, + { + "epoch": 0.01, + "learning_rate": 1.1847389558232934e-06, + "loss": 1.1589, + "step": 236 + }, + { + "epoch": 0.01, + "learning_rate": 1.1897590361445784e-06, + "loss": 1.2564, + "step": 237 + }, + { + "epoch": 0.01, + "learning_rate": 1.1947791164658635e-06, + "loss": 1.2231, + "step": 238 + }, + { + "epoch": 0.01, + "learning_rate": 1.1997991967871485e-06, + "loss": 1.2137, + "step": 239 + }, + { + "epoch": 0.01, + "learning_rate": 1.2048192771084338e-06, + "loss": 1.2245, + "step": 240 + }, + { + "epoch": 0.01, + "learning_rate": 1.209839357429719e-06, + "loss": 1.223, + "step": 241 + }, + { + "epoch": 0.01, + "learning_rate": 1.2148594377510041e-06, + "loss": 1.1696, + "step": 242 + }, + { + "epoch": 0.01, + "learning_rate": 1.2198795180722894e-06, + "loss": 1.1564, + "step": 243 + }, + { + "epoch": 0.01, + "learning_rate": 1.2248995983935744e-06, + "loss": 1.2292, + "step": 244 + }, + { + "epoch": 0.01, + "learning_rate": 1.2299196787148595e-06, + "loss": 1.2714, + "step": 245 + }, + { + "epoch": 0.01, + "learning_rate": 1.2349397590361445e-06, + "loss": 1.0826, + "step": 246 + }, + { + "epoch": 0.01, + "learning_rate": 1.2399598393574298e-06, + "loss": 1.2193, + "step": 247 + }, + { + "epoch": 0.01, + "learning_rate": 1.2449799196787148e-06, + "loss": 1.1747, + "step": 248 + }, + { + "epoch": 0.01, + "learning_rate": 1.25e-06, + "loss": 1.2124, + "step": 249 + }, + { + "epoch": 0.01, + "learning_rate": 1.2550200803212854e-06, + "loss": 1.2631, + "step": 250 + }, + { + "epoch": 0.01, + "learning_rate": 1.2600401606425704e-06, + "loss": 1.2247, + "step": 251 + }, + { + "epoch": 0.01, + "learning_rate": 1.2650602409638555e-06, + "loss": 1.215, + "step": 252 + }, + { + "epoch": 0.01, + "learning_rate": 1.2700803212851407e-06, + "loss": 1.2162, + "step": 253 + }, + { + "epoch": 0.01, + "learning_rate": 1.2751004016064258e-06, + "loss": 1.3363, + "step": 254 + }, + { + "epoch": 0.01, + "learning_rate": 1.280120481927711e-06, + "loss": 1.2678, + "step": 255 + }, + { + "epoch": 0.01, + "learning_rate": 1.2851405622489959e-06, + "loss": 1.2551, + "step": 256 + }, + { + "epoch": 0.01, + "learning_rate": 1.2901606425702811e-06, + "loss": 1.2805, + "step": 257 + }, + { + "epoch": 0.01, + "learning_rate": 1.2951807228915664e-06, + "loss": 1.2622, + "step": 258 + }, + { + "epoch": 0.01, + "learning_rate": 1.3002008032128517e-06, + "loss": 1.1876, + "step": 259 + }, + { + "epoch": 0.01, + "learning_rate": 1.3052208835341367e-06, + "loss": 1.2773, + "step": 260 + }, + { + "epoch": 0.01, + "learning_rate": 1.3102409638554218e-06, + "loss": 1.2065, + "step": 261 + }, + { + "epoch": 0.01, + "learning_rate": 1.3152610441767068e-06, + "loss": 1.256, + "step": 262 + }, + { + "epoch": 0.01, + "learning_rate": 1.320281124497992e-06, + "loss": 1.2609, + "step": 263 + }, + { + "epoch": 0.01, + "learning_rate": 1.3253012048192773e-06, + "loss": 1.152, + "step": 264 + }, + { + "epoch": 0.01, + "learning_rate": 1.3303212851405622e-06, + "loss": 1.1904, + "step": 265 + }, + { + "epoch": 0.01, + "learning_rate": 1.3353413654618474e-06, + "loss": 1.095, + "step": 266 + }, + { + "epoch": 0.01, + "learning_rate": 1.3403614457831327e-06, + "loss": 1.0817, + "step": 267 + }, + { + "epoch": 0.01, + "learning_rate": 1.345381526104418e-06, + "loss": 1.2191, + "step": 268 + }, + { + "epoch": 0.01, + "learning_rate": 1.350401606425703e-06, + "loss": 1.257, + "step": 269 + }, + { + "epoch": 0.01, + "learning_rate": 1.355421686746988e-06, + "loss": 1.2578, + "step": 270 + }, + { + "epoch": 0.01, + "learning_rate": 1.3604417670682731e-06, + "loss": 1.0878, + "step": 271 + }, + { + "epoch": 0.01, + "learning_rate": 1.3654618473895584e-06, + "loss": 1.1508, + "step": 272 + }, + { + "epoch": 0.01, + "learning_rate": 1.3704819277108436e-06, + "loss": 1.141, + "step": 273 + }, + { + "epoch": 0.01, + "learning_rate": 1.3755020080321285e-06, + "loss": 1.3189, + "step": 274 + }, + { + "epoch": 0.01, + "learning_rate": 1.3805220883534137e-06, + "loss": 1.3882, + "step": 275 + }, + { + "epoch": 0.01, + "learning_rate": 1.385542168674699e-06, + "loss": 1.2175, + "step": 276 + }, + { + "epoch": 0.01, + "learning_rate": 1.390562248995984e-06, + "loss": 1.2643, + "step": 277 + }, + { + "epoch": 0.01, + "learning_rate": 1.395582329317269e-06, + "loss": 1.1188, + "step": 278 + }, + { + "epoch": 0.01, + "learning_rate": 1.4006024096385544e-06, + "loss": 1.1735, + "step": 279 + }, + { + "epoch": 0.01, + "learning_rate": 1.4056224899598394e-06, + "loss": 1.2126, + "step": 280 + }, + { + "epoch": 0.01, + "learning_rate": 1.4106425702811247e-06, + "loss": 1.1843, + "step": 281 + }, + { + "epoch": 0.01, + "learning_rate": 1.41566265060241e-06, + "loss": 1.1759, + "step": 282 + }, + { + "epoch": 0.01, + "learning_rate": 1.4206827309236948e-06, + "loss": 1.2499, + "step": 283 + }, + { + "epoch": 0.01, + "learning_rate": 1.42570281124498e-06, + "loss": 1.2172, + "step": 284 + }, + { + "epoch": 0.01, + "learning_rate": 1.4307228915662653e-06, + "loss": 1.1891, + "step": 285 + }, + { + "epoch": 0.01, + "learning_rate": 1.4357429718875503e-06, + "loss": 1.2121, + "step": 286 + }, + { + "epoch": 0.01, + "learning_rate": 1.4407630522088354e-06, + "loss": 1.2007, + "step": 287 + }, + { + "epoch": 0.01, + "learning_rate": 1.4457831325301204e-06, + "loss": 1.3286, + "step": 288 + }, + { + "epoch": 0.01, + "learning_rate": 1.4508032128514057e-06, + "loss": 1.1889, + "step": 289 + }, + { + "epoch": 0.01, + "learning_rate": 1.455823293172691e-06, + "loss": 1.1826, + "step": 290 + }, + { + "epoch": 0.01, + "learning_rate": 1.4608433734939762e-06, + "loss": 1.2377, + "step": 291 + }, + { + "epoch": 0.01, + "learning_rate": 1.465863453815261e-06, + "loss": 1.1615, + "step": 292 + }, + { + "epoch": 0.01, + "learning_rate": 1.4708835341365463e-06, + "loss": 1.1628, + "step": 293 + }, + { + "epoch": 0.01, + "learning_rate": 1.4759036144578314e-06, + "loss": 1.2023, + "step": 294 + }, + { + "epoch": 0.01, + "learning_rate": 1.4809236947791166e-06, + "loss": 1.2427, + "step": 295 + }, + { + "epoch": 0.01, + "learning_rate": 1.4859437751004017e-06, + "loss": 1.3179, + "step": 296 + }, + { + "epoch": 0.01, + "learning_rate": 1.4909638554216867e-06, + "loss": 1.2139, + "step": 297 + }, + { + "epoch": 0.01, + "learning_rate": 1.495983935742972e-06, + "loss": 1.163, + "step": 298 + }, + { + "epoch": 0.01, + "learning_rate": 1.5010040160642573e-06, + "loss": 1.2454, + "step": 299 + }, + { + "epoch": 0.01, + "learning_rate": 1.5060240963855425e-06, + "loss": 1.2241, + "step": 300 + }, + { + "epoch": 0.01, + "learning_rate": 1.5110441767068274e-06, + "loss": 1.1454, + "step": 301 + }, + { + "epoch": 0.01, + "learning_rate": 1.5160642570281126e-06, + "loss": 1.0392, + "step": 302 + }, + { + "epoch": 0.01, + "learning_rate": 1.5210843373493977e-06, + "loss": 1.1556, + "step": 303 + }, + { + "epoch": 0.01, + "learning_rate": 1.526104417670683e-06, + "loss": 1.1982, + "step": 304 + }, + { + "epoch": 0.01, + "learning_rate": 1.531124497991968e-06, + "loss": 1.1326, + "step": 305 + }, + { + "epoch": 0.01, + "learning_rate": 1.536144578313253e-06, + "loss": 1.2527, + "step": 306 + }, + { + "epoch": 0.01, + "learning_rate": 1.5411646586345383e-06, + "loss": 1.2538, + "step": 307 + }, + { + "epoch": 0.01, + "learning_rate": 1.5461847389558236e-06, + "loss": 1.2006, + "step": 308 + }, + { + "epoch": 0.01, + "learning_rate": 1.5512048192771086e-06, + "loss": 1.1517, + "step": 309 + }, + { + "epoch": 0.01, + "learning_rate": 1.5562248995983937e-06, + "loss": 1.2192, + "step": 310 + }, + { + "epoch": 0.01, + "learning_rate": 1.561244979919679e-06, + "loss": 1.2582, + "step": 311 + }, + { + "epoch": 0.01, + "learning_rate": 1.566265060240964e-06, + "loss": 1.3518, + "step": 312 + }, + { + "epoch": 0.01, + "learning_rate": 1.5712851405622492e-06, + "loss": 1.2488, + "step": 313 + }, + { + "epoch": 0.01, + "learning_rate": 1.576305220883534e-06, + "loss": 1.1938, + "step": 314 + }, + { + "epoch": 0.01, + "learning_rate": 1.5813253012048193e-06, + "loss": 1.09, + "step": 315 + }, + { + "epoch": 0.01, + "learning_rate": 1.5863453815261046e-06, + "loss": 1.3279, + "step": 316 + }, + { + "epoch": 0.01, + "learning_rate": 1.5913654618473899e-06, + "loss": 1.2167, + "step": 317 + }, + { + "epoch": 0.01, + "learning_rate": 1.5963855421686747e-06, + "loss": 1.2066, + "step": 318 + }, + { + "epoch": 0.01, + "learning_rate": 1.60140562248996e-06, + "loss": 1.1867, + "step": 319 + }, + { + "epoch": 0.01, + "learning_rate": 1.606425702811245e-06, + "loss": 1.2032, + "step": 320 + }, + { + "epoch": 0.01, + "learning_rate": 1.6114457831325303e-06, + "loss": 1.2404, + "step": 321 + }, + { + "epoch": 0.01, + "learning_rate": 1.6164658634538155e-06, + "loss": 1.2045, + "step": 322 + }, + { + "epoch": 0.01, + "learning_rate": 1.6214859437751004e-06, + "loss": 1.1906, + "step": 323 + }, + { + "epoch": 0.01, + "learning_rate": 1.6265060240963856e-06, + "loss": 1.1741, + "step": 324 + }, + { + "epoch": 0.01, + "learning_rate": 1.6315261044176709e-06, + "loss": 1.1714, + "step": 325 + }, + { + "epoch": 0.01, + "learning_rate": 1.6365461847389562e-06, + "loss": 1.185, + "step": 326 + }, + { + "epoch": 0.01, + "learning_rate": 1.641566265060241e-06, + "loss": 1.1835, + "step": 327 + }, + { + "epoch": 0.01, + "learning_rate": 1.6465863453815263e-06, + "loss": 1.1339, + "step": 328 + }, + { + "epoch": 0.01, + "learning_rate": 1.6516064257028113e-06, + "loss": 1.1839, + "step": 329 + }, + { + "epoch": 0.01, + "learning_rate": 1.6566265060240966e-06, + "loss": 1.1918, + "step": 330 + }, + { + "epoch": 0.01, + "learning_rate": 1.6616465863453818e-06, + "loss": 1.2167, + "step": 331 + }, + { + "epoch": 0.01, + "learning_rate": 1.6666666666666667e-06, + "loss": 1.1165, + "step": 332 + }, + { + "epoch": 0.01, + "learning_rate": 1.671686746987952e-06, + "loss": 1.131, + "step": 333 + }, + { + "epoch": 0.01, + "learning_rate": 1.6767068273092372e-06, + "loss": 1.2279, + "step": 334 + }, + { + "epoch": 0.01, + "learning_rate": 1.6817269076305222e-06, + "loss": 1.0715, + "step": 335 + }, + { + "epoch": 0.01, + "learning_rate": 1.6867469879518073e-06, + "loss": 1.2137, + "step": 336 + }, + { + "epoch": 0.01, + "learning_rate": 1.6917670682730925e-06, + "loss": 1.291, + "step": 337 + }, + { + "epoch": 0.01, + "learning_rate": 1.6967871485943776e-06, + "loss": 1.1602, + "step": 338 + }, + { + "epoch": 0.01, + "learning_rate": 1.7018072289156629e-06, + "loss": 1.2395, + "step": 339 + }, + { + "epoch": 0.01, + "learning_rate": 1.7068273092369481e-06, + "loss": 1.1719, + "step": 340 + }, + { + "epoch": 0.01, + "learning_rate": 1.711847389558233e-06, + "loss": 1.2139, + "step": 341 + }, + { + "epoch": 0.01, + "learning_rate": 1.7168674698795182e-06, + "loss": 1.1998, + "step": 342 + }, + { + "epoch": 0.01, + "learning_rate": 1.7218875502008035e-06, + "loss": 1.2675, + "step": 343 + }, + { + "epoch": 0.01, + "learning_rate": 1.7269076305220885e-06, + "loss": 1.2324, + "step": 344 + }, + { + "epoch": 0.01, + "learning_rate": 1.7319277108433736e-06, + "loss": 1.2469, + "step": 345 + }, + { + "epoch": 0.01, + "learning_rate": 1.7369477911646586e-06, + "loss": 1.1636, + "step": 346 + }, + { + "epoch": 0.01, + "learning_rate": 1.7419678714859439e-06, + "loss": 1.1909, + "step": 347 + }, + { + "epoch": 0.01, + "learning_rate": 1.7469879518072292e-06, + "loss": 1.2151, + "step": 348 + }, + { + "epoch": 0.01, + "learning_rate": 1.7520080321285144e-06, + "loss": 1.1005, + "step": 349 + }, + { + "epoch": 0.01, + "learning_rate": 1.7570281124497993e-06, + "loss": 1.2531, + "step": 350 + }, + { + "epoch": 0.01, + "learning_rate": 1.7620481927710845e-06, + "loss": 1.1937, + "step": 351 + }, + { + "epoch": 0.01, + "learning_rate": 1.7670682730923696e-06, + "loss": 1.0992, + "step": 352 + }, + { + "epoch": 0.01, + "learning_rate": 1.7720883534136548e-06, + "loss": 1.1724, + "step": 353 + }, + { + "epoch": 0.01, + "learning_rate": 1.7771084337349399e-06, + "loss": 1.2111, + "step": 354 + }, + { + "epoch": 0.01, + "learning_rate": 1.782128514056225e-06, + "loss": 1.2114, + "step": 355 + }, + { + "epoch": 0.01, + "learning_rate": 1.7871485943775102e-06, + "loss": 1.2166, + "step": 356 + }, + { + "epoch": 0.01, + "learning_rate": 1.7921686746987955e-06, + "loss": 1.3374, + "step": 357 + }, + { + "epoch": 0.01, + "learning_rate": 1.7971887550200803e-06, + "loss": 1.2357, + "step": 358 + }, + { + "epoch": 0.01, + "learning_rate": 1.8022088353413656e-06, + "loss": 1.1055, + "step": 359 + }, + { + "epoch": 0.01, + "learning_rate": 1.8072289156626508e-06, + "loss": 1.2325, + "step": 360 + }, + { + "epoch": 0.01, + "learning_rate": 1.8122489959839359e-06, + "loss": 1.2216, + "step": 361 + }, + { + "epoch": 0.01, + "learning_rate": 1.8172690763052211e-06, + "loss": 1.3123, + "step": 362 + }, + { + "epoch": 0.01, + "learning_rate": 1.8222891566265062e-06, + "loss": 1.118, + "step": 363 + }, + { + "epoch": 0.01, + "learning_rate": 1.8273092369477912e-06, + "loss": 1.2112, + "step": 364 + }, + { + "epoch": 0.01, + "learning_rate": 1.8323293172690765e-06, + "loss": 1.1956, + "step": 365 + }, + { + "epoch": 0.01, + "learning_rate": 1.8373493975903617e-06, + "loss": 1.2161, + "step": 366 + }, + { + "epoch": 0.01, + "learning_rate": 1.8423694779116466e-06, + "loss": 1.1689, + "step": 367 + }, + { + "epoch": 0.01, + "learning_rate": 1.8473895582329318e-06, + "loss": 1.1291, + "step": 368 + }, + { + "epoch": 0.01, + "learning_rate": 1.8524096385542171e-06, + "loss": 1.0608, + "step": 369 + }, + { + "epoch": 0.01, + "learning_rate": 1.8574297188755022e-06, + "loss": 1.1381, + "step": 370 + }, + { + "epoch": 0.01, + "learning_rate": 1.8624497991967874e-06, + "loss": 1.0233, + "step": 371 + }, + { + "epoch": 0.01, + "learning_rate": 1.8674698795180723e-06, + "loss": 1.2103, + "step": 372 + }, + { + "epoch": 0.01, + "learning_rate": 1.8724899598393575e-06, + "loss": 1.0747, + "step": 373 + }, + { + "epoch": 0.01, + "learning_rate": 1.8775100401606428e-06, + "loss": 1.3341, + "step": 374 + }, + { + "epoch": 0.01, + "learning_rate": 1.882530120481928e-06, + "loss": 1.105, + "step": 375 + }, + { + "epoch": 0.01, + "learning_rate": 1.8875502008032129e-06, + "loss": 1.1721, + "step": 376 + }, + { + "epoch": 0.01, + "learning_rate": 1.8925702811244981e-06, + "loss": 1.2074, + "step": 377 + }, + { + "epoch": 0.01, + "learning_rate": 1.8975903614457832e-06, + "loss": 1.1992, + "step": 378 + }, + { + "epoch": 0.01, + "learning_rate": 1.9026104417670685e-06, + "loss": 1.3135, + "step": 379 + }, + { + "epoch": 0.01, + "learning_rate": 1.9076305220883537e-06, + "loss": 1.2535, + "step": 380 + }, + { + "epoch": 0.01, + "learning_rate": 1.9126506024096388e-06, + "loss": 1.1398, + "step": 381 + }, + { + "epoch": 0.01, + "learning_rate": 1.917670682730924e-06, + "loss": 1.2048, + "step": 382 + }, + { + "epoch": 0.01, + "learning_rate": 1.922690763052209e-06, + "loss": 1.2257, + "step": 383 + }, + { + "epoch": 0.01, + "learning_rate": 1.9277108433734943e-06, + "loss": 1.1011, + "step": 384 + }, + { + "epoch": 0.01, + "learning_rate": 1.932730923694779e-06, + "loss": 1.2583, + "step": 385 + }, + { + "epoch": 0.01, + "learning_rate": 1.9377510040160644e-06, + "loss": 1.1926, + "step": 386 + }, + { + "epoch": 0.01, + "learning_rate": 1.9427710843373495e-06, + "loss": 1.1757, + "step": 387 + }, + { + "epoch": 0.01, + "learning_rate": 1.947791164658635e-06, + "loss": 1.2224, + "step": 388 + }, + { + "epoch": 0.01, + "learning_rate": 1.95281124497992e-06, + "loss": 1.1533, + "step": 389 + }, + { + "epoch": 0.01, + "learning_rate": 1.957831325301205e-06, + "loss": 1.2163, + "step": 390 + }, + { + "epoch": 0.01, + "learning_rate": 1.96285140562249e-06, + "loss": 1.2047, + "step": 391 + }, + { + "epoch": 0.01, + "learning_rate": 1.967871485943775e-06, + "loss": 1.1746, + "step": 392 + }, + { + "epoch": 0.01, + "learning_rate": 1.9728915662650606e-06, + "loss": 1.1678, + "step": 393 + }, + { + "epoch": 0.01, + "learning_rate": 1.9779116465863453e-06, + "loss": 1.1834, + "step": 394 + }, + { + "epoch": 0.01, + "learning_rate": 1.9829317269076307e-06, + "loss": 1.2194, + "step": 395 + }, + { + "epoch": 0.01, + "learning_rate": 1.987951807228916e-06, + "loss": 1.1625, + "step": 396 + }, + { + "epoch": 0.01, + "learning_rate": 1.992971887550201e-06, + "loss": 1.1104, + "step": 397 + }, + { + "epoch": 0.01, + "learning_rate": 1.997991967871486e-06, + "loss": 1.1923, + "step": 398 + }, + { + "epoch": 0.01, + "learning_rate": 2.0030120481927714e-06, + "loss": 1.2935, + "step": 399 + }, + { + "epoch": 0.01, + "learning_rate": 2.0080321285140564e-06, + "loss": 1.1905, + "step": 400 + }, + { + "epoch": 0.01, + "learning_rate": 2.0130522088353415e-06, + "loss": 1.2489, + "step": 401 + }, + { + "epoch": 0.01, + "learning_rate": 2.018072289156627e-06, + "loss": 1.2571, + "step": 402 + }, + { + "epoch": 0.01, + "learning_rate": 2.0230923694779116e-06, + "loss": 0.9643, + "step": 403 + }, + { + "epoch": 0.01, + "learning_rate": 2.028112449799197e-06, + "loss": 1.1662, + "step": 404 + }, + { + "epoch": 0.01, + "learning_rate": 2.033132530120482e-06, + "loss": 1.2767, + "step": 405 + }, + { + "epoch": 0.01, + "learning_rate": 2.038152610441767e-06, + "loss": 1.1814, + "step": 406 + }, + { + "epoch": 0.01, + "learning_rate": 2.043172690763052e-06, + "loss": 1.2408, + "step": 407 + }, + { + "epoch": 0.01, + "learning_rate": 2.0481927710843377e-06, + "loss": 1.1976, + "step": 408 + }, + { + "epoch": 0.01, + "learning_rate": 2.0532128514056227e-06, + "loss": 1.1796, + "step": 409 + }, + { + "epoch": 0.01, + "learning_rate": 2.0582329317269078e-06, + "loss": 1.1853, + "step": 410 + }, + { + "epoch": 0.01, + "learning_rate": 2.0632530120481932e-06, + "loss": 1.215, + "step": 411 + }, + { + "epoch": 0.01, + "learning_rate": 2.068273092369478e-06, + "loss": 1.1127, + "step": 412 + }, + { + "epoch": 0.01, + "learning_rate": 2.0732931726907633e-06, + "loss": 1.1558, + "step": 413 + }, + { + "epoch": 0.01, + "learning_rate": 2.0783132530120484e-06, + "loss": 1.1968, + "step": 414 + }, + { + "epoch": 0.01, + "learning_rate": 2.0833333333333334e-06, + "loss": 1.2405, + "step": 415 + }, + { + "epoch": 0.01, + "learning_rate": 2.0883534136546185e-06, + "loss": 1.1862, + "step": 416 + }, + { + "epoch": 0.01, + "learning_rate": 2.0933734939759035e-06, + "loss": 1.25, + "step": 417 + }, + { + "epoch": 0.01, + "learning_rate": 2.098393574297189e-06, + "loss": 1.1277, + "step": 418 + }, + { + "epoch": 0.01, + "learning_rate": 2.103413654618474e-06, + "loss": 1.192, + "step": 419 + }, + { + "epoch": 0.01, + "learning_rate": 2.1084337349397595e-06, + "loss": 1.2454, + "step": 420 + }, + { + "epoch": 0.01, + "learning_rate": 2.113453815261044e-06, + "loss": 1.1712, + "step": 421 + }, + { + "epoch": 0.01, + "learning_rate": 2.1184738955823296e-06, + "loss": 1.2356, + "step": 422 + }, + { + "epoch": 0.01, + "learning_rate": 2.1234939759036147e-06, + "loss": 1.1858, + "step": 423 + }, + { + "epoch": 0.01, + "learning_rate": 2.1285140562248997e-06, + "loss": 1.1556, + "step": 424 + }, + { + "epoch": 0.01, + "learning_rate": 2.1335341365461848e-06, + "loss": 1.3066, + "step": 425 + }, + { + "epoch": 0.01, + "learning_rate": 2.13855421686747e-06, + "loss": 1.1935, + "step": 426 + }, + { + "epoch": 0.01, + "learning_rate": 2.1435742971887553e-06, + "loss": 1.0922, + "step": 427 + }, + { + "epoch": 0.01, + "learning_rate": 2.1485943775100404e-06, + "loss": 1.0898, + "step": 428 + }, + { + "epoch": 0.01, + "learning_rate": 2.1536144578313254e-06, + "loss": 1.1514, + "step": 429 + }, + { + "epoch": 0.01, + "learning_rate": 2.1586345381526105e-06, + "loss": 1.3051, + "step": 430 + }, + { + "epoch": 0.01, + "learning_rate": 2.163654618473896e-06, + "loss": 1.2433, + "step": 431 + }, + { + "epoch": 0.01, + "learning_rate": 2.168674698795181e-06, + "loss": 1.1556, + "step": 432 + }, + { + "epoch": 0.01, + "learning_rate": 2.173694779116466e-06, + "loss": 1.1682, + "step": 433 + }, + { + "epoch": 0.01, + "learning_rate": 2.178714859437751e-06, + "loss": 1.2976, + "step": 434 + }, + { + "epoch": 0.01, + "learning_rate": 2.183734939759036e-06, + "loss": 1.1681, + "step": 435 + }, + { + "epoch": 0.01, + "learning_rate": 2.1887550200803216e-06, + "loss": 1.1198, + "step": 436 + }, + { + "epoch": 0.01, + "learning_rate": 2.1937751004016067e-06, + "loss": 1.3199, + "step": 437 + }, + { + "epoch": 0.01, + "learning_rate": 2.1987951807228917e-06, + "loss": 1.2086, + "step": 438 + }, + { + "epoch": 0.01, + "learning_rate": 2.2038152610441768e-06, + "loss": 1.1592, + "step": 439 + }, + { + "epoch": 0.01, + "learning_rate": 2.2088353413654622e-06, + "loss": 1.1182, + "step": 440 + }, + { + "epoch": 0.01, + "learning_rate": 2.2138554216867473e-06, + "loss": 1.1688, + "step": 441 + }, + { + "epoch": 0.01, + "learning_rate": 2.2188755020080323e-06, + "loss": 1.1967, + "step": 442 + }, + { + "epoch": 0.01, + "learning_rate": 2.2238955823293174e-06, + "loss": 1.1482, + "step": 443 + }, + { + "epoch": 0.01, + "learning_rate": 2.2289156626506024e-06, + "loss": 1.1002, + "step": 444 + }, + { + "epoch": 0.01, + "learning_rate": 2.233935742971888e-06, + "loss": 1.146, + "step": 445 + }, + { + "epoch": 0.01, + "learning_rate": 2.238955823293173e-06, + "loss": 1.204, + "step": 446 + }, + { + "epoch": 0.01, + "learning_rate": 2.243975903614458e-06, + "loss": 1.0905, + "step": 447 + }, + { + "epoch": 0.01, + "learning_rate": 2.248995983935743e-06, + "loss": 1.2334, + "step": 448 + }, + { + "epoch": 0.01, + "learning_rate": 2.254016064257028e-06, + "loss": 1.0965, + "step": 449 + }, + { + "epoch": 0.01, + "learning_rate": 2.2590361445783136e-06, + "loss": 1.2169, + "step": 450 + }, + { + "epoch": 0.01, + "learning_rate": 2.2640562248995986e-06, + "loss": 1.1136, + "step": 451 + }, + { + "epoch": 0.01, + "learning_rate": 2.2690763052208837e-06, + "loss": 1.1423, + "step": 452 + }, + { + "epoch": 0.01, + "learning_rate": 2.2740963855421687e-06, + "loss": 1.2517, + "step": 453 + }, + { + "epoch": 0.01, + "learning_rate": 2.279116465863454e-06, + "loss": 1.2709, + "step": 454 + }, + { + "epoch": 0.01, + "learning_rate": 2.2841365461847392e-06, + "loss": 1.1757, + "step": 455 + }, + { + "epoch": 0.01, + "learning_rate": 2.2891566265060243e-06, + "loss": 1.1052, + "step": 456 + }, + { + "epoch": 0.01, + "learning_rate": 2.2941767068273093e-06, + "loss": 1.1669, + "step": 457 + }, + { + "epoch": 0.01, + "learning_rate": 2.2991967871485944e-06, + "loss": 1.1641, + "step": 458 + }, + { + "epoch": 0.01, + "learning_rate": 2.30421686746988e-06, + "loss": 1.1581, + "step": 459 + }, + { + "epoch": 0.01, + "learning_rate": 2.309236947791165e-06, + "loss": 1.1927, + "step": 460 + }, + { + "epoch": 0.01, + "learning_rate": 2.31425702811245e-06, + "loss": 1.2747, + "step": 461 + }, + { + "epoch": 0.01, + "learning_rate": 2.319277108433735e-06, + "loss": 1.1104, + "step": 462 + }, + { + "epoch": 0.01, + "learning_rate": 2.3242971887550205e-06, + "loss": 1.1898, + "step": 463 + }, + { + "epoch": 0.01, + "learning_rate": 2.3293172690763055e-06, + "loss": 1.2172, + "step": 464 + }, + { + "epoch": 0.01, + "learning_rate": 2.3343373493975906e-06, + "loss": 1.212, + "step": 465 + }, + { + "epoch": 0.01, + "learning_rate": 2.3393574297188756e-06, + "loss": 1.1635, + "step": 466 + }, + { + "epoch": 0.01, + "learning_rate": 2.3443775100401607e-06, + "loss": 1.1473, + "step": 467 + }, + { + "epoch": 0.01, + "learning_rate": 2.349397590361446e-06, + "loss": 1.2173, + "step": 468 + }, + { + "epoch": 0.01, + "learning_rate": 2.3544176706827312e-06, + "loss": 1.0703, + "step": 469 + }, + { + "epoch": 0.01, + "learning_rate": 2.3594377510040163e-06, + "loss": 1.1794, + "step": 470 + }, + { + "epoch": 0.01, + "learning_rate": 2.3644578313253013e-06, + "loss": 1.1543, + "step": 471 + }, + { + "epoch": 0.01, + "learning_rate": 2.3694779116465868e-06, + "loss": 1.0568, + "step": 472 + }, + { + "epoch": 0.01, + "learning_rate": 2.374497991967872e-06, + "loss": 1.2534, + "step": 473 + }, + { + "epoch": 0.01, + "learning_rate": 2.379518072289157e-06, + "loss": 1.2385, + "step": 474 + }, + { + "epoch": 0.01, + "learning_rate": 2.384538152610442e-06, + "loss": 1.1198, + "step": 475 + }, + { + "epoch": 0.01, + "learning_rate": 2.389558232931727e-06, + "loss": 1.1227, + "step": 476 + }, + { + "epoch": 0.01, + "learning_rate": 2.3945783132530125e-06, + "loss": 1.213, + "step": 477 + }, + { + "epoch": 0.01, + "learning_rate": 2.399598393574297e-06, + "loss": 1.1208, + "step": 478 + }, + { + "epoch": 0.01, + "learning_rate": 2.4046184738955826e-06, + "loss": 1.2943, + "step": 479 + }, + { + "epoch": 0.01, + "learning_rate": 2.4096385542168676e-06, + "loss": 1.1614, + "step": 480 + }, + { + "epoch": 0.01, + "learning_rate": 2.4146586345381527e-06, + "loss": 1.2052, + "step": 481 + }, + { + "epoch": 0.01, + "learning_rate": 2.419678714859438e-06, + "loss": 1.0342, + "step": 482 + }, + { + "epoch": 0.01, + "learning_rate": 2.424698795180723e-06, + "loss": 1.1041, + "step": 483 + }, + { + "epoch": 0.01, + "learning_rate": 2.4297188755020082e-06, + "loss": 1.2192, + "step": 484 + }, + { + "epoch": 0.01, + "learning_rate": 2.4347389558232933e-06, + "loss": 1.17, + "step": 485 + }, + { + "epoch": 0.01, + "learning_rate": 2.4397590361445788e-06, + "loss": 1.1792, + "step": 486 + }, + { + "epoch": 0.01, + "learning_rate": 2.4447791164658634e-06, + "loss": 1.2184, + "step": 487 + }, + { + "epoch": 0.01, + "learning_rate": 2.449799196787149e-06, + "loss": 1.0862, + "step": 488 + }, + { + "epoch": 0.01, + "learning_rate": 2.454819277108434e-06, + "loss": 1.1874, + "step": 489 + }, + { + "epoch": 0.01, + "learning_rate": 2.459839357429719e-06, + "loss": 1.1653, + "step": 490 + }, + { + "epoch": 0.01, + "learning_rate": 2.4648594377510044e-06, + "loss": 1.1931, + "step": 491 + }, + { + "epoch": 0.01, + "learning_rate": 2.469879518072289e-06, + "loss": 1.2485, + "step": 492 + }, + { + "epoch": 0.01, + "learning_rate": 2.4748995983935745e-06, + "loss": 1.2372, + "step": 493 + }, + { + "epoch": 0.01, + "learning_rate": 2.4799196787148596e-06, + "loss": 1.2213, + "step": 494 + }, + { + "epoch": 0.01, + "learning_rate": 2.484939759036145e-06, + "loss": 1.1373, + "step": 495 + }, + { + "epoch": 0.01, + "learning_rate": 2.4899598393574297e-06, + "loss": 1.1546, + "step": 496 + }, + { + "epoch": 0.01, + "learning_rate": 2.494979919678715e-06, + "loss": 1.001, + "step": 497 + }, + { + "epoch": 0.02, + "learning_rate": 2.5e-06, + "loss": 1.1764, + "step": 498 + }, + { + "epoch": 0.02, + "learning_rate": 2.5050200803212853e-06, + "loss": 1.2568, + "step": 499 + }, + { + "epoch": 0.02, + "learning_rate": 2.5100401606425707e-06, + "loss": 1.3071, + "step": 500 + }, + { + "epoch": 0.02, + "learning_rate": 2.5150602409638558e-06, + "loss": 1.1647, + "step": 501 + }, + { + "epoch": 0.02, + "learning_rate": 2.520080321285141e-06, + "loss": 1.1989, + "step": 502 + }, + { + "epoch": 0.02, + "learning_rate": 2.525100401606426e-06, + "loss": 1.1036, + "step": 503 + }, + { + "epoch": 0.02, + "learning_rate": 2.530120481927711e-06, + "loss": 1.1436, + "step": 504 + }, + { + "epoch": 0.02, + "learning_rate": 2.535140562248996e-06, + "loss": 1.1364, + "step": 505 + }, + { + "epoch": 0.02, + "learning_rate": 2.5401606425702815e-06, + "loss": 1.2365, + "step": 506 + }, + { + "epoch": 0.02, + "learning_rate": 2.5451807228915665e-06, + "loss": 1.1926, + "step": 507 + }, + { + "epoch": 0.02, + "learning_rate": 2.5502008032128516e-06, + "loss": 1.17, + "step": 508 + }, + { + "epoch": 0.02, + "learning_rate": 2.555220883534137e-06, + "loss": 1.2609, + "step": 509 + }, + { + "epoch": 0.02, + "learning_rate": 2.560240963855422e-06, + "loss": 1.2097, + "step": 510 + }, + { + "epoch": 0.02, + "learning_rate": 2.565261044176707e-06, + "loss": 1.2088, + "step": 511 + }, + { + "epoch": 0.02, + "learning_rate": 2.5702811244979918e-06, + "loss": 1.2088, + "step": 512 + }, + { + "epoch": 0.02, + "learning_rate": 2.5753012048192772e-06, + "loss": 1.2214, + "step": 513 + }, + { + "epoch": 0.02, + "learning_rate": 2.5803212851405623e-06, + "loss": 1.1436, + "step": 514 + }, + { + "epoch": 0.02, + "learning_rate": 2.5853413654618477e-06, + "loss": 1.0466, + "step": 515 + }, + { + "epoch": 0.02, + "learning_rate": 2.590361445783133e-06, + "loss": 1.115, + "step": 516 + }, + { + "epoch": 0.02, + "learning_rate": 2.595381526104418e-06, + "loss": 1.1993, + "step": 517 + }, + { + "epoch": 0.02, + "learning_rate": 2.6004016064257033e-06, + "loss": 1.1859, + "step": 518 + }, + { + "epoch": 0.02, + "learning_rate": 2.6054216867469884e-06, + "loss": 1.1805, + "step": 519 + }, + { + "epoch": 0.02, + "learning_rate": 2.6104417670682734e-06, + "loss": 1.205, + "step": 520 + }, + { + "epoch": 0.02, + "learning_rate": 2.615461847389558e-06, + "loss": 1.2191, + "step": 521 + }, + { + "epoch": 0.02, + "learning_rate": 2.6204819277108435e-06, + "loss": 1.0483, + "step": 522 + }, + { + "epoch": 0.02, + "learning_rate": 2.6255020080321286e-06, + "loss": 1.271, + "step": 523 + }, + { + "epoch": 0.02, + "learning_rate": 2.6305220883534136e-06, + "loss": 1.1379, + "step": 524 + }, + { + "epoch": 0.02, + "learning_rate": 2.635542168674699e-06, + "loss": 1.2911, + "step": 525 + }, + { + "epoch": 0.02, + "learning_rate": 2.640562248995984e-06, + "loss": 1.1744, + "step": 526 + }, + { + "epoch": 0.02, + "learning_rate": 2.6455823293172696e-06, + "loss": 1.0969, + "step": 527 + }, + { + "epoch": 0.02, + "learning_rate": 2.6506024096385547e-06, + "loss": 1.2247, + "step": 528 + }, + { + "epoch": 0.02, + "learning_rate": 2.6556224899598397e-06, + "loss": 1.2526, + "step": 529 + }, + { + "epoch": 0.02, + "learning_rate": 2.6606425702811243e-06, + "loss": 1.2623, + "step": 530 + }, + { + "epoch": 0.02, + "learning_rate": 2.66566265060241e-06, + "loss": 1.207, + "step": 531 + }, + { + "epoch": 0.02, + "learning_rate": 2.670682730923695e-06, + "loss": 1.0773, + "step": 532 + }, + { + "epoch": 0.02, + "learning_rate": 2.67570281124498e-06, + "loss": 1.2032, + "step": 533 + }, + { + "epoch": 0.02, + "learning_rate": 2.6807228915662654e-06, + "loss": 1.1102, + "step": 534 + }, + { + "epoch": 0.02, + "learning_rate": 2.6857429718875504e-06, + "loss": 1.237, + "step": 535 + }, + { + "epoch": 0.02, + "learning_rate": 2.690763052208836e-06, + "loss": 1.1904, + "step": 536 + }, + { + "epoch": 0.02, + "learning_rate": 2.695783132530121e-06, + "loss": 1.2063, + "step": 537 + }, + { + "epoch": 0.02, + "learning_rate": 2.700803212851406e-06, + "loss": 1.2887, + "step": 538 + }, + { + "epoch": 0.02, + "learning_rate": 2.7058232931726906e-06, + "loss": 1.1348, + "step": 539 + }, + { + "epoch": 0.02, + "learning_rate": 2.710843373493976e-06, + "loss": 1.166, + "step": 540 + }, + { + "epoch": 0.02, + "learning_rate": 2.715863453815261e-06, + "loss": 1.2218, + "step": 541 + }, + { + "epoch": 0.02, + "learning_rate": 2.7208835341365462e-06, + "loss": 1.2759, + "step": 542 + }, + { + "epoch": 0.02, + "learning_rate": 2.7259036144578317e-06, + "loss": 1.1385, + "step": 543 + }, + { + "epoch": 0.02, + "learning_rate": 2.7309236947791167e-06, + "loss": 1.0538, + "step": 544 + }, + { + "epoch": 0.02, + "learning_rate": 2.735943775100402e-06, + "loss": 1.1441, + "step": 545 + }, + { + "epoch": 0.02, + "learning_rate": 2.7409638554216873e-06, + "loss": 1.2615, + "step": 546 + }, + { + "epoch": 0.02, + "learning_rate": 2.745983935742972e-06, + "loss": 1.192, + "step": 547 + }, + { + "epoch": 0.02, + "learning_rate": 2.751004016064257e-06, + "loss": 1.2115, + "step": 548 + }, + { + "epoch": 0.02, + "learning_rate": 2.7560240963855424e-06, + "loss": 1.1034, + "step": 549 + }, + { + "epoch": 0.02, + "learning_rate": 2.7610441767068275e-06, + "loss": 1.1382, + "step": 550 + }, + { + "epoch": 0.02, + "learning_rate": 2.7660642570281125e-06, + "loss": 1.2318, + "step": 551 + }, + { + "epoch": 0.02, + "learning_rate": 2.771084337349398e-06, + "loss": 1.2134, + "step": 552 + }, + { + "epoch": 0.02, + "learning_rate": 2.776104417670683e-06, + "loss": 1.1697, + "step": 553 + }, + { + "epoch": 0.02, + "learning_rate": 2.781124497991968e-06, + "loss": 1.1258, + "step": 554 + }, + { + "epoch": 0.02, + "learning_rate": 2.7861445783132536e-06, + "loss": 1.1729, + "step": 555 + }, + { + "epoch": 0.02, + "learning_rate": 2.791164658634538e-06, + "loss": 1.2006, + "step": 556 + }, + { + "epoch": 0.02, + "learning_rate": 2.7961847389558232e-06, + "loss": 1.2927, + "step": 557 + }, + { + "epoch": 0.02, + "learning_rate": 2.8012048192771087e-06, + "loss": 1.2198, + "step": 558 + }, + { + "epoch": 0.02, + "learning_rate": 2.8062248995983938e-06, + "loss": 1.187, + "step": 559 + }, + { + "epoch": 0.02, + "learning_rate": 2.811244979919679e-06, + "loss": 1.2356, + "step": 560 + }, + { + "epoch": 0.02, + "learning_rate": 2.8162650602409643e-06, + "loss": 1.2475, + "step": 561 + }, + { + "epoch": 0.02, + "learning_rate": 2.8212851405622493e-06, + "loss": 1.212, + "step": 562 + }, + { + "epoch": 0.02, + "learning_rate": 2.8263052208835344e-06, + "loss": 1.2125, + "step": 563 + }, + { + "epoch": 0.02, + "learning_rate": 2.83132530120482e-06, + "loss": 1.2113, + "step": 564 + }, + { + "epoch": 0.02, + "learning_rate": 2.8363453815261045e-06, + "loss": 1.1117, + "step": 565 + }, + { + "epoch": 0.02, + "learning_rate": 2.8413654618473895e-06, + "loss": 1.1824, + "step": 566 + }, + { + "epoch": 0.02, + "learning_rate": 2.846385542168675e-06, + "loss": 1.1953, + "step": 567 + }, + { + "epoch": 0.02, + "learning_rate": 2.85140562248996e-06, + "loss": 1.1313, + "step": 568 + }, + { + "epoch": 0.02, + "learning_rate": 2.856425702811245e-06, + "loss": 1.2103, + "step": 569 + }, + { + "epoch": 0.02, + "learning_rate": 2.8614457831325306e-06, + "loss": 1.2441, + "step": 570 + }, + { + "epoch": 0.02, + "learning_rate": 2.8664658634538156e-06, + "loss": 1.1554, + "step": 571 + }, + { + "epoch": 0.02, + "learning_rate": 2.8714859437751007e-06, + "loss": 1.0688, + "step": 572 + }, + { + "epoch": 0.02, + "learning_rate": 2.876506024096386e-06, + "loss": 1.1511, + "step": 573 + }, + { + "epoch": 0.02, + "learning_rate": 2.8815261044176708e-06, + "loss": 1.3375, + "step": 574 + }, + { + "epoch": 0.02, + "learning_rate": 2.886546184738956e-06, + "loss": 1.3309, + "step": 575 + }, + { + "epoch": 0.02, + "learning_rate": 2.891566265060241e-06, + "loss": 1.2534, + "step": 576 + }, + { + "epoch": 0.02, + "learning_rate": 2.8965863453815264e-06, + "loss": 1.1337, + "step": 577 + }, + { + "epoch": 0.02, + "learning_rate": 2.9016064257028114e-06, + "loss": 1.1599, + "step": 578 + }, + { + "epoch": 0.02, + "learning_rate": 2.906626506024097e-06, + "loss": 1.1726, + "step": 579 + }, + { + "epoch": 0.02, + "learning_rate": 2.911646586345382e-06, + "loss": 1.2249, + "step": 580 + }, + { + "epoch": 0.02, + "learning_rate": 2.916666666666667e-06, + "loss": 1.2438, + "step": 581 + }, + { + "epoch": 0.02, + "learning_rate": 2.9216867469879524e-06, + "loss": 1.2019, + "step": 582 + }, + { + "epoch": 0.02, + "learning_rate": 2.926706827309237e-06, + "loss": 1.2097, + "step": 583 + }, + { + "epoch": 0.02, + "learning_rate": 2.931726907630522e-06, + "loss": 1.1197, + "step": 584 + }, + { + "epoch": 0.02, + "learning_rate": 2.936746987951807e-06, + "loss": 1.2189, + "step": 585 + }, + { + "epoch": 0.02, + "learning_rate": 2.9417670682730926e-06, + "loss": 1.2117, + "step": 586 + }, + { + "epoch": 0.02, + "learning_rate": 2.9467871485943777e-06, + "loss": 1.2493, + "step": 587 + }, + { + "epoch": 0.02, + "learning_rate": 2.9518072289156627e-06, + "loss": 1.2043, + "step": 588 + }, + { + "epoch": 0.02, + "learning_rate": 2.9568273092369482e-06, + "loss": 1.178, + "step": 589 + }, + { + "epoch": 0.02, + "learning_rate": 2.9618473895582333e-06, + "loss": 1.1683, + "step": 590 + }, + { + "epoch": 0.02, + "learning_rate": 2.9668674698795187e-06, + "loss": 1.1815, + "step": 591 + }, + { + "epoch": 0.02, + "learning_rate": 2.9718875502008034e-06, + "loss": 1.1632, + "step": 592 + }, + { + "epoch": 0.02, + "learning_rate": 2.9769076305220884e-06, + "loss": 1.2046, + "step": 593 + }, + { + "epoch": 0.02, + "learning_rate": 2.9819277108433735e-06, + "loss": 1.1616, + "step": 594 + }, + { + "epoch": 0.02, + "learning_rate": 2.986947791164659e-06, + "loss": 1.2184, + "step": 595 + }, + { + "epoch": 0.02, + "learning_rate": 2.991967871485944e-06, + "loss": 1.1403, + "step": 596 + }, + { + "epoch": 0.02, + "learning_rate": 2.996987951807229e-06, + "loss": 1.1066, + "step": 597 + }, + { + "epoch": 0.02, + "learning_rate": 3.0020080321285145e-06, + "loss": 1.3006, + "step": 598 + }, + { + "epoch": 0.02, + "learning_rate": 3.0070281124497996e-06, + "loss": 1.1857, + "step": 599 + }, + { + "epoch": 0.02, + "learning_rate": 3.012048192771085e-06, + "loss": 1.1275, + "step": 600 + }, + { + "epoch": 0.02, + "learning_rate": 3.0170682730923697e-06, + "loss": 1.1747, + "step": 601 + }, + { + "epoch": 0.02, + "learning_rate": 3.0220883534136547e-06, + "loss": 1.2317, + "step": 602 + }, + { + "epoch": 0.02, + "learning_rate": 3.0271084337349398e-06, + "loss": 1.0913, + "step": 603 + }, + { + "epoch": 0.02, + "learning_rate": 3.0321285140562252e-06, + "loss": 1.1472, + "step": 604 + }, + { + "epoch": 0.02, + "learning_rate": 3.0371485943775103e-06, + "loss": 1.181, + "step": 605 + }, + { + "epoch": 0.02, + "learning_rate": 3.0421686746987953e-06, + "loss": 1.1639, + "step": 606 + }, + { + "epoch": 0.02, + "learning_rate": 3.047188755020081e-06, + "loss": 1.0945, + "step": 607 + }, + { + "epoch": 0.02, + "learning_rate": 3.052208835341366e-06, + "loss": 1.2145, + "step": 608 + }, + { + "epoch": 0.02, + "learning_rate": 3.057228915662651e-06, + "loss": 1.0829, + "step": 609 + }, + { + "epoch": 0.02, + "learning_rate": 3.062248995983936e-06, + "loss": 1.1107, + "step": 610 + }, + { + "epoch": 0.02, + "learning_rate": 3.067269076305221e-06, + "loss": 1.1605, + "step": 611 + }, + { + "epoch": 0.02, + "learning_rate": 3.072289156626506e-06, + "loss": 1.1741, + "step": 612 + }, + { + "epoch": 0.02, + "learning_rate": 3.0773092369477915e-06, + "loss": 1.1684, + "step": 613 + }, + { + "epoch": 0.02, + "learning_rate": 3.0823293172690766e-06, + "loss": 1.1579, + "step": 614 + }, + { + "epoch": 0.02, + "learning_rate": 3.0873493975903616e-06, + "loss": 1.2404, + "step": 615 + }, + { + "epoch": 0.02, + "learning_rate": 3.092369477911647e-06, + "loss": 1.1518, + "step": 616 + }, + { + "epoch": 0.02, + "learning_rate": 3.097389558232932e-06, + "loss": 1.1941, + "step": 617 + }, + { + "epoch": 0.02, + "learning_rate": 3.1024096385542172e-06, + "loss": 1.212, + "step": 618 + }, + { + "epoch": 0.02, + "learning_rate": 3.107429718875502e-06, + "loss": 1.0948, + "step": 619 + }, + { + "epoch": 0.02, + "learning_rate": 3.1124497991967873e-06, + "loss": 1.1985, + "step": 620 + }, + { + "epoch": 0.02, + "learning_rate": 3.1174698795180724e-06, + "loss": 1.0709, + "step": 621 + }, + { + "epoch": 0.02, + "learning_rate": 3.122489959839358e-06, + "loss": 1.1178, + "step": 622 + }, + { + "epoch": 0.02, + "learning_rate": 3.127510040160643e-06, + "loss": 1.2018, + "step": 623 + }, + { + "epoch": 0.02, + "learning_rate": 3.132530120481928e-06, + "loss": 0.9734, + "step": 624 + }, + { + "epoch": 0.02, + "learning_rate": 3.1375502008032134e-06, + "loss": 1.1774, + "step": 625 + }, + { + "epoch": 0.02, + "learning_rate": 3.1425702811244985e-06, + "loss": 1.1783, + "step": 626 + }, + { + "epoch": 0.02, + "learning_rate": 3.147590361445783e-06, + "loss": 1.083, + "step": 627 + }, + { + "epoch": 0.02, + "learning_rate": 3.152610441767068e-06, + "loss": 1.1686, + "step": 628 + }, + { + "epoch": 0.02, + "learning_rate": 3.1576305220883536e-06, + "loss": 1.1891, + "step": 629 + }, + { + "epoch": 0.02, + "learning_rate": 3.1626506024096387e-06, + "loss": 1.2729, + "step": 630 + }, + { + "epoch": 0.02, + "learning_rate": 3.167670682730924e-06, + "loss": 1.1238, + "step": 631 + }, + { + "epoch": 0.02, + "learning_rate": 3.172690763052209e-06, + "loss": 1.1558, + "step": 632 + }, + { + "epoch": 0.02, + "learning_rate": 3.1777108433734942e-06, + "loss": 1.1774, + "step": 633 + }, + { + "epoch": 0.02, + "learning_rate": 3.1827309236947797e-06, + "loss": 1.1907, + "step": 634 + }, + { + "epoch": 0.02, + "learning_rate": 3.1877510040160648e-06, + "loss": 1.1663, + "step": 635 + }, + { + "epoch": 0.02, + "learning_rate": 3.1927710843373494e-06, + "loss": 1.255, + "step": 636 + }, + { + "epoch": 0.02, + "learning_rate": 3.1977911646586344e-06, + "loss": 1.205, + "step": 637 + }, + { + "epoch": 0.02, + "learning_rate": 3.20281124497992e-06, + "loss": 1.202, + "step": 638 + }, + { + "epoch": 0.02, + "learning_rate": 3.207831325301205e-06, + "loss": 1.1733, + "step": 639 + }, + { + "epoch": 0.02, + "learning_rate": 3.21285140562249e-06, + "loss": 1.174, + "step": 640 + }, + { + "epoch": 0.02, + "learning_rate": 3.2178714859437755e-06, + "loss": 1.1836, + "step": 641 + }, + { + "epoch": 0.02, + "learning_rate": 3.2228915662650605e-06, + "loss": 1.1837, + "step": 642 + }, + { + "epoch": 0.02, + "learning_rate": 3.227911646586346e-06, + "loss": 1.1914, + "step": 643 + }, + { + "epoch": 0.02, + "learning_rate": 3.232931726907631e-06, + "loss": 1.1087, + "step": 644 + }, + { + "epoch": 0.02, + "learning_rate": 3.2379518072289157e-06, + "loss": 1.189, + "step": 645 + }, + { + "epoch": 0.02, + "learning_rate": 3.2429718875502007e-06, + "loss": 1.1396, + "step": 646 + }, + { + "epoch": 0.02, + "learning_rate": 3.247991967871486e-06, + "loss": 1.1616, + "step": 647 + }, + { + "epoch": 0.02, + "learning_rate": 3.2530120481927713e-06, + "loss": 1.1066, + "step": 648 + }, + { + "epoch": 0.02, + "learning_rate": 3.2580321285140563e-06, + "loss": 1.0612, + "step": 649 + }, + { + "epoch": 0.02, + "learning_rate": 3.2630522088353418e-06, + "loss": 1.2165, + "step": 650 + }, + { + "epoch": 0.02, + "learning_rate": 3.268072289156627e-06, + "loss": 1.1463, + "step": 651 + }, + { + "epoch": 0.02, + "learning_rate": 3.2730923694779123e-06, + "loss": 1.1987, + "step": 652 + }, + { + "epoch": 0.02, + "learning_rate": 3.2781124497991974e-06, + "loss": 1.1287, + "step": 653 + }, + { + "epoch": 0.02, + "learning_rate": 3.283132530120482e-06, + "loss": 0.945, + "step": 654 + }, + { + "epoch": 0.02, + "learning_rate": 3.288152610441767e-06, + "loss": 1.1806, + "step": 655 + }, + { + "epoch": 0.02, + "learning_rate": 3.2931726907630525e-06, + "loss": 1.161, + "step": 656 + }, + { + "epoch": 0.02, + "learning_rate": 3.2981927710843376e-06, + "loss": 1.0748, + "step": 657 + }, + { + "epoch": 0.02, + "learning_rate": 3.3032128514056226e-06, + "loss": 1.2085, + "step": 658 + }, + { + "epoch": 0.02, + "learning_rate": 3.308232931726908e-06, + "loss": 1.243, + "step": 659 + }, + { + "epoch": 0.02, + "learning_rate": 3.313253012048193e-06, + "loss": 1.0631, + "step": 660 + }, + { + "epoch": 0.02, + "learning_rate": 3.318273092369478e-06, + "loss": 1.2524, + "step": 661 + }, + { + "epoch": 0.02, + "learning_rate": 3.3232931726907636e-06, + "loss": 1.1423, + "step": 662 + }, + { + "epoch": 0.02, + "learning_rate": 3.3283132530120483e-06, + "loss": 1.2026, + "step": 663 + }, + { + "epoch": 0.02, + "learning_rate": 3.3333333333333333e-06, + "loss": 1.124, + "step": 664 + }, + { + "epoch": 0.02, + "learning_rate": 3.338353413654619e-06, + "loss": 1.0865, + "step": 665 + }, + { + "epoch": 0.02, + "learning_rate": 3.343373493975904e-06, + "loss": 1.1572, + "step": 666 + }, + { + "epoch": 0.02, + "learning_rate": 3.348393574297189e-06, + "loss": 1.1689, + "step": 667 + }, + { + "epoch": 0.02, + "learning_rate": 3.3534136546184744e-06, + "loss": 1.3318, + "step": 668 + }, + { + "epoch": 0.02, + "learning_rate": 3.3584337349397594e-06, + "loss": 1.2412, + "step": 669 + }, + { + "epoch": 0.02, + "learning_rate": 3.3634538152610445e-06, + "loss": 1.128, + "step": 670 + }, + { + "epoch": 0.02, + "learning_rate": 3.36847389558233e-06, + "loss": 1.1482, + "step": 671 + }, + { + "epoch": 0.02, + "learning_rate": 3.3734939759036146e-06, + "loss": 1.1898, + "step": 672 + }, + { + "epoch": 0.02, + "learning_rate": 3.3785140562248996e-06, + "loss": 1.2017, + "step": 673 + }, + { + "epoch": 0.02, + "learning_rate": 3.383534136546185e-06, + "loss": 1.1882, + "step": 674 + }, + { + "epoch": 0.02, + "learning_rate": 3.38855421686747e-06, + "loss": 1.1981, + "step": 675 + }, + { + "epoch": 0.02, + "learning_rate": 3.393574297188755e-06, + "loss": 1.1197, + "step": 676 + }, + { + "epoch": 0.02, + "learning_rate": 3.3985943775100407e-06, + "loss": 1.1023, + "step": 677 + }, + { + "epoch": 0.02, + "learning_rate": 3.4036144578313257e-06, + "loss": 1.1816, + "step": 678 + }, + { + "epoch": 0.02, + "learning_rate": 3.4086345381526108e-06, + "loss": 1.1912, + "step": 679 + }, + { + "epoch": 0.02, + "learning_rate": 3.4136546184738962e-06, + "loss": 1.2328, + "step": 680 + }, + { + "epoch": 0.02, + "learning_rate": 3.418674698795181e-06, + "loss": 1.161, + "step": 681 + }, + { + "epoch": 0.02, + "learning_rate": 3.423694779116466e-06, + "loss": 1.231, + "step": 682 + }, + { + "epoch": 0.02, + "learning_rate": 3.428714859437751e-06, + "loss": 1.1907, + "step": 683 + }, + { + "epoch": 0.02, + "learning_rate": 3.4337349397590364e-06, + "loss": 1.1454, + "step": 684 + }, + { + "epoch": 0.02, + "learning_rate": 3.4387550200803215e-06, + "loss": 1.1617, + "step": 685 + }, + { + "epoch": 0.02, + "learning_rate": 3.443775100401607e-06, + "loss": 1.0974, + "step": 686 + }, + { + "epoch": 0.02, + "learning_rate": 3.448795180722892e-06, + "loss": 1.2363, + "step": 687 + }, + { + "epoch": 0.02, + "learning_rate": 3.453815261044177e-06, + "loss": 1.0786, + "step": 688 + }, + { + "epoch": 0.02, + "learning_rate": 3.4588353413654625e-06, + "loss": 1.2175, + "step": 689 + }, + { + "epoch": 0.02, + "learning_rate": 3.463855421686747e-06, + "loss": 1.2083, + "step": 690 + }, + { + "epoch": 0.02, + "learning_rate": 3.4688755020080322e-06, + "loss": 1.2068, + "step": 691 + }, + { + "epoch": 0.02, + "learning_rate": 3.4738955823293173e-06, + "loss": 1.1506, + "step": 692 + }, + { + "epoch": 0.02, + "learning_rate": 3.4789156626506027e-06, + "loss": 1.0679, + "step": 693 + }, + { + "epoch": 0.02, + "learning_rate": 3.4839357429718878e-06, + "loss": 1.2758, + "step": 694 + }, + { + "epoch": 0.02, + "learning_rate": 3.4889558232931733e-06, + "loss": 1.2507, + "step": 695 + }, + { + "epoch": 0.02, + "learning_rate": 3.4939759036144583e-06, + "loss": 1.1918, + "step": 696 + }, + { + "epoch": 0.02, + "learning_rate": 3.4989959839357434e-06, + "loss": 1.1268, + "step": 697 + }, + { + "epoch": 0.02, + "learning_rate": 3.504016064257029e-06, + "loss": 1.2251, + "step": 698 + }, + { + "epoch": 0.02, + "learning_rate": 3.5090361445783135e-06, + "loss": 1.2472, + "step": 699 + }, + { + "epoch": 0.02, + "learning_rate": 3.5140562248995985e-06, + "loss": 1.0486, + "step": 700 + }, + { + "epoch": 0.02, + "learning_rate": 3.5190763052208836e-06, + "loss": 1.1672, + "step": 701 + }, + { + "epoch": 0.02, + "learning_rate": 3.524096385542169e-06, + "loss": 1.2443, + "step": 702 + }, + { + "epoch": 0.02, + "learning_rate": 3.529116465863454e-06, + "loss": 1.2083, + "step": 703 + }, + { + "epoch": 0.02, + "learning_rate": 3.534136546184739e-06, + "loss": 1.1537, + "step": 704 + }, + { + "epoch": 0.02, + "learning_rate": 3.5391566265060246e-06, + "loss": 1.1952, + "step": 705 + }, + { + "epoch": 0.02, + "learning_rate": 3.5441767068273097e-06, + "loss": 1.3051, + "step": 706 + }, + { + "epoch": 0.02, + "learning_rate": 3.5491967871485943e-06, + "loss": 1.1139, + "step": 707 + }, + { + "epoch": 0.02, + "learning_rate": 3.5542168674698798e-06, + "loss": 1.166, + "step": 708 + }, + { + "epoch": 0.02, + "learning_rate": 3.559236947791165e-06, + "loss": 1.0823, + "step": 709 + }, + { + "epoch": 0.02, + "learning_rate": 3.56425702811245e-06, + "loss": 1.1886, + "step": 710 + }, + { + "epoch": 0.02, + "learning_rate": 3.5692771084337353e-06, + "loss": 1.2087, + "step": 711 + }, + { + "epoch": 0.02, + "learning_rate": 3.5742971887550204e-06, + "loss": 1.1559, + "step": 712 + }, + { + "epoch": 0.02, + "learning_rate": 3.5793172690763054e-06, + "loss": 1.1663, + "step": 713 + }, + { + "epoch": 0.02, + "learning_rate": 3.584337349397591e-06, + "loss": 1.2113, + "step": 714 + }, + { + "epoch": 0.02, + "learning_rate": 3.589357429718876e-06, + "loss": 1.1192, + "step": 715 + }, + { + "epoch": 0.02, + "learning_rate": 3.5943775100401606e-06, + "loss": 1.2707, + "step": 716 + }, + { + "epoch": 0.02, + "learning_rate": 3.599397590361446e-06, + "loss": 1.236, + "step": 717 + }, + { + "epoch": 0.02, + "learning_rate": 3.604417670682731e-06, + "loss": 1.2584, + "step": 718 + }, + { + "epoch": 0.02, + "learning_rate": 3.609437751004016e-06, + "loss": 1.1155, + "step": 719 + }, + { + "epoch": 0.02, + "learning_rate": 3.6144578313253016e-06, + "loss": 1.1029, + "step": 720 + }, + { + "epoch": 0.02, + "learning_rate": 3.6194779116465867e-06, + "loss": 1.1742, + "step": 721 + }, + { + "epoch": 0.02, + "learning_rate": 3.6244979919678717e-06, + "loss": 1.12, + "step": 722 + }, + { + "epoch": 0.02, + "learning_rate": 3.629518072289157e-06, + "loss": 1.166, + "step": 723 + }, + { + "epoch": 0.02, + "learning_rate": 3.6345381526104423e-06, + "loss": 1.1995, + "step": 724 + }, + { + "epoch": 0.02, + "learning_rate": 3.639558232931727e-06, + "loss": 1.203, + "step": 725 + }, + { + "epoch": 0.02, + "learning_rate": 3.6445783132530124e-06, + "loss": 1.0984, + "step": 726 + }, + { + "epoch": 0.02, + "learning_rate": 3.6495983935742974e-06, + "loss": 1.271, + "step": 727 + }, + { + "epoch": 0.02, + "learning_rate": 3.6546184738955825e-06, + "loss": 1.1285, + "step": 728 + }, + { + "epoch": 0.02, + "learning_rate": 3.659638554216868e-06, + "loss": 1.1595, + "step": 729 + }, + { + "epoch": 0.02, + "learning_rate": 3.664658634538153e-06, + "loss": 1.0826, + "step": 730 + }, + { + "epoch": 0.02, + "learning_rate": 3.669678714859438e-06, + "loss": 1.1198, + "step": 731 + }, + { + "epoch": 0.02, + "learning_rate": 3.6746987951807235e-06, + "loss": 1.2574, + "step": 732 + }, + { + "epoch": 0.02, + "learning_rate": 3.6797188755020085e-06, + "loss": 1.1336, + "step": 733 + }, + { + "epoch": 0.02, + "learning_rate": 3.684738955823293e-06, + "loss": 1.225, + "step": 734 + }, + { + "epoch": 0.02, + "learning_rate": 3.6897590361445782e-06, + "loss": 1.1661, + "step": 735 + }, + { + "epoch": 0.02, + "learning_rate": 3.6947791164658637e-06, + "loss": 1.2579, + "step": 736 + }, + { + "epoch": 0.02, + "learning_rate": 3.6997991967871487e-06, + "loss": 1.058, + "step": 737 + }, + { + "epoch": 0.02, + "learning_rate": 3.7048192771084342e-06, + "loss": 1.1254, + "step": 738 + }, + { + "epoch": 0.02, + "learning_rate": 3.7098393574297193e-06, + "loss": 1.2144, + "step": 739 + }, + { + "epoch": 0.02, + "learning_rate": 3.7148594377510043e-06, + "loss": 1.1376, + "step": 740 + }, + { + "epoch": 0.02, + "learning_rate": 3.71987951807229e-06, + "loss": 1.1866, + "step": 741 + }, + { + "epoch": 0.02, + "learning_rate": 3.724899598393575e-06, + "loss": 1.1795, + "step": 742 + }, + { + "epoch": 0.02, + "learning_rate": 3.7299196787148595e-06, + "loss": 1.1188, + "step": 743 + }, + { + "epoch": 0.02, + "learning_rate": 3.7349397590361445e-06, + "loss": 1.2007, + "step": 744 + }, + { + "epoch": 0.02, + "learning_rate": 3.73995983935743e-06, + "loss": 1.0975, + "step": 745 + }, + { + "epoch": 0.02, + "learning_rate": 3.744979919678715e-06, + "loss": 1.1866, + "step": 746 + }, + { + "epoch": 0.02, + "learning_rate": 3.7500000000000005e-06, + "loss": 1.1664, + "step": 747 + }, + { + "epoch": 0.02, + "learning_rate": 3.7550200803212856e-06, + "loss": 1.1823, + "step": 748 + }, + { + "epoch": 0.02, + "learning_rate": 3.7600401606425706e-06, + "loss": 1.1309, + "step": 749 + }, + { + "epoch": 0.02, + "learning_rate": 3.765060240963856e-06, + "loss": 1.2036, + "step": 750 + }, + { + "epoch": 0.02, + "learning_rate": 3.770080321285141e-06, + "loss": 1.2324, + "step": 751 + }, + { + "epoch": 0.02, + "learning_rate": 3.7751004016064258e-06, + "loss": 1.1739, + "step": 752 + }, + { + "epoch": 0.02, + "learning_rate": 3.780120481927711e-06, + "loss": 1.0905, + "step": 753 + }, + { + "epoch": 0.02, + "learning_rate": 3.7851405622489963e-06, + "loss": 1.1924, + "step": 754 + }, + { + "epoch": 0.02, + "learning_rate": 3.7901606425702813e-06, + "loss": 1.2185, + "step": 755 + }, + { + "epoch": 0.02, + "learning_rate": 3.7951807228915664e-06, + "loss": 1.1776, + "step": 756 + }, + { + "epoch": 0.02, + "learning_rate": 3.800200803212852e-06, + "loss": 1.1347, + "step": 757 + }, + { + "epoch": 0.02, + "learning_rate": 3.805220883534137e-06, + "loss": 1.1628, + "step": 758 + }, + { + "epoch": 0.02, + "learning_rate": 3.8102409638554224e-06, + "loss": 1.1449, + "step": 759 + }, + { + "epoch": 0.02, + "learning_rate": 3.8152610441767074e-06, + "loss": 1.1294, + "step": 760 + }, + { + "epoch": 0.02, + "learning_rate": 3.820281124497992e-06, + "loss": 1.2632, + "step": 761 + }, + { + "epoch": 0.02, + "learning_rate": 3.8253012048192775e-06, + "loss": 1.2375, + "step": 762 + }, + { + "epoch": 0.02, + "learning_rate": 3.830321285140562e-06, + "loss": 1.2219, + "step": 763 + }, + { + "epoch": 0.02, + "learning_rate": 3.835341365461848e-06, + "loss": 1.1803, + "step": 764 + }, + { + "epoch": 0.02, + "learning_rate": 3.840361445783133e-06, + "loss": 1.11, + "step": 765 + }, + { + "epoch": 0.02, + "learning_rate": 3.845381526104418e-06, + "loss": 1.2098, + "step": 766 + }, + { + "epoch": 0.02, + "learning_rate": 3.850401606425703e-06, + "loss": 1.2538, + "step": 767 + }, + { + "epoch": 0.02, + "learning_rate": 3.855421686746989e-06, + "loss": 1.2141, + "step": 768 + }, + { + "epoch": 0.02, + "learning_rate": 3.860441767068273e-06, + "loss": 1.1812, + "step": 769 + }, + { + "epoch": 0.02, + "learning_rate": 3.865461847389558e-06, + "loss": 1.1094, + "step": 770 + }, + { + "epoch": 0.02, + "learning_rate": 3.870481927710843e-06, + "loss": 1.1046, + "step": 771 + }, + { + "epoch": 0.02, + "learning_rate": 3.875502008032129e-06, + "loss": 1.1547, + "step": 772 + }, + { + "epoch": 0.02, + "learning_rate": 3.8805220883534135e-06, + "loss": 1.2114, + "step": 773 + }, + { + "epoch": 0.02, + "learning_rate": 3.885542168674699e-06, + "loss": 1.229, + "step": 774 + }, + { + "epoch": 0.02, + "learning_rate": 3.8905622489959845e-06, + "loss": 1.026, + "step": 775 + }, + { + "epoch": 0.02, + "learning_rate": 3.89558232931727e-06, + "loss": 1.2162, + "step": 776 + }, + { + "epoch": 0.02, + "learning_rate": 3.9006024096385546e-06, + "loss": 1.1267, + "step": 777 + }, + { + "epoch": 0.02, + "learning_rate": 3.90562248995984e-06, + "loss": 1.2231, + "step": 778 + }, + { + "epoch": 0.02, + "learning_rate": 3.910642570281125e-06, + "loss": 1.1613, + "step": 779 + }, + { + "epoch": 0.02, + "learning_rate": 3.91566265060241e-06, + "loss": 1.1917, + "step": 780 + }, + { + "epoch": 0.02, + "learning_rate": 3.920682730923695e-06, + "loss": 1.3037, + "step": 781 + }, + { + "epoch": 0.02, + "learning_rate": 3.92570281124498e-06, + "loss": 1.1561, + "step": 782 + }, + { + "epoch": 0.02, + "learning_rate": 3.930722891566266e-06, + "loss": 1.1202, + "step": 783 + }, + { + "epoch": 0.02, + "learning_rate": 3.93574297188755e-06, + "loss": 1.2013, + "step": 784 + }, + { + "epoch": 0.02, + "learning_rate": 3.940763052208836e-06, + "loss": 1.3037, + "step": 785 + }, + { + "epoch": 0.02, + "learning_rate": 3.945783132530121e-06, + "loss": 1.2101, + "step": 786 + }, + { + "epoch": 0.02, + "learning_rate": 3.950803212851406e-06, + "loss": 1.1733, + "step": 787 + }, + { + "epoch": 0.02, + "learning_rate": 3.9558232931726905e-06, + "loss": 1.0984, + "step": 788 + }, + { + "epoch": 0.02, + "learning_rate": 3.960843373493976e-06, + "loss": 1.2742, + "step": 789 + }, + { + "epoch": 0.02, + "learning_rate": 3.9658634538152615e-06, + "loss": 1.1224, + "step": 790 + }, + { + "epoch": 0.02, + "learning_rate": 3.970883534136546e-06, + "loss": 1.1318, + "step": 791 + }, + { + "epoch": 0.02, + "learning_rate": 3.975903614457832e-06, + "loss": 1.1938, + "step": 792 + }, + { + "epoch": 0.02, + "learning_rate": 3.980923694779117e-06, + "loss": 1.1208, + "step": 793 + }, + { + "epoch": 0.02, + "learning_rate": 3.985943775100402e-06, + "loss": 1.1153, + "step": 794 + }, + { + "epoch": 0.02, + "learning_rate": 3.990963855421687e-06, + "loss": 1.0952, + "step": 795 + }, + { + "epoch": 0.02, + "learning_rate": 3.995983935742972e-06, + "loss": 1.0912, + "step": 796 + }, + { + "epoch": 0.02, + "learning_rate": 4.001004016064257e-06, + "loss": 1.1032, + "step": 797 + }, + { + "epoch": 0.02, + "learning_rate": 4.006024096385543e-06, + "loss": 1.204, + "step": 798 + }, + { + "epoch": 0.02, + "learning_rate": 4.011044176706827e-06, + "loss": 1.2959, + "step": 799 + }, + { + "epoch": 0.02, + "learning_rate": 4.016064257028113e-06, + "loss": 1.1191, + "step": 800 + }, + { + "epoch": 0.02, + "learning_rate": 4.021084337349398e-06, + "loss": 1.2489, + "step": 801 + }, + { + "epoch": 0.02, + "learning_rate": 4.026104417670683e-06, + "loss": 1.1782, + "step": 802 + }, + { + "epoch": 0.02, + "learning_rate": 4.031124497991968e-06, + "loss": 1.1559, + "step": 803 + }, + { + "epoch": 0.02, + "learning_rate": 4.036144578313254e-06, + "loss": 1.1214, + "step": 804 + }, + { + "epoch": 0.02, + "learning_rate": 4.0411646586345385e-06, + "loss": 1.0647, + "step": 805 + }, + { + "epoch": 0.02, + "learning_rate": 4.046184738955823e-06, + "loss": 1.1761, + "step": 806 + }, + { + "epoch": 0.02, + "learning_rate": 4.051204819277109e-06, + "loss": 1.2045, + "step": 807 + }, + { + "epoch": 0.02, + "learning_rate": 4.056224899598394e-06, + "loss": 1.1516, + "step": 808 + }, + { + "epoch": 0.02, + "learning_rate": 4.061244979919679e-06, + "loss": 1.0133, + "step": 809 + }, + { + "epoch": 0.02, + "learning_rate": 4.066265060240964e-06, + "loss": 1.1262, + "step": 810 + }, + { + "epoch": 0.02, + "learning_rate": 4.07128514056225e-06, + "loss": 1.136, + "step": 811 + }, + { + "epoch": 0.02, + "learning_rate": 4.076305220883534e-06, + "loss": 1.2465, + "step": 812 + }, + { + "epoch": 0.02, + "learning_rate": 4.08132530120482e-06, + "loss": 1.121, + "step": 813 + }, + { + "epoch": 0.02, + "learning_rate": 4.086345381526104e-06, + "loss": 1.1965, + "step": 814 + }, + { + "epoch": 0.02, + "learning_rate": 4.09136546184739e-06, + "loss": 1.1956, + "step": 815 + }, + { + "epoch": 0.02, + "learning_rate": 4.096385542168675e-06, + "loss": 1.2074, + "step": 816 + }, + { + "epoch": 0.02, + "learning_rate": 4.10140562248996e-06, + "loss": 1.2259, + "step": 817 + }, + { + "epoch": 0.02, + "learning_rate": 4.106425702811245e-06, + "loss": 1.2367, + "step": 818 + }, + { + "epoch": 0.02, + "learning_rate": 4.111445783132531e-06, + "loss": 1.2288, + "step": 819 + }, + { + "epoch": 0.02, + "learning_rate": 4.1164658634538155e-06, + "loss": 1.0935, + "step": 820 + }, + { + "epoch": 0.02, + "learning_rate": 4.121485943775101e-06, + "loss": 1.1758, + "step": 821 + }, + { + "epoch": 0.02, + "learning_rate": 4.1265060240963865e-06, + "loss": 1.157, + "step": 822 + }, + { + "epoch": 0.02, + "learning_rate": 4.131526104417671e-06, + "loss": 1.2372, + "step": 823 + }, + { + "epoch": 0.02, + "learning_rate": 4.136546184738956e-06, + "loss": 1.1852, + "step": 824 + }, + { + "epoch": 0.02, + "learning_rate": 4.141566265060241e-06, + "loss": 1.2545, + "step": 825 + }, + { + "epoch": 0.02, + "learning_rate": 4.146586345381527e-06, + "loss": 1.1528, + "step": 826 + }, + { + "epoch": 0.02, + "learning_rate": 4.151606425702811e-06, + "loss": 1.2108, + "step": 827 + }, + { + "epoch": 0.02, + "learning_rate": 4.156626506024097e-06, + "loss": 1.2369, + "step": 828 + }, + { + "epoch": 0.02, + "learning_rate": 4.161646586345382e-06, + "loss": 1.1534, + "step": 829 + }, + { + "epoch": 0.03, + "learning_rate": 4.166666666666667e-06, + "loss": 1.1229, + "step": 830 + }, + { + "epoch": 0.03, + "learning_rate": 4.171686746987952e-06, + "loss": 1.1689, + "step": 831 + }, + { + "epoch": 0.03, + "learning_rate": 4.176706827309237e-06, + "loss": 1.2139, + "step": 832 + }, + { + "epoch": 0.03, + "learning_rate": 4.1817269076305224e-06, + "loss": 1.1818, + "step": 833 + }, + { + "epoch": 0.03, + "learning_rate": 4.186746987951807e-06, + "loss": 1.0599, + "step": 834 + }, + { + "epoch": 0.03, + "learning_rate": 4.1917670682730925e-06, + "loss": 1.1351, + "step": 835 + }, + { + "epoch": 0.03, + "learning_rate": 4.196787148594378e-06, + "loss": 1.193, + "step": 836 + }, + { + "epoch": 0.03, + "learning_rate": 4.201807228915663e-06, + "loss": 1.2032, + "step": 837 + }, + { + "epoch": 0.03, + "learning_rate": 4.206827309236948e-06, + "loss": 1.1447, + "step": 838 + }, + { + "epoch": 0.03, + "learning_rate": 4.211847389558234e-06, + "loss": 1.0885, + "step": 839 + }, + { + "epoch": 0.03, + "learning_rate": 4.216867469879519e-06, + "loss": 1.1421, + "step": 840 + }, + { + "epoch": 0.03, + "learning_rate": 4.221887550200804e-06, + "loss": 1.2253, + "step": 841 + }, + { + "epoch": 0.03, + "learning_rate": 4.226907630522088e-06, + "loss": 1.2026, + "step": 842 + }, + { + "epoch": 0.03, + "learning_rate": 4.231927710843374e-06, + "loss": 1.194, + "step": 843 + }, + { + "epoch": 0.03, + "learning_rate": 4.236947791164659e-06, + "loss": 1.187, + "step": 844 + }, + { + "epoch": 0.03, + "learning_rate": 4.241967871485944e-06, + "loss": 1.1255, + "step": 845 + }, + { + "epoch": 0.03, + "learning_rate": 4.246987951807229e-06, + "loss": 1.0867, + "step": 846 + }, + { + "epoch": 0.03, + "learning_rate": 4.252008032128515e-06, + "loss": 1.1239, + "step": 847 + }, + { + "epoch": 0.03, + "learning_rate": 4.2570281124497995e-06, + "loss": 1.1511, + "step": 848 + }, + { + "epoch": 0.03, + "learning_rate": 4.262048192771085e-06, + "loss": 1.2089, + "step": 849 + }, + { + "epoch": 0.03, + "learning_rate": 4.2670682730923696e-06, + "loss": 1.3069, + "step": 850 + }, + { + "epoch": 0.03, + "learning_rate": 4.272088353413655e-06, + "loss": 1.1969, + "step": 851 + }, + { + "epoch": 0.03, + "learning_rate": 4.27710843373494e-06, + "loss": 1.1122, + "step": 852 + }, + { + "epoch": 0.03, + "learning_rate": 4.282128514056225e-06, + "loss": 1.1059, + "step": 853 + }, + { + "epoch": 0.03, + "learning_rate": 4.287148594377511e-06, + "loss": 1.2266, + "step": 854 + }, + { + "epoch": 0.03, + "learning_rate": 4.292168674698795e-06, + "loss": 1.1371, + "step": 855 + }, + { + "epoch": 0.03, + "learning_rate": 4.297188755020081e-06, + "loss": 1.1995, + "step": 856 + }, + { + "epoch": 0.03, + "learning_rate": 4.302208835341366e-06, + "loss": 1.1223, + "step": 857 + }, + { + "epoch": 0.03, + "learning_rate": 4.307228915662651e-06, + "loss": 1.2378, + "step": 858 + }, + { + "epoch": 0.03, + "learning_rate": 4.312248995983936e-06, + "loss": 1.0909, + "step": 859 + }, + { + "epoch": 0.03, + "learning_rate": 4.317269076305221e-06, + "loss": 1.2485, + "step": 860 + }, + { + "epoch": 0.03, + "learning_rate": 4.322289156626506e-06, + "loss": 1.2812, + "step": 861 + }, + { + "epoch": 0.03, + "learning_rate": 4.327309236947792e-06, + "loss": 1.1661, + "step": 862 + }, + { + "epoch": 0.03, + "learning_rate": 4.3323293172690765e-06, + "loss": 1.2351, + "step": 863 + }, + { + "epoch": 0.03, + "learning_rate": 4.337349397590362e-06, + "loss": 1.0648, + "step": 864 + }, + { + "epoch": 0.03, + "learning_rate": 4.3423694779116474e-06, + "loss": 1.2664, + "step": 865 + }, + { + "epoch": 0.03, + "learning_rate": 4.347389558232932e-06, + "loss": 1.1964, + "step": 866 + }, + { + "epoch": 0.03, + "learning_rate": 4.3524096385542175e-06, + "loss": 1.2455, + "step": 867 + }, + { + "epoch": 0.03, + "learning_rate": 4.357429718875502e-06, + "loss": 1.1878, + "step": 868 + }, + { + "epoch": 0.03, + "learning_rate": 4.362449799196788e-06, + "loss": 1.1794, + "step": 869 + }, + { + "epoch": 0.03, + "learning_rate": 4.367469879518072e-06, + "loss": 1.1956, + "step": 870 + }, + { + "epoch": 0.03, + "learning_rate": 4.372489959839358e-06, + "loss": 1.2058, + "step": 871 + }, + { + "epoch": 0.03, + "learning_rate": 4.377510040160643e-06, + "loss": 1.2101, + "step": 872 + }, + { + "epoch": 0.03, + "learning_rate": 4.382530120481928e-06, + "loss": 1.153, + "step": 873 + }, + { + "epoch": 0.03, + "learning_rate": 4.387550200803213e-06, + "loss": 1.2831, + "step": 874 + }, + { + "epoch": 0.03, + "learning_rate": 4.392570281124499e-06, + "loss": 1.2347, + "step": 875 + }, + { + "epoch": 0.03, + "learning_rate": 4.397590361445783e-06, + "loss": 1.1672, + "step": 876 + }, + { + "epoch": 0.03, + "learning_rate": 4.402610441767068e-06, + "loss": 1.2123, + "step": 877 + }, + { + "epoch": 0.03, + "learning_rate": 4.4076305220883535e-06, + "loss": 1.1037, + "step": 878 + }, + { + "epoch": 0.03, + "learning_rate": 4.412650602409639e-06, + "loss": 1.2438, + "step": 879 + }, + { + "epoch": 0.03, + "learning_rate": 4.4176706827309244e-06, + "loss": 0.997, + "step": 880 + }, + { + "epoch": 0.03, + "learning_rate": 4.422690763052209e-06, + "loss": 1.2045, + "step": 881 + }, + { + "epoch": 0.03, + "learning_rate": 4.4277108433734945e-06, + "loss": 1.1196, + "step": 882 + }, + { + "epoch": 0.03, + "learning_rate": 4.43273092369478e-06, + "loss": 1.1945, + "step": 883 + }, + { + "epoch": 0.03, + "learning_rate": 4.437751004016065e-06, + "loss": 1.0784, + "step": 884 + }, + { + "epoch": 0.03, + "learning_rate": 4.442771084337349e-06, + "loss": 1.1674, + "step": 885 + }, + { + "epoch": 0.03, + "learning_rate": 4.447791164658635e-06, + "loss": 1.1193, + "step": 886 + }, + { + "epoch": 0.03, + "learning_rate": 4.45281124497992e-06, + "loss": 1.1965, + "step": 887 + }, + { + "epoch": 0.03, + "learning_rate": 4.457831325301205e-06, + "loss": 1.1005, + "step": 888 + }, + { + "epoch": 0.03, + "learning_rate": 4.46285140562249e-06, + "loss": 1.1612, + "step": 889 + }, + { + "epoch": 0.03, + "learning_rate": 4.467871485943776e-06, + "loss": 1.2306, + "step": 890 + }, + { + "epoch": 0.03, + "learning_rate": 4.47289156626506e-06, + "loss": 1.1507, + "step": 891 + }, + { + "epoch": 0.03, + "learning_rate": 4.477911646586346e-06, + "loss": 1.2439, + "step": 892 + }, + { + "epoch": 0.03, + "learning_rate": 4.482931726907631e-06, + "loss": 1.127, + "step": 893 + }, + { + "epoch": 0.03, + "learning_rate": 4.487951807228916e-06, + "loss": 1.2712, + "step": 894 + }, + { + "epoch": 0.03, + "learning_rate": 4.492971887550201e-06, + "loss": 1.1355, + "step": 895 + }, + { + "epoch": 0.03, + "learning_rate": 4.497991967871486e-06, + "loss": 1.1252, + "step": 896 + }, + { + "epoch": 0.03, + "learning_rate": 4.5030120481927716e-06, + "loss": 1.1775, + "step": 897 + }, + { + "epoch": 0.03, + "learning_rate": 4.508032128514056e-06, + "loss": 1.1984, + "step": 898 + }, + { + "epoch": 0.03, + "learning_rate": 4.513052208835342e-06, + "loss": 1.2047, + "step": 899 + }, + { + "epoch": 0.03, + "learning_rate": 4.518072289156627e-06, + "loss": 1.1887, + "step": 900 + }, + { + "epoch": 0.03, + "learning_rate": 4.523092369477913e-06, + "loss": 1.1821, + "step": 901 + }, + { + "epoch": 0.03, + "learning_rate": 4.528112449799197e-06, + "loss": 1.1843, + "step": 902 + }, + { + "epoch": 0.03, + "learning_rate": 4.533132530120482e-06, + "loss": 1.2064, + "step": 903 + }, + { + "epoch": 0.03, + "learning_rate": 4.538152610441767e-06, + "loss": 1.2113, + "step": 904 + }, + { + "epoch": 0.03, + "learning_rate": 4.543172690763053e-06, + "loss": 1.1174, + "step": 905 + }, + { + "epoch": 0.03, + "learning_rate": 4.5481927710843374e-06, + "loss": 1.2171, + "step": 906 + }, + { + "epoch": 0.03, + "learning_rate": 4.553212851405623e-06, + "loss": 1.1845, + "step": 907 + }, + { + "epoch": 0.03, + "learning_rate": 4.558232931726908e-06, + "loss": 1.1942, + "step": 908 + }, + { + "epoch": 0.03, + "learning_rate": 4.563253012048193e-06, + "loss": 1.1784, + "step": 909 + }, + { + "epoch": 0.03, + "learning_rate": 4.5682730923694785e-06, + "loss": 1.1885, + "step": 910 + }, + { + "epoch": 0.03, + "learning_rate": 4.573293172690764e-06, + "loss": 1.2352, + "step": 911 + }, + { + "epoch": 0.03, + "learning_rate": 4.578313253012049e-06, + "loss": 1.2156, + "step": 912 + }, + { + "epoch": 0.03, + "learning_rate": 4.583333333333333e-06, + "loss": 1.2905, + "step": 913 + }, + { + "epoch": 0.03, + "learning_rate": 4.588353413654619e-06, + "loss": 1.1228, + "step": 914 + }, + { + "epoch": 0.03, + "learning_rate": 4.593373493975904e-06, + "loss": 1.1265, + "step": 915 + }, + { + "epoch": 0.03, + "learning_rate": 4.598393574297189e-06, + "loss": 1.2225, + "step": 916 + }, + { + "epoch": 0.03, + "learning_rate": 4.603413654618474e-06, + "loss": 1.2507, + "step": 917 + }, + { + "epoch": 0.03, + "learning_rate": 4.60843373493976e-06, + "loss": 1.2174, + "step": 918 + }, + { + "epoch": 0.03, + "learning_rate": 4.613453815261044e-06, + "loss": 1.0972, + "step": 919 + }, + { + "epoch": 0.03, + "learning_rate": 4.61847389558233e-06, + "loss": 1.1577, + "step": 920 + }, + { + "epoch": 0.03, + "learning_rate": 4.6234939759036145e-06, + "loss": 1.1324, + "step": 921 + }, + { + "epoch": 0.03, + "learning_rate": 4.6285140562249e-06, + "loss": 1.1468, + "step": 922 + }, + { + "epoch": 0.03, + "learning_rate": 4.633534136546185e-06, + "loss": 1.0754, + "step": 923 + }, + { + "epoch": 0.03, + "learning_rate": 4.63855421686747e-06, + "loss": 1.0976, + "step": 924 + }, + { + "epoch": 0.03, + "learning_rate": 4.6435742971887555e-06, + "loss": 1.2158, + "step": 925 + }, + { + "epoch": 0.03, + "learning_rate": 4.648594377510041e-06, + "loss": 1.1849, + "step": 926 + }, + { + "epoch": 0.03, + "learning_rate": 4.653614457831326e-06, + "loss": 1.1783, + "step": 927 + }, + { + "epoch": 0.03, + "learning_rate": 4.658634538152611e-06, + "loss": 1.1724, + "step": 928 + }, + { + "epoch": 0.03, + "learning_rate": 4.6636546184738966e-06, + "loss": 1.1661, + "step": 929 + }, + { + "epoch": 0.03, + "learning_rate": 4.668674698795181e-06, + "loss": 1.0807, + "step": 930 + }, + { + "epoch": 0.03, + "learning_rate": 4.673694779116466e-06, + "loss": 1.2581, + "step": 931 + }, + { + "epoch": 0.03, + "learning_rate": 4.678714859437751e-06, + "loss": 1.1266, + "step": 932 + }, + { + "epoch": 0.03, + "learning_rate": 4.683734939759037e-06, + "loss": 1.2342, + "step": 933 + }, + { + "epoch": 0.03, + "learning_rate": 4.688755020080321e-06, + "loss": 1.1434, + "step": 934 + }, + { + "epoch": 0.03, + "learning_rate": 4.693775100401607e-06, + "loss": 1.1605, + "step": 935 + }, + { + "epoch": 0.03, + "learning_rate": 4.698795180722892e-06, + "loss": 1.1944, + "step": 936 + }, + { + "epoch": 0.03, + "learning_rate": 4.703815261044177e-06, + "loss": 1.3027, + "step": 937 + }, + { + "epoch": 0.03, + "learning_rate": 4.7088353413654624e-06, + "loss": 1.2478, + "step": 938 + }, + { + "epoch": 0.03, + "learning_rate": 4.713855421686747e-06, + "loss": 1.1047, + "step": 939 + }, + { + "epoch": 0.03, + "learning_rate": 4.7188755020080325e-06, + "loss": 1.2137, + "step": 940 + }, + { + "epoch": 0.03, + "learning_rate": 4.723895582329317e-06, + "loss": 1.1926, + "step": 941 + }, + { + "epoch": 0.03, + "learning_rate": 4.728915662650603e-06, + "loss": 1.301, + "step": 942 + }, + { + "epoch": 0.03, + "learning_rate": 4.733935742971888e-06, + "loss": 1.3237, + "step": 943 + }, + { + "epoch": 0.03, + "learning_rate": 4.7389558232931736e-06, + "loss": 1.1144, + "step": 944 + }, + { + "epoch": 0.03, + "learning_rate": 4.743975903614458e-06, + "loss": 1.1965, + "step": 945 + }, + { + "epoch": 0.03, + "learning_rate": 4.748995983935744e-06, + "loss": 1.1981, + "step": 946 + }, + { + "epoch": 0.03, + "learning_rate": 4.754016064257029e-06, + "loss": 1.2367, + "step": 947 + }, + { + "epoch": 0.03, + "learning_rate": 4.759036144578314e-06, + "loss": 1.2113, + "step": 948 + }, + { + "epoch": 0.03, + "learning_rate": 4.764056224899598e-06, + "loss": 1.092, + "step": 949 + }, + { + "epoch": 0.03, + "learning_rate": 4.769076305220884e-06, + "loss": 1.0604, + "step": 950 + }, + { + "epoch": 0.03, + "learning_rate": 4.774096385542169e-06, + "loss": 1.1526, + "step": 951 + }, + { + "epoch": 0.03, + "learning_rate": 4.779116465863454e-06, + "loss": 1.0151, + "step": 952 + }, + { + "epoch": 0.03, + "learning_rate": 4.7841365461847394e-06, + "loss": 1.1007, + "step": 953 + }, + { + "epoch": 0.03, + "learning_rate": 4.789156626506025e-06, + "loss": 1.1938, + "step": 954 + }, + { + "epoch": 0.03, + "learning_rate": 4.7941767068273095e-06, + "loss": 1.1664, + "step": 955 + }, + { + "epoch": 0.03, + "learning_rate": 4.799196787148594e-06, + "loss": 1.2405, + "step": 956 + }, + { + "epoch": 0.03, + "learning_rate": 4.80421686746988e-06, + "loss": 1.1171, + "step": 957 + }, + { + "epoch": 0.03, + "learning_rate": 4.809236947791165e-06, + "loss": 1.1636, + "step": 958 + }, + { + "epoch": 0.03, + "learning_rate": 4.81425702811245e-06, + "loss": 1.1574, + "step": 959 + }, + { + "epoch": 0.03, + "learning_rate": 4.819277108433735e-06, + "loss": 1.1075, + "step": 960 + }, + { + "epoch": 0.03, + "learning_rate": 4.824297188755021e-06, + "loss": 1.2254, + "step": 961 + }, + { + "epoch": 0.03, + "learning_rate": 4.829317269076305e-06, + "loss": 1.2274, + "step": 962 + }, + { + "epoch": 0.03, + "learning_rate": 4.834337349397591e-06, + "loss": 1.17, + "step": 963 + }, + { + "epoch": 0.03, + "learning_rate": 4.839357429718876e-06, + "loss": 1.1818, + "step": 964 + }, + { + "epoch": 0.03, + "learning_rate": 4.844377510040161e-06, + "loss": 1.215, + "step": 965 + }, + { + "epoch": 0.03, + "learning_rate": 4.849397590361446e-06, + "loss": 1.2313, + "step": 966 + }, + { + "epoch": 0.03, + "learning_rate": 4.854417670682731e-06, + "loss": 1.2126, + "step": 967 + }, + { + "epoch": 0.03, + "learning_rate": 4.8594377510040165e-06, + "loss": 1.3407, + "step": 968 + }, + { + "epoch": 0.03, + "learning_rate": 4.864457831325302e-06, + "loss": 1.0948, + "step": 969 + }, + { + "epoch": 0.03, + "learning_rate": 4.8694779116465866e-06, + "loss": 1.151, + "step": 970 + }, + { + "epoch": 0.03, + "learning_rate": 4.874497991967872e-06, + "loss": 1.1895, + "step": 971 + }, + { + "epoch": 0.03, + "learning_rate": 4.8795180722891575e-06, + "loss": 1.2261, + "step": 972 + }, + { + "epoch": 0.03, + "learning_rate": 4.884538152610442e-06, + "loss": 1.1776, + "step": 973 + }, + { + "epoch": 0.03, + "learning_rate": 4.889558232931727e-06, + "loss": 1.0862, + "step": 974 + }, + { + "epoch": 0.03, + "learning_rate": 4.894578313253012e-06, + "loss": 1.2307, + "step": 975 + }, + { + "epoch": 0.03, + "learning_rate": 4.899598393574298e-06, + "loss": 1.1899, + "step": 976 + }, + { + "epoch": 0.03, + "learning_rate": 4.904618473895582e-06, + "loss": 1.1544, + "step": 977 + }, + { + "epoch": 0.03, + "learning_rate": 4.909638554216868e-06, + "loss": 1.14, + "step": 978 + }, + { + "epoch": 0.03, + "learning_rate": 4.914658634538153e-06, + "loss": 1.147, + "step": 979 + }, + { + "epoch": 0.03, + "learning_rate": 4.919678714859438e-06, + "loss": 1.271, + "step": 980 + }, + { + "epoch": 0.03, + "learning_rate": 4.924698795180723e-06, + "loss": 1.3358, + "step": 981 + }, + { + "epoch": 0.03, + "learning_rate": 4.929718875502009e-06, + "loss": 1.1552, + "step": 982 + }, + { + "epoch": 0.03, + "learning_rate": 4.9347389558232935e-06, + "loss": 1.1945, + "step": 983 + }, + { + "epoch": 0.03, + "learning_rate": 4.939759036144578e-06, + "loss": 1.2268, + "step": 984 + }, + { + "epoch": 0.03, + "learning_rate": 4.944779116465864e-06, + "loss": 1.1343, + "step": 985 + }, + { + "epoch": 0.03, + "learning_rate": 4.949799196787149e-06, + "loss": 1.1038, + "step": 986 + }, + { + "epoch": 0.03, + "learning_rate": 4.9548192771084345e-06, + "loss": 1.14, + "step": 987 + }, + { + "epoch": 0.03, + "learning_rate": 4.959839357429719e-06, + "loss": 1.1661, + "step": 988 + }, + { + "epoch": 0.03, + "learning_rate": 4.964859437751005e-06, + "loss": 1.2185, + "step": 989 + }, + { + "epoch": 0.03, + "learning_rate": 4.96987951807229e-06, + "loss": 1.0518, + "step": 990 + }, + { + "epoch": 0.03, + "learning_rate": 4.974899598393575e-06, + "loss": 1.073, + "step": 991 + }, + { + "epoch": 0.03, + "learning_rate": 4.979919678714859e-06, + "loss": 1.1993, + "step": 992 + }, + { + "epoch": 0.03, + "learning_rate": 4.984939759036145e-06, + "loss": 1.1627, + "step": 993 + }, + { + "epoch": 0.03, + "learning_rate": 4.98995983935743e-06, + "loss": 1.1975, + "step": 994 + }, + { + "epoch": 0.03, + "learning_rate": 4.994979919678715e-06, + "loss": 1.1283, + "step": 995 + }, + { + "epoch": 0.03, + "learning_rate": 5e-06, + "loss": 1.1426, + "step": 996 + }, + { + "epoch": 0.03, + "learning_rate": 4.999999988100602e-06, + "loss": 1.0962, + "step": 997 + }, + { + "epoch": 0.03, + "learning_rate": 4.999999952402409e-06, + "loss": 1.1393, + "step": 998 + }, + { + "epoch": 0.03, + "learning_rate": 4.999999892905419e-06, + "loss": 1.2229, + "step": 999 + }, + { + "epoch": 0.03, + "learning_rate": 4.999999809609635e-06, + "loss": 1.1984, + "step": 1000 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999997025150566e-06, + "loss": 1.1069, + "step": 1001 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999995716216856e-06, + "loss": 1.2445, + "step": 1002 + }, + { + "epoch": 0.03, + "learning_rate": 4.999999416929522e-06, + "loss": 1.1068, + "step": 1003 + }, + { + "epoch": 0.03, + "learning_rate": 4.999999238438568e-06, + "loss": 1.1652, + "step": 1004 + }, + { + "epoch": 0.03, + "learning_rate": 4.999999036148825e-06, + "loss": 1.3651, + "step": 1005 + }, + { + "epoch": 0.03, + "learning_rate": 4.999998810060296e-06, + "loss": 1.2017, + "step": 1006 + }, + { + "epoch": 0.03, + "learning_rate": 4.999998560172981e-06, + "loss": 1.3706, + "step": 1007 + }, + { + "epoch": 0.03, + "learning_rate": 4.999998286486886e-06, + "loss": 1.147, + "step": 1008 + }, + { + "epoch": 0.03, + "learning_rate": 4.99999798900201e-06, + "loss": 1.1786, + "step": 1009 + }, + { + "epoch": 0.03, + "learning_rate": 4.999997667718357e-06, + "loss": 1.1466, + "step": 1010 + }, + { + "epoch": 0.03, + "learning_rate": 4.999997322635931e-06, + "loss": 1.1344, + "step": 1011 + }, + { + "epoch": 0.03, + "learning_rate": 4.999996953754734e-06, + "loss": 1.1438, + "step": 1012 + }, + { + "epoch": 0.03, + "learning_rate": 4.99999656107477e-06, + "loss": 1.1802, + "step": 1013 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999961445960435e-06, + "loss": 1.1579, + "step": 1014 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999957043185565e-06, + "loss": 1.1469, + "step": 1015 + }, + { + "epoch": 0.03, + "learning_rate": 4.999995240242315e-06, + "loss": 1.2335, + "step": 1016 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999947523673235e-06, + "loss": 1.1745, + "step": 1017 + }, + { + "epoch": 0.03, + "learning_rate": 4.999994240693585e-06, + "loss": 1.186, + "step": 1018 + }, + { + "epoch": 0.03, + "learning_rate": 4.999993705221106e-06, + "loss": 1.239, + "step": 1019 + }, + { + "epoch": 0.03, + "learning_rate": 4.999993145949891e-06, + "loss": 1.24, + "step": 1020 + }, + { + "epoch": 0.03, + "learning_rate": 4.999992562879945e-06, + "loss": 1.0895, + "step": 1021 + }, + { + "epoch": 0.03, + "learning_rate": 4.999991956011274e-06, + "loss": 1.2142, + "step": 1022 + }, + { + "epoch": 0.03, + "learning_rate": 4.999991325343883e-06, + "loss": 1.2047, + "step": 1023 + }, + { + "epoch": 0.03, + "learning_rate": 4.999990670877779e-06, + "loss": 1.1187, + "step": 1024 + }, + { + "epoch": 0.03, + "learning_rate": 4.999989992612968e-06, + "loss": 1.1071, + "step": 1025 + }, + { + "epoch": 0.03, + "learning_rate": 4.999989290549456e-06, + "loss": 1.1879, + "step": 1026 + }, + { + "epoch": 0.03, + "learning_rate": 4.999988564687251e-06, + "loss": 1.1371, + "step": 1027 + }, + { + "epoch": 0.03, + "learning_rate": 4.999987815026358e-06, + "loss": 1.0531, + "step": 1028 + }, + { + "epoch": 0.03, + "learning_rate": 4.999987041566785e-06, + "loss": 1.2164, + "step": 1029 + }, + { + "epoch": 0.03, + "learning_rate": 4.99998624430854e-06, + "loss": 1.1174, + "step": 1030 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999854232516295e-06, + "loss": 1.2925, + "step": 1031 + }, + { + "epoch": 0.03, + "learning_rate": 4.999984578396062e-06, + "loss": 1.2159, + "step": 1032 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999837097418455e-06, + "loss": 1.2043, + "step": 1033 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999828172889875e-06, + "loss": 1.1185, + "step": 1034 + }, + { + "epoch": 0.03, + "learning_rate": 4.999981901037498e-06, + "loss": 1.1368, + "step": 1035 + }, + { + "epoch": 0.03, + "learning_rate": 4.999980960987384e-06, + "loss": 1.0931, + "step": 1036 + }, + { + "epoch": 0.03, + "learning_rate": 4.999979997138656e-06, + "loss": 1.1481, + "step": 1037 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999790094913214e-06, + "loss": 1.1769, + "step": 1038 + }, + { + "epoch": 0.03, + "learning_rate": 4.999977998045391e-06, + "loss": 1.1815, + "step": 1039 + }, + { + "epoch": 0.03, + "learning_rate": 4.999976962800875e-06, + "loss": 1.1688, + "step": 1040 + }, + { + "epoch": 0.03, + "learning_rate": 4.999975903757782e-06, + "loss": 1.2178, + "step": 1041 + }, + { + "epoch": 0.03, + "learning_rate": 4.999974820916122e-06, + "loss": 1.3155, + "step": 1042 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999737142759054e-06, + "loss": 1.1658, + "step": 1043 + }, + { + "epoch": 0.03, + "learning_rate": 4.999972583837144e-06, + "loss": 1.2227, + "step": 1044 + }, + { + "epoch": 0.03, + "learning_rate": 4.999971429599847e-06, + "loss": 1.2305, + "step": 1045 + }, + { + "epoch": 0.03, + "learning_rate": 4.999970251564027e-06, + "loss": 1.1798, + "step": 1046 + }, + { + "epoch": 0.03, + "learning_rate": 4.999969049729693e-06, + "loss": 1.2107, + "step": 1047 + }, + { + "epoch": 0.03, + "learning_rate": 4.999967824096859e-06, + "loss": 1.229, + "step": 1048 + }, + { + "epoch": 0.03, + "learning_rate": 4.999966574665534e-06, + "loss": 1.2759, + "step": 1049 + }, + { + "epoch": 0.03, + "learning_rate": 4.999965301435731e-06, + "loss": 1.267, + "step": 1050 + }, + { + "epoch": 0.03, + "learning_rate": 4.999964004407463e-06, + "loss": 1.2127, + "step": 1051 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999626835807426e-06, + "loss": 1.2075, + "step": 1052 + }, + { + "epoch": 0.03, + "learning_rate": 4.99996133895558e-06, + "loss": 1.2308, + "step": 1053 + }, + { + "epoch": 0.03, + "learning_rate": 4.99995997053199e-06, + "loss": 1.1908, + "step": 1054 + }, + { + "epoch": 0.03, + "learning_rate": 4.999958578309986e-06, + "loss": 1.246, + "step": 1055 + }, + { + "epoch": 0.03, + "learning_rate": 4.999957162289579e-06, + "loss": 1.2063, + "step": 1056 + }, + { + "epoch": 0.03, + "learning_rate": 4.999955722470785e-06, + "loss": 1.2684, + "step": 1057 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999542588536155e-06, + "loss": 1.2144, + "step": 1058 + }, + { + "epoch": 0.03, + "learning_rate": 4.999952771438086e-06, + "loss": 1.215, + "step": 1059 + }, + { + "epoch": 0.03, + "learning_rate": 4.999951260224211e-06, + "loss": 1.1271, + "step": 1060 + }, + { + "epoch": 0.03, + "learning_rate": 4.999949725212002e-06, + "loss": 1.1584, + "step": 1061 + }, + { + "epoch": 0.03, + "learning_rate": 4.999948166401477e-06, + "loss": 1.2246, + "step": 1062 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999465837926495e-06, + "loss": 1.2926, + "step": 1063 + }, + { + "epoch": 0.03, + "learning_rate": 4.999944977385534e-06, + "loss": 1.2111, + "step": 1064 + }, + { + "epoch": 0.03, + "learning_rate": 4.999943347180146e-06, + "loss": 1.1289, + "step": 1065 + }, + { + "epoch": 0.03, + "learning_rate": 4.999941693176502e-06, + "loss": 1.1743, + "step": 1066 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999400153746174e-06, + "loss": 1.2651, + "step": 1067 + }, + { + "epoch": 0.03, + "learning_rate": 4.999938313774507e-06, + "loss": 1.2295, + "step": 1068 + }, + { + "epoch": 0.03, + "learning_rate": 4.999936588376189e-06, + "loss": 1.2891, + "step": 1069 + }, + { + "epoch": 0.03, + "learning_rate": 4.999934839179678e-06, + "loss": 1.2282, + "step": 1070 + }, + { + "epoch": 0.03, + "learning_rate": 4.999933066184991e-06, + "loss": 1.0869, + "step": 1071 + }, + { + "epoch": 0.03, + "learning_rate": 4.999931269392146e-06, + "loss": 1.1109, + "step": 1072 + }, + { + "epoch": 0.03, + "learning_rate": 4.999929448801159e-06, + "loss": 1.2327, + "step": 1073 + }, + { + "epoch": 0.03, + "learning_rate": 4.999927604412047e-06, + "loss": 1.2316, + "step": 1074 + }, + { + "epoch": 0.03, + "learning_rate": 4.999925736224829e-06, + "loss": 1.134, + "step": 1075 + }, + { + "epoch": 0.03, + "learning_rate": 4.999923844239522e-06, + "loss": 1.2374, + "step": 1076 + }, + { + "epoch": 0.03, + "learning_rate": 4.999921928456144e-06, + "loss": 1.0983, + "step": 1077 + }, + { + "epoch": 0.03, + "learning_rate": 4.9999199888747126e-06, + "loss": 1.2, + "step": 1078 + }, + { + "epoch": 0.03, + "learning_rate": 4.999918025495247e-06, + "loss": 1.1359, + "step": 1079 + }, + { + "epoch": 0.03, + "learning_rate": 4.999916038317767e-06, + "loss": 1.1466, + "step": 1080 + }, + { + "epoch": 0.03, + "learning_rate": 4.999914027342289e-06, + "loss": 1.1652, + "step": 1081 + }, + { + "epoch": 0.03, + "learning_rate": 4.999911992568835e-06, + "loss": 1.2798, + "step": 1082 + }, + { + "epoch": 0.03, + "learning_rate": 4.999909933997421e-06, + "loss": 1.1194, + "step": 1083 + }, + { + "epoch": 0.03, + "learning_rate": 4.999907851628069e-06, + "loss": 1.1921, + "step": 1084 + }, + { + "epoch": 0.03, + "learning_rate": 4.999905745460798e-06, + "loss": 1.1752, + "step": 1085 + }, + { + "epoch": 0.03, + "learning_rate": 4.999903615495629e-06, + "loss": 1.0582, + "step": 1086 + }, + { + "epoch": 0.03, + "learning_rate": 4.999901461732581e-06, + "loss": 1.2693, + "step": 1087 + }, + { + "epoch": 0.03, + "learning_rate": 4.9998992841716755e-06, + "loss": 1.1343, + "step": 1088 + }, + { + "epoch": 0.03, + "learning_rate": 4.999897082812933e-06, + "loss": 1.1774, + "step": 1089 + }, + { + "epoch": 0.03, + "learning_rate": 4.999894857656374e-06, + "loss": 1.1225, + "step": 1090 + }, + { + "epoch": 0.03, + "learning_rate": 4.99989260870202e-06, + "loss": 1.2132, + "step": 1091 + }, + { + "epoch": 0.03, + "learning_rate": 4.999890335949892e-06, + "loss": 1.252, + "step": 1092 + }, + { + "epoch": 0.03, + "learning_rate": 4.999888039400013e-06, + "loss": 1.3153, + "step": 1093 + }, + { + "epoch": 0.03, + "learning_rate": 4.999885719052402e-06, + "loss": 1.1531, + "step": 1094 + }, + { + "epoch": 0.03, + "learning_rate": 4.9998833749070844e-06, + "loss": 1.1693, + "step": 1095 + }, + { + "epoch": 0.03, + "learning_rate": 4.999881006964081e-06, + "loss": 1.1575, + "step": 1096 + }, + { + "epoch": 0.03, + "learning_rate": 4.999878615223414e-06, + "loss": 1.0947, + "step": 1097 + }, + { + "epoch": 0.03, + "learning_rate": 4.9998761996851064e-06, + "loss": 1.0804, + "step": 1098 + }, + { + "epoch": 0.03, + "learning_rate": 4.9998737603491824e-06, + "loss": 1.1156, + "step": 1099 + }, + { + "epoch": 0.03, + "learning_rate": 4.999871297215663e-06, + "loss": 1.3231, + "step": 1100 + }, + { + "epoch": 0.03, + "learning_rate": 4.999868810284573e-06, + "loss": 1.1637, + "step": 1101 + }, + { + "epoch": 0.03, + "learning_rate": 4.999866299555936e-06, + "loss": 1.0512, + "step": 1102 + }, + { + "epoch": 0.03, + "learning_rate": 4.999863765029776e-06, + "loss": 1.1562, + "step": 1103 + }, + { + "epoch": 0.03, + "learning_rate": 4.999861206706117e-06, + "loss": 1.3119, + "step": 1104 + }, + { + "epoch": 0.03, + "learning_rate": 4.999858624584983e-06, + "loss": 1.1174, + "step": 1105 + }, + { + "epoch": 0.03, + "learning_rate": 4.9998560186663995e-06, + "loss": 1.1951, + "step": 1106 + }, + { + "epoch": 0.03, + "learning_rate": 4.99985338895039e-06, + "loss": 1.2593, + "step": 1107 + }, + { + "epoch": 0.03, + "learning_rate": 4.99985073543698e-06, + "loss": 1.2359, + "step": 1108 + }, + { + "epoch": 0.03, + "learning_rate": 4.999848058126196e-06, + "loss": 1.167, + "step": 1109 + }, + { + "epoch": 0.03, + "learning_rate": 4.999845357018061e-06, + "loss": 1.1573, + "step": 1110 + }, + { + "epoch": 0.03, + "learning_rate": 4.999842632112603e-06, + "loss": 1.1613, + "step": 1111 + }, + { + "epoch": 0.03, + "learning_rate": 4.999839883409847e-06, + "loss": 1.2385, + "step": 1112 + }, + { + "epoch": 0.03, + "learning_rate": 4.99983711090982e-06, + "loss": 1.1591, + "step": 1113 + }, + { + "epoch": 0.03, + "learning_rate": 4.999834314612547e-06, + "loss": 1.1066, + "step": 1114 + }, + { + "epoch": 0.03, + "learning_rate": 4.999831494518055e-06, + "loss": 1.1952, + "step": 1115 + }, + { + "epoch": 0.03, + "learning_rate": 4.999828650626372e-06, + "loss": 1.2571, + "step": 1116 + }, + { + "epoch": 0.03, + "learning_rate": 4.999825782937523e-06, + "loss": 1.131, + "step": 1117 + }, + { + "epoch": 0.03, + "learning_rate": 4.999822891451537e-06, + "loss": 1.3179, + "step": 1118 + }, + { + "epoch": 0.03, + "learning_rate": 4.999819976168442e-06, + "loss": 1.1736, + "step": 1119 + }, + { + "epoch": 0.03, + "learning_rate": 4.999817037088264e-06, + "loss": 1.1879, + "step": 1120 + }, + { + "epoch": 0.03, + "learning_rate": 4.9998140742110315e-06, + "loss": 1.1242, + "step": 1121 + }, + { + "epoch": 0.03, + "learning_rate": 4.999811087536773e-06, + "loss": 1.1285, + "step": 1122 + }, + { + "epoch": 0.03, + "learning_rate": 4.9998080770655175e-06, + "loss": 0.9915, + "step": 1123 + }, + { + "epoch": 0.03, + "learning_rate": 4.999805042797292e-06, + "loss": 1.0958, + "step": 1124 + }, + { + "epoch": 0.03, + "learning_rate": 4.999801984732127e-06, + "loss": 1.3636, + "step": 1125 + }, + { + "epoch": 0.03, + "learning_rate": 4.9997989028700515e-06, + "loss": 1.1879, + "step": 1126 + }, + { + "epoch": 0.03, + "learning_rate": 4.999795797211094e-06, + "loss": 1.0811, + "step": 1127 + }, + { + "epoch": 0.03, + "learning_rate": 4.999792667755285e-06, + "loss": 1.1453, + "step": 1128 + }, + { + "epoch": 0.03, + "learning_rate": 4.999789514502653e-06, + "loss": 1.1284, + "step": 1129 + }, + { + "epoch": 0.03, + "learning_rate": 4.9997863374532285e-06, + "loss": 1.1063, + "step": 1130 + }, + { + "epoch": 0.03, + "learning_rate": 4.999783136607043e-06, + "loss": 1.2442, + "step": 1131 + }, + { + "epoch": 0.03, + "learning_rate": 4.9997799119641256e-06, + "loss": 1.2732, + "step": 1132 + }, + { + "epoch": 0.03, + "learning_rate": 4.999776663524507e-06, + "loss": 1.1505, + "step": 1133 + }, + { + "epoch": 0.03, + "learning_rate": 4.999773391288219e-06, + "loss": 1.1156, + "step": 1134 + }, + { + "epoch": 0.03, + "learning_rate": 4.999770095255292e-06, + "loss": 1.0813, + "step": 1135 + }, + { + "epoch": 0.03, + "learning_rate": 4.999766775425757e-06, + "loss": 1.0895, + "step": 1136 + }, + { + "epoch": 0.03, + "learning_rate": 4.9997634317996465e-06, + "loss": 1.136, + "step": 1137 + }, + { + "epoch": 0.03, + "learning_rate": 4.999760064376993e-06, + "loss": 1.1395, + "step": 1138 + }, + { + "epoch": 0.03, + "learning_rate": 4.9997566731578275e-06, + "loss": 1.2229, + "step": 1139 + }, + { + "epoch": 0.03, + "learning_rate": 4.999753258142182e-06, + "loss": 1.1729, + "step": 1140 + }, + { + "epoch": 0.03, + "learning_rate": 4.999749819330089e-06, + "loss": 1.1469, + "step": 1141 + }, + { + "epoch": 0.03, + "learning_rate": 4.999746356721582e-06, + "loss": 1.0867, + "step": 1142 + }, + { + "epoch": 0.03, + "learning_rate": 4.999742870316693e-06, + "loss": 1.1945, + "step": 1143 + }, + { + "epoch": 0.03, + "learning_rate": 4.999739360115457e-06, + "loss": 1.1962, + "step": 1144 + }, + { + "epoch": 0.03, + "learning_rate": 4.999735826117905e-06, + "loss": 1.2247, + "step": 1145 + }, + { + "epoch": 0.03, + "learning_rate": 4.999732268324073e-06, + "loss": 1.2083, + "step": 1146 + }, + { + "epoch": 0.03, + "learning_rate": 4.999728686733993e-06, + "loss": 1.2275, + "step": 1147 + }, + { + "epoch": 0.03, + "learning_rate": 4.9997250813477e-06, + "loss": 1.1683, + "step": 1148 + }, + { + "epoch": 0.03, + "learning_rate": 4.999721452165227e-06, + "loss": 1.3231, + "step": 1149 + }, + { + "epoch": 0.03, + "learning_rate": 4.999717799186611e-06, + "loss": 1.1262, + "step": 1150 + }, + { + "epoch": 0.03, + "learning_rate": 4.999714122411886e-06, + "loss": 1.2104, + "step": 1151 + }, + { + "epoch": 0.03, + "learning_rate": 4.999710421841085e-06, + "loss": 1.2039, + "step": 1152 + }, + { + "epoch": 0.03, + "learning_rate": 4.999706697474246e-06, + "loss": 1.1599, + "step": 1153 + }, + { + "epoch": 0.03, + "learning_rate": 4.9997029493114025e-06, + "loss": 1.2271, + "step": 1154 + }, + { + "epoch": 0.03, + "learning_rate": 4.999699177352591e-06, + "loss": 1.2039, + "step": 1155 + }, + { + "epoch": 0.03, + "learning_rate": 4.999695381597847e-06, + "loss": 1.2529, + "step": 1156 + }, + { + "epoch": 0.03, + "learning_rate": 4.999691562047206e-06, + "loss": 1.1265, + "step": 1157 + }, + { + "epoch": 0.03, + "learning_rate": 4.999687718700707e-06, + "loss": 1.1567, + "step": 1158 + }, + { + "epoch": 0.03, + "learning_rate": 4.999683851558383e-06, + "loss": 1.1328, + "step": 1159 + }, + { + "epoch": 0.03, + "learning_rate": 4.999679960620274e-06, + "loss": 1.2083, + "step": 1160 + }, + { + "epoch": 0.03, + "learning_rate": 4.999676045886415e-06, + "loss": 1.2819, + "step": 1161 + }, + { + "epoch": 0.04, + "learning_rate": 4.999672107356844e-06, + "loss": 1.1095, + "step": 1162 + }, + { + "epoch": 0.04, + "learning_rate": 4.999668145031598e-06, + "loss": 1.1825, + "step": 1163 + }, + { + "epoch": 0.04, + "learning_rate": 4.999664158910717e-06, + "loss": 1.1627, + "step": 1164 + }, + { + "epoch": 0.04, + "learning_rate": 4.999660148994235e-06, + "loss": 1.094, + "step": 1165 + }, + { + "epoch": 0.04, + "learning_rate": 4.999656115282194e-06, + "loss": 1.1273, + "step": 1166 + }, + { + "epoch": 0.04, + "learning_rate": 4.999652057774629e-06, + "loss": 1.1158, + "step": 1167 + }, + { + "epoch": 0.04, + "learning_rate": 4.999647976471581e-06, + "loss": 1.2076, + "step": 1168 + }, + { + "epoch": 0.04, + "learning_rate": 4.999643871373089e-06, + "loss": 1.1868, + "step": 1169 + }, + { + "epoch": 0.04, + "learning_rate": 4.99963974247919e-06, + "loss": 1.2659, + "step": 1170 + }, + { + "epoch": 0.04, + "learning_rate": 4.999635589789925e-06, + "loss": 1.1815, + "step": 1171 + }, + { + "epoch": 0.04, + "learning_rate": 4.999631413305332e-06, + "loss": 1.1712, + "step": 1172 + }, + { + "epoch": 0.04, + "learning_rate": 4.999627213025453e-06, + "loss": 1.2735, + "step": 1173 + }, + { + "epoch": 0.04, + "learning_rate": 4.999622988950326e-06, + "loss": 1.138, + "step": 1174 + }, + { + "epoch": 0.04, + "learning_rate": 4.9996187410799934e-06, + "loss": 1.1069, + "step": 1175 + }, + { + "epoch": 0.04, + "learning_rate": 4.999614469414493e-06, + "loss": 1.1376, + "step": 1176 + }, + { + "epoch": 0.04, + "learning_rate": 4.9996101739538674e-06, + "loss": 1.2384, + "step": 1177 + }, + { + "epoch": 0.04, + "learning_rate": 4.9996058546981565e-06, + "loss": 1.1655, + "step": 1178 + }, + { + "epoch": 0.04, + "learning_rate": 4.999601511647401e-06, + "loss": 1.1713, + "step": 1179 + }, + { + "epoch": 0.04, + "learning_rate": 4.999597144801645e-06, + "loss": 1.245, + "step": 1180 + }, + { + "epoch": 0.04, + "learning_rate": 4.999592754160925e-06, + "loss": 1.2135, + "step": 1181 + }, + { + "epoch": 0.04, + "learning_rate": 4.999588339725289e-06, + "loss": 1.169, + "step": 1182 + }, + { + "epoch": 0.04, + "learning_rate": 4.999583901494774e-06, + "loss": 1.1592, + "step": 1183 + }, + { + "epoch": 0.04, + "learning_rate": 4.999579439469424e-06, + "loss": 1.1116, + "step": 1184 + }, + { + "epoch": 0.04, + "learning_rate": 4.999574953649282e-06, + "loss": 1.26, + "step": 1185 + }, + { + "epoch": 0.04, + "learning_rate": 4.999570444034391e-06, + "loss": 1.2175, + "step": 1186 + }, + { + "epoch": 0.04, + "learning_rate": 4.9995659106247924e-06, + "loss": 1.2877, + "step": 1187 + }, + { + "epoch": 0.04, + "learning_rate": 4.99956135342053e-06, + "loss": 1.1498, + "step": 1188 + }, + { + "epoch": 0.04, + "learning_rate": 4.999556772421648e-06, + "loss": 1.1068, + "step": 1189 + }, + { + "epoch": 0.04, + "learning_rate": 4.999552167628189e-06, + "loss": 1.1841, + "step": 1190 + }, + { + "epoch": 0.04, + "learning_rate": 4.999547539040197e-06, + "loss": 1.1891, + "step": 1191 + }, + { + "epoch": 0.04, + "learning_rate": 4.999542886657717e-06, + "loss": 1.1678, + "step": 1192 + }, + { + "epoch": 0.04, + "learning_rate": 4.999538210480791e-06, + "loss": 1.1044, + "step": 1193 + }, + { + "epoch": 0.04, + "learning_rate": 4.9995335105094666e-06, + "loss": 1.1766, + "step": 1194 + }, + { + "epoch": 0.04, + "learning_rate": 4.999528786743786e-06, + "loss": 1.2372, + "step": 1195 + }, + { + "epoch": 0.04, + "learning_rate": 4.999524039183796e-06, + "loss": 1.2316, + "step": 1196 + }, + { + "epoch": 0.04, + "learning_rate": 4.99951926782954e-06, + "loss": 1.1304, + "step": 1197 + }, + { + "epoch": 0.04, + "learning_rate": 4.9995144726810655e-06, + "loss": 1.2412, + "step": 1198 + }, + { + "epoch": 0.04, + "learning_rate": 4.999509653738416e-06, + "loss": 1.2106, + "step": 1199 + }, + { + "epoch": 0.04, + "learning_rate": 4.999504811001639e-06, + "loss": 1.354, + "step": 1200 + }, + { + "epoch": 0.04, + "learning_rate": 4.99949994447078e-06, + "loss": 1.1395, + "step": 1201 + }, + { + "epoch": 0.04, + "learning_rate": 4.9994950541458855e-06, + "loss": 1.1293, + "step": 1202 + }, + { + "epoch": 0.04, + "learning_rate": 4.999490140027001e-06, + "loss": 1.2606, + "step": 1203 + }, + { + "epoch": 0.04, + "learning_rate": 4.999485202114175e-06, + "loss": 1.3185, + "step": 1204 + }, + { + "epoch": 0.04, + "learning_rate": 4.999480240407453e-06, + "loss": 1.1711, + "step": 1205 + }, + { + "epoch": 0.04, + "learning_rate": 4.999475254906884e-06, + "loss": 1.3495, + "step": 1206 + }, + { + "epoch": 0.04, + "learning_rate": 4.999470245612513e-06, + "loss": 1.1733, + "step": 1207 + }, + { + "epoch": 0.04, + "learning_rate": 4.999465212524389e-06, + "loss": 1.1832, + "step": 1208 + }, + { + "epoch": 0.04, + "learning_rate": 4.9994601556425615e-06, + "loss": 1.1779, + "step": 1209 + }, + { + "epoch": 0.04, + "learning_rate": 4.999455074967076e-06, + "loss": 1.1512, + "step": 1210 + }, + { + "epoch": 0.04, + "learning_rate": 4.999449970497982e-06, + "loss": 1.2108, + "step": 1211 + }, + { + "epoch": 0.04, + "learning_rate": 4.999444842235328e-06, + "loss": 1.0408, + "step": 1212 + }, + { + "epoch": 0.04, + "learning_rate": 4.999439690179164e-06, + "loss": 1.1809, + "step": 1213 + }, + { + "epoch": 0.04, + "learning_rate": 4.999434514329537e-06, + "loss": 1.2138, + "step": 1214 + }, + { + "epoch": 0.04, + "learning_rate": 4.999429314686497e-06, + "loss": 1.1673, + "step": 1215 + }, + { + "epoch": 0.04, + "learning_rate": 4.999424091250094e-06, + "loss": 1.1631, + "step": 1216 + }, + { + "epoch": 0.04, + "learning_rate": 4.999418844020377e-06, + "loss": 1.0941, + "step": 1217 + }, + { + "epoch": 0.04, + "learning_rate": 4.999413572997397e-06, + "loss": 1.1931, + "step": 1218 + }, + { + "epoch": 0.04, + "learning_rate": 4.999408278181204e-06, + "loss": 1.1434, + "step": 1219 + }, + { + "epoch": 0.04, + "learning_rate": 4.9994029595718465e-06, + "loss": 1.1359, + "step": 1220 + }, + { + "epoch": 0.04, + "learning_rate": 4.999397617169378e-06, + "loss": 1.1174, + "step": 1221 + }, + { + "epoch": 0.04, + "learning_rate": 4.999392250973847e-06, + "loss": 1.2052, + "step": 1222 + }, + { + "epoch": 0.04, + "learning_rate": 4.999386860985306e-06, + "loss": 1.0711, + "step": 1223 + }, + { + "epoch": 0.04, + "learning_rate": 4.999381447203805e-06, + "loss": 1.2848, + "step": 1224 + }, + { + "epoch": 0.04, + "learning_rate": 4.999376009629398e-06, + "loss": 1.1804, + "step": 1225 + }, + { + "epoch": 0.04, + "learning_rate": 4.999370548262133e-06, + "loss": 1.1987, + "step": 1226 + }, + { + "epoch": 0.04, + "learning_rate": 4.999365063102065e-06, + "loss": 1.2681, + "step": 1227 + }, + { + "epoch": 0.04, + "learning_rate": 4.999359554149246e-06, + "loss": 1.2072, + "step": 1228 + }, + { + "epoch": 0.04, + "learning_rate": 4.999354021403727e-06, + "loss": 1.1793, + "step": 1229 + }, + { + "epoch": 0.04, + "learning_rate": 4.999348464865562e-06, + "loss": 1.1714, + "step": 1230 + }, + { + "epoch": 0.04, + "learning_rate": 4.999342884534804e-06, + "loss": 1.2401, + "step": 1231 + }, + { + "epoch": 0.04, + "learning_rate": 4.999337280411503e-06, + "loss": 1.2133, + "step": 1232 + }, + { + "epoch": 0.04, + "learning_rate": 4.999331652495717e-06, + "loss": 1.1494, + "step": 1233 + }, + { + "epoch": 0.04, + "learning_rate": 4.999326000787497e-06, + "loss": 1.1611, + "step": 1234 + }, + { + "epoch": 0.04, + "learning_rate": 4.999320325286897e-06, + "loss": 1.1602, + "step": 1235 + }, + { + "epoch": 0.04, + "learning_rate": 4.999314625993971e-06, + "loss": 1.2863, + "step": 1236 + }, + { + "epoch": 0.04, + "learning_rate": 4.999308902908774e-06, + "loss": 1.1766, + "step": 1237 + }, + { + "epoch": 0.04, + "learning_rate": 4.9993031560313594e-06, + "loss": 1.103, + "step": 1238 + }, + { + "epoch": 0.04, + "learning_rate": 4.999297385361783e-06, + "loss": 1.2174, + "step": 1239 + }, + { + "epoch": 0.04, + "learning_rate": 4.999291590900099e-06, + "loss": 1.2678, + "step": 1240 + }, + { + "epoch": 0.04, + "learning_rate": 4.9992857726463626e-06, + "loss": 1.1274, + "step": 1241 + }, + { + "epoch": 0.04, + "learning_rate": 4.999279930600629e-06, + "loss": 1.1638, + "step": 1242 + }, + { + "epoch": 0.04, + "learning_rate": 4.999274064762954e-06, + "loss": 1.1029, + "step": 1243 + }, + { + "epoch": 0.04, + "learning_rate": 4.999268175133395e-06, + "loss": 1.1553, + "step": 1244 + }, + { + "epoch": 0.04, + "learning_rate": 4.999262261712006e-06, + "loss": 1.0764, + "step": 1245 + }, + { + "epoch": 0.04, + "learning_rate": 4.999256324498843e-06, + "loss": 1.173, + "step": 1246 + }, + { + "epoch": 0.04, + "learning_rate": 4.999250363493964e-06, + "loss": 0.9943, + "step": 1247 + }, + { + "epoch": 0.04, + "learning_rate": 4.999244378697425e-06, + "loss": 1.2067, + "step": 1248 + }, + { + "epoch": 0.04, + "learning_rate": 4.999238370109284e-06, + "loss": 1.2059, + "step": 1249 + }, + { + "epoch": 0.04, + "learning_rate": 4.999232337729597e-06, + "loss": 1.1521, + "step": 1250 + }, + { + "epoch": 0.04, + "learning_rate": 4.999226281558423e-06, + "loss": 1.1582, + "step": 1251 + }, + { + "epoch": 0.04, + "learning_rate": 4.999220201595816e-06, + "loss": 1.1216, + "step": 1252 + }, + { + "epoch": 0.04, + "learning_rate": 4.999214097841838e-06, + "loss": 1.2056, + "step": 1253 + }, + { + "epoch": 0.04, + "learning_rate": 4.999207970296545e-06, + "loss": 1.1163, + "step": 1254 + }, + { + "epoch": 0.04, + "learning_rate": 4.999201818959996e-06, + "loss": 1.2896, + "step": 1255 + }, + { + "epoch": 0.04, + "learning_rate": 4.99919564383225e-06, + "loss": 1.2651, + "step": 1256 + }, + { + "epoch": 0.04, + "learning_rate": 4.999189444913364e-06, + "loss": 1.1967, + "step": 1257 + }, + { + "epoch": 0.04, + "learning_rate": 4.999183222203398e-06, + "loss": 1.1393, + "step": 1258 + }, + { + "epoch": 0.04, + "learning_rate": 4.999176975702413e-06, + "loss": 1.171, + "step": 1259 + }, + { + "epoch": 0.04, + "learning_rate": 4.999170705410464e-06, + "loss": 1.1812, + "step": 1260 + }, + { + "epoch": 0.04, + "learning_rate": 4.999164411327616e-06, + "loss": 1.1964, + "step": 1261 + }, + { + "epoch": 0.04, + "learning_rate": 4.999158093453925e-06, + "loss": 1.043, + "step": 1262 + }, + { + "epoch": 0.04, + "learning_rate": 4.999151751789454e-06, + "loss": 1.1852, + "step": 1263 + }, + { + "epoch": 0.04, + "learning_rate": 4.999145386334261e-06, + "loss": 1.2063, + "step": 1264 + }, + { + "epoch": 0.04, + "learning_rate": 4.999138997088407e-06, + "loss": 1.202, + "step": 1265 + }, + { + "epoch": 0.04, + "learning_rate": 4.999132584051954e-06, + "loss": 1.1888, + "step": 1266 + }, + { + "epoch": 0.04, + "learning_rate": 4.999126147224963e-06, + "loss": 1.19, + "step": 1267 + }, + { + "epoch": 0.04, + "learning_rate": 4.999119686607494e-06, + "loss": 1.2333, + "step": 1268 + }, + { + "epoch": 0.04, + "learning_rate": 4.9991132021996105e-06, + "loss": 1.1625, + "step": 1269 + }, + { + "epoch": 0.04, + "learning_rate": 4.999106694001371e-06, + "loss": 1.2666, + "step": 1270 + }, + { + "epoch": 0.04, + "learning_rate": 4.999100162012841e-06, + "loss": 1.1904, + "step": 1271 + }, + { + "epoch": 0.04, + "learning_rate": 4.99909360623408e-06, + "loss": 1.2199, + "step": 1272 + }, + { + "epoch": 0.04, + "learning_rate": 4.9990870266651515e-06, + "loss": 1.182, + "step": 1273 + }, + { + "epoch": 0.04, + "learning_rate": 4.9990804233061185e-06, + "loss": 1.2786, + "step": 1274 + }, + { + "epoch": 0.04, + "learning_rate": 4.999073796157044e-06, + "loss": 1.2375, + "step": 1275 + }, + { + "epoch": 0.04, + "learning_rate": 4.99906714521799e-06, + "loss": 1.1514, + "step": 1276 + }, + { + "epoch": 0.04, + "learning_rate": 4.99906047048902e-06, + "loss": 1.1731, + "step": 1277 + }, + { + "epoch": 0.04, + "learning_rate": 4.9990537719701986e-06, + "loss": 1.1437, + "step": 1278 + }, + { + "epoch": 0.04, + "learning_rate": 4.999047049661588e-06, + "loss": 1.1893, + "step": 1279 + }, + { + "epoch": 0.04, + "learning_rate": 4.999040303563253e-06, + "loss": 1.27, + "step": 1280 + }, + { + "epoch": 0.04, + "learning_rate": 4.999033533675258e-06, + "loss": 1.0272, + "step": 1281 + }, + { + "epoch": 0.04, + "learning_rate": 4.999026739997668e-06, + "loss": 1.0569, + "step": 1282 + }, + { + "epoch": 0.04, + "learning_rate": 4.999019922530547e-06, + "loss": 1.1085, + "step": 1283 + }, + { + "epoch": 0.04, + "learning_rate": 4.99901308127396e-06, + "loss": 1.2321, + "step": 1284 + }, + { + "epoch": 0.04, + "learning_rate": 4.999006216227972e-06, + "loss": 1.1481, + "step": 1285 + }, + { + "epoch": 0.04, + "learning_rate": 4.998999327392648e-06, + "loss": 1.2579, + "step": 1286 + }, + { + "epoch": 0.04, + "learning_rate": 4.998992414768054e-06, + "loss": 1.1197, + "step": 1287 + }, + { + "epoch": 0.04, + "learning_rate": 4.998985478354255e-06, + "loss": 1.1748, + "step": 1288 + }, + { + "epoch": 0.04, + "learning_rate": 4.998978518151319e-06, + "loss": 1.3066, + "step": 1289 + }, + { + "epoch": 0.04, + "learning_rate": 4.998971534159311e-06, + "loss": 1.1998, + "step": 1290 + }, + { + "epoch": 0.04, + "learning_rate": 4.998964526378297e-06, + "loss": 1.1135, + "step": 1291 + }, + { + "epoch": 0.04, + "learning_rate": 4.998957494808345e-06, + "loss": 1.0623, + "step": 1292 + }, + { + "epoch": 0.04, + "learning_rate": 4.998950439449521e-06, + "loss": 1.228, + "step": 1293 + }, + { + "epoch": 0.04, + "learning_rate": 4.998943360301891e-06, + "loss": 1.1464, + "step": 1294 + }, + { + "epoch": 0.04, + "learning_rate": 4.9989362573655255e-06, + "loss": 1.3088, + "step": 1295 + }, + { + "epoch": 0.04, + "learning_rate": 4.998929130640489e-06, + "loss": 1.1648, + "step": 1296 + }, + { + "epoch": 0.04, + "learning_rate": 4.998921980126852e-06, + "loss": 1.2195, + "step": 1297 + }, + { + "epoch": 0.04, + "learning_rate": 4.99891480582468e-06, + "loss": 1.3085, + "step": 1298 + }, + { + "epoch": 0.04, + "learning_rate": 4.998907607734044e-06, + "loss": 1.2379, + "step": 1299 + }, + { + "epoch": 0.04, + "learning_rate": 4.998900385855009e-06, + "loss": 1.1582, + "step": 1300 + }, + { + "epoch": 0.04, + "learning_rate": 4.998893140187647e-06, + "loss": 1.1902, + "step": 1301 + }, + { + "epoch": 0.04, + "learning_rate": 4.9988858707320265e-06, + "loss": 1.1809, + "step": 1302 + }, + { + "epoch": 0.04, + "learning_rate": 4.998878577488216e-06, + "loss": 1.0931, + "step": 1303 + }, + { + "epoch": 0.04, + "learning_rate": 4.998871260456284e-06, + "loss": 1.2208, + "step": 1304 + }, + { + "epoch": 0.04, + "learning_rate": 4.998863919636301e-06, + "loss": 1.1002, + "step": 1305 + }, + { + "epoch": 0.04, + "learning_rate": 4.998856555028337e-06, + "loss": 1.2803, + "step": 1306 + }, + { + "epoch": 0.04, + "learning_rate": 4.9988491666324636e-06, + "loss": 1.1996, + "step": 1307 + }, + { + "epoch": 0.04, + "learning_rate": 4.998841754448749e-06, + "loss": 1.2308, + "step": 1308 + }, + { + "epoch": 0.04, + "learning_rate": 4.998834318477263e-06, + "loss": 1.1825, + "step": 1309 + }, + { + "epoch": 0.04, + "learning_rate": 4.998826858718079e-06, + "loss": 1.2411, + "step": 1310 + }, + { + "epoch": 0.04, + "learning_rate": 4.998819375171267e-06, + "loss": 1.1585, + "step": 1311 + }, + { + "epoch": 0.04, + "learning_rate": 4.998811867836897e-06, + "loss": 1.2182, + "step": 1312 + }, + { + "epoch": 0.04, + "learning_rate": 4.9988043367150415e-06, + "loss": 1.2373, + "step": 1313 + }, + { + "epoch": 0.04, + "learning_rate": 4.9987967818057735e-06, + "loss": 1.1693, + "step": 1314 + }, + { + "epoch": 0.04, + "learning_rate": 4.9987892031091624e-06, + "loss": 1.1127, + "step": 1315 + }, + { + "epoch": 0.04, + "learning_rate": 4.998781600625282e-06, + "loss": 1.2482, + "step": 1316 + }, + { + "epoch": 0.04, + "learning_rate": 4.998773974354204e-06, + "loss": 1.1218, + "step": 1317 + }, + { + "epoch": 0.04, + "learning_rate": 4.998766324296001e-06, + "loss": 1.3101, + "step": 1318 + }, + { + "epoch": 0.04, + "learning_rate": 4.998758650450747e-06, + "loss": 1.2413, + "step": 1319 + }, + { + "epoch": 0.04, + "learning_rate": 4.998750952818513e-06, + "loss": 1.0904, + "step": 1320 + }, + { + "epoch": 0.04, + "learning_rate": 4.998743231399374e-06, + "loss": 1.1758, + "step": 1321 + }, + { + "epoch": 0.04, + "learning_rate": 4.9987354861934025e-06, + "loss": 1.1472, + "step": 1322 + }, + { + "epoch": 0.04, + "learning_rate": 4.998727717200673e-06, + "loss": 1.1378, + "step": 1323 + }, + { + "epoch": 0.04, + "learning_rate": 4.998719924421259e-06, + "loss": 1.3068, + "step": 1324 + }, + { + "epoch": 0.04, + "learning_rate": 4.998712107855235e-06, + "loss": 1.183, + "step": 1325 + }, + { + "epoch": 0.04, + "learning_rate": 4.998704267502674e-06, + "loss": 1.3583, + "step": 1326 + }, + { + "epoch": 0.04, + "learning_rate": 4.998696403363653e-06, + "loss": 1.1131, + "step": 1327 + }, + { + "epoch": 0.04, + "learning_rate": 4.998688515438245e-06, + "loss": 1.1979, + "step": 1328 + }, + { + "epoch": 0.04, + "learning_rate": 4.998680603726526e-06, + "loss": 1.1226, + "step": 1329 + }, + { + "epoch": 0.04, + "learning_rate": 4.9986726682285715e-06, + "loss": 1.1897, + "step": 1330 + }, + { + "epoch": 0.04, + "learning_rate": 4.998664708944456e-06, + "loss": 1.2422, + "step": 1331 + }, + { + "epoch": 0.04, + "learning_rate": 4.9986567258742555e-06, + "loss": 1.1536, + "step": 1332 + }, + { + "epoch": 0.04, + "learning_rate": 4.998648719018047e-06, + "loss": 1.2736, + "step": 1333 + }, + { + "epoch": 0.04, + "learning_rate": 4.998640688375906e-06, + "loss": 1.1761, + "step": 1334 + }, + { + "epoch": 0.04, + "learning_rate": 4.998632633947909e-06, + "loss": 1.1676, + "step": 1335 + }, + { + "epoch": 0.04, + "learning_rate": 4.998624555734133e-06, + "loss": 1.1616, + "step": 1336 + }, + { + "epoch": 0.04, + "learning_rate": 4.998616453734654e-06, + "loss": 1.2911, + "step": 1337 + }, + { + "epoch": 0.04, + "learning_rate": 4.99860832794955e-06, + "loss": 1.298, + "step": 1338 + }, + { + "epoch": 0.04, + "learning_rate": 4.9986001783788985e-06, + "loss": 1.3102, + "step": 1339 + }, + { + "epoch": 0.04, + "learning_rate": 4.998592005022776e-06, + "loss": 1.1874, + "step": 1340 + }, + { + "epoch": 0.04, + "learning_rate": 4.998583807881261e-06, + "loss": 1.0962, + "step": 1341 + }, + { + "epoch": 0.04, + "learning_rate": 4.998575586954432e-06, + "loss": 1.1724, + "step": 1342 + }, + { + "epoch": 0.04, + "learning_rate": 4.998567342242366e-06, + "loss": 1.1174, + "step": 1343 + }, + { + "epoch": 0.04, + "learning_rate": 4.9985590737451425e-06, + "loss": 1.2355, + "step": 1344 + }, + { + "epoch": 0.04, + "learning_rate": 4.998550781462841e-06, + "loss": 1.1818, + "step": 1345 + }, + { + "epoch": 0.04, + "learning_rate": 4.998542465395538e-06, + "loss": 1.1931, + "step": 1346 + }, + { + "epoch": 0.04, + "learning_rate": 4.998534125543315e-06, + "loss": 1.1846, + "step": 1347 + }, + { + "epoch": 0.04, + "learning_rate": 4.99852576190625e-06, + "loss": 1.1802, + "step": 1348 + }, + { + "epoch": 0.04, + "learning_rate": 4.998517374484424e-06, + "loss": 1.2102, + "step": 1349 + }, + { + "epoch": 0.04, + "learning_rate": 4.998508963277915e-06, + "loss": 1.3833, + "step": 1350 + }, + { + "epoch": 0.04, + "learning_rate": 4.998500528286804e-06, + "loss": 1.1958, + "step": 1351 + }, + { + "epoch": 0.04, + "learning_rate": 4.998492069511171e-06, + "loss": 1.2758, + "step": 1352 + }, + { + "epoch": 0.04, + "learning_rate": 4.998483586951098e-06, + "loss": 1.1449, + "step": 1353 + }, + { + "epoch": 0.04, + "learning_rate": 4.998475080606664e-06, + "loss": 1.0632, + "step": 1354 + }, + { + "epoch": 0.04, + "learning_rate": 4.99846655047795e-06, + "loss": 1.209, + "step": 1355 + }, + { + "epoch": 0.04, + "learning_rate": 4.998457996565038e-06, + "loss": 1.1489, + "step": 1356 + }, + { + "epoch": 0.04, + "learning_rate": 4.99844941886801e-06, + "loss": 1.217, + "step": 1357 + }, + { + "epoch": 0.04, + "learning_rate": 4.998440817386946e-06, + "loss": 1.2353, + "step": 1358 + }, + { + "epoch": 0.04, + "learning_rate": 4.998432192121929e-06, + "loss": 1.1604, + "step": 1359 + }, + { + "epoch": 0.04, + "learning_rate": 4.9984235430730395e-06, + "loss": 1.1613, + "step": 1360 + }, + { + "epoch": 0.04, + "learning_rate": 4.998414870240364e-06, + "loss": 1.1868, + "step": 1361 + }, + { + "epoch": 0.04, + "learning_rate": 4.99840617362398e-06, + "loss": 1.2488, + "step": 1362 + }, + { + "epoch": 0.04, + "learning_rate": 4.998397453223973e-06, + "loss": 1.1479, + "step": 1363 + }, + { + "epoch": 0.04, + "learning_rate": 4.9983887090404245e-06, + "loss": 1.1649, + "step": 1364 + }, + { + "epoch": 0.04, + "learning_rate": 4.99837994107342e-06, + "loss": 1.1569, + "step": 1365 + }, + { + "epoch": 0.04, + "learning_rate": 4.998371149323042e-06, + "loss": 1.0776, + "step": 1366 + }, + { + "epoch": 0.04, + "learning_rate": 4.998362333789374e-06, + "loss": 1.2302, + "step": 1367 + }, + { + "epoch": 0.04, + "learning_rate": 4.998353494472499e-06, + "loss": 1.2625, + "step": 1368 + }, + { + "epoch": 0.04, + "learning_rate": 4.998344631372501e-06, + "loss": 1.0291, + "step": 1369 + }, + { + "epoch": 0.04, + "learning_rate": 4.9983357444894674e-06, + "loss": 1.2343, + "step": 1370 + }, + { + "epoch": 0.04, + "learning_rate": 4.998326833823481e-06, + "loss": 1.0707, + "step": 1371 + }, + { + "epoch": 0.04, + "learning_rate": 4.998317899374624e-06, + "loss": 1.2134, + "step": 1372 + }, + { + "epoch": 0.04, + "learning_rate": 4.998308941142985e-06, + "loss": 1.222, + "step": 1373 + }, + { + "epoch": 0.04, + "learning_rate": 4.998299959128649e-06, + "loss": 1.1685, + "step": 1374 + }, + { + "epoch": 0.04, + "learning_rate": 4.9982909533316996e-06, + "loss": 1.2791, + "step": 1375 + }, + { + "epoch": 0.04, + "learning_rate": 4.998281923752224e-06, + "loss": 1.1735, + "step": 1376 + }, + { + "epoch": 0.04, + "learning_rate": 4.998272870390307e-06, + "loss": 1.1858, + "step": 1377 + }, + { + "epoch": 0.04, + "learning_rate": 4.998263793246036e-06, + "loss": 1.1583, + "step": 1378 + }, + { + "epoch": 0.04, + "learning_rate": 4.998254692319497e-06, + "loss": 1.1561, + "step": 1379 + }, + { + "epoch": 0.04, + "learning_rate": 4.9982455676107765e-06, + "loss": 1.2388, + "step": 1380 + }, + { + "epoch": 0.04, + "learning_rate": 4.998236419119962e-06, + "loss": 1.1078, + "step": 1381 + }, + { + "epoch": 0.04, + "learning_rate": 4.998227246847139e-06, + "loss": 1.1591, + "step": 1382 + }, + { + "epoch": 0.04, + "learning_rate": 4.998218050792396e-06, + "loss": 1.2454, + "step": 1383 + }, + { + "epoch": 0.04, + "learning_rate": 4.99820883095582e-06, + "loss": 1.1569, + "step": 1384 + }, + { + "epoch": 0.04, + "learning_rate": 4.9981995873375e-06, + "loss": 1.175, + "step": 1385 + }, + { + "epoch": 0.04, + "learning_rate": 4.998190319937522e-06, + "loss": 1.2799, + "step": 1386 + }, + { + "epoch": 0.04, + "learning_rate": 4.998181028755976e-06, + "loss": 1.1968, + "step": 1387 + }, + { + "epoch": 0.04, + "learning_rate": 4.99817171379295e-06, + "loss": 1.2042, + "step": 1388 + }, + { + "epoch": 0.04, + "learning_rate": 4.998162375048532e-06, + "loss": 1.1487, + "step": 1389 + }, + { + "epoch": 0.04, + "learning_rate": 4.998153012522812e-06, + "loss": 1.157, + "step": 1390 + }, + { + "epoch": 0.04, + "learning_rate": 4.9981436262158775e-06, + "loss": 1.1346, + "step": 1391 + }, + { + "epoch": 0.04, + "learning_rate": 4.99813421612782e-06, + "loss": 1.2218, + "step": 1392 + }, + { + "epoch": 0.04, + "learning_rate": 4.998124782258727e-06, + "loss": 1.2579, + "step": 1393 + }, + { + "epoch": 0.04, + "learning_rate": 4.9981153246086895e-06, + "loss": 1.191, + "step": 1394 + }, + { + "epoch": 0.04, + "learning_rate": 4.998105843177797e-06, + "loss": 1.1713, + "step": 1395 + }, + { + "epoch": 0.04, + "learning_rate": 4.99809633796614e-06, + "loss": 1.1553, + "step": 1396 + }, + { + "epoch": 0.04, + "learning_rate": 4.998086808973809e-06, + "loss": 1.0659, + "step": 1397 + }, + { + "epoch": 0.04, + "learning_rate": 4.998077256200895e-06, + "loss": 1.2234, + "step": 1398 + }, + { + "epoch": 0.04, + "learning_rate": 4.99806767964749e-06, + "loss": 1.2722, + "step": 1399 + }, + { + "epoch": 0.04, + "learning_rate": 4.998058079313681e-06, + "loss": 1.185, + "step": 1400 + }, + { + "epoch": 0.04, + "learning_rate": 4.998048455199563e-06, + "loss": 1.2054, + "step": 1401 + }, + { + "epoch": 0.04, + "learning_rate": 4.998038807305228e-06, + "loss": 1.1964, + "step": 1402 + }, + { + "epoch": 0.04, + "learning_rate": 4.998029135630766e-06, + "loss": 1.0212, + "step": 1403 + }, + { + "epoch": 0.04, + "learning_rate": 4.99801944017627e-06, + "loss": 1.2871, + "step": 1404 + }, + { + "epoch": 0.04, + "learning_rate": 4.998009720941831e-06, + "loss": 1.2743, + "step": 1405 + }, + { + "epoch": 0.04, + "learning_rate": 4.997999977927543e-06, + "loss": 1.2203, + "step": 1406 + }, + { + "epoch": 0.04, + "learning_rate": 4.997990211133499e-06, + "loss": 1.1323, + "step": 1407 + }, + { + "epoch": 0.04, + "learning_rate": 4.997980420559791e-06, + "loss": 1.2367, + "step": 1408 + }, + { + "epoch": 0.04, + "learning_rate": 4.997970606206512e-06, + "loss": 1.142, + "step": 1409 + }, + { + "epoch": 0.04, + "learning_rate": 4.9979607680737565e-06, + "loss": 1.2618, + "step": 1410 + }, + { + "epoch": 0.04, + "learning_rate": 4.997950906161617e-06, + "loss": 1.1359, + "step": 1411 + }, + { + "epoch": 0.04, + "learning_rate": 4.997941020470188e-06, + "loss": 1.3521, + "step": 1412 + }, + { + "epoch": 0.04, + "learning_rate": 4.997931110999564e-06, + "loss": 1.3456, + "step": 1413 + }, + { + "epoch": 0.04, + "learning_rate": 4.9979211777498386e-06, + "loss": 1.1636, + "step": 1414 + }, + { + "epoch": 0.04, + "learning_rate": 4.997911220721107e-06, + "loss": 1.1298, + "step": 1415 + }, + { + "epoch": 0.04, + "learning_rate": 4.997901239913462e-06, + "loss": 1.145, + "step": 1416 + }, + { + "epoch": 0.04, + "learning_rate": 4.997891235327002e-06, + "loss": 1.1483, + "step": 1417 + }, + { + "epoch": 0.04, + "learning_rate": 4.99788120696182e-06, + "loss": 1.1073, + "step": 1418 + }, + { + "epoch": 0.04, + "learning_rate": 4.997871154818011e-06, + "loss": 1.2251, + "step": 1419 + }, + { + "epoch": 0.04, + "learning_rate": 4.997861078895673e-06, + "loss": 1.2023, + "step": 1420 + }, + { + "epoch": 0.04, + "learning_rate": 4.9978509791949e-06, + "loss": 1.1567, + "step": 1421 + }, + { + "epoch": 0.04, + "learning_rate": 4.997840855715789e-06, + "loss": 1.0558, + "step": 1422 + }, + { + "epoch": 0.04, + "learning_rate": 4.997830708458435e-06, + "loss": 1.1428, + "step": 1423 + }, + { + "epoch": 0.04, + "learning_rate": 4.997820537422936e-06, + "loss": 1.2295, + "step": 1424 + }, + { + "epoch": 0.04, + "learning_rate": 4.99781034260939e-06, + "loss": 1.2659, + "step": 1425 + }, + { + "epoch": 0.04, + "learning_rate": 4.997800124017891e-06, + "loss": 1.3099, + "step": 1426 + }, + { + "epoch": 0.04, + "learning_rate": 4.997789881648538e-06, + "loss": 1.0925, + "step": 1427 + }, + { + "epoch": 0.04, + "learning_rate": 4.997779615501428e-06, + "loss": 1.1285, + "step": 1428 + }, + { + "epoch": 0.04, + "learning_rate": 4.99776932557666e-06, + "loss": 1.111, + "step": 1429 + }, + { + "epoch": 0.04, + "learning_rate": 4.997759011874331e-06, + "loss": 1.2139, + "step": 1430 + }, + { + "epoch": 0.04, + "learning_rate": 4.997748674394538e-06, + "loss": 1.2056, + "step": 1431 + }, + { + "epoch": 0.04, + "learning_rate": 4.997738313137381e-06, + "loss": 1.2531, + "step": 1432 + }, + { + "epoch": 0.04, + "learning_rate": 4.997727928102959e-06, + "loss": 1.1431, + "step": 1433 + }, + { + "epoch": 0.04, + "learning_rate": 4.997717519291369e-06, + "loss": 1.1631, + "step": 1434 + }, + { + "epoch": 0.04, + "learning_rate": 4.997707086702711e-06, + "loss": 1.1643, + "step": 1435 + }, + { + "epoch": 0.04, + "learning_rate": 4.9976966303370855e-06, + "loss": 1.1473, + "step": 1436 + }, + { + "epoch": 0.04, + "learning_rate": 4.997686150194591e-06, + "loss": 1.0486, + "step": 1437 + }, + { + "epoch": 0.04, + "learning_rate": 4.997675646275328e-06, + "loss": 1.1455, + "step": 1438 + }, + { + "epoch": 0.04, + "learning_rate": 4.997665118579394e-06, + "loss": 1.1986, + "step": 1439 + }, + { + "epoch": 0.04, + "learning_rate": 4.997654567106891e-06, + "loss": 1.1876, + "step": 1440 + }, + { + "epoch": 0.04, + "learning_rate": 4.99764399185792e-06, + "loss": 1.0878, + "step": 1441 + }, + { + "epoch": 0.04, + "learning_rate": 4.997633392832582e-06, + "loss": 1.2119, + "step": 1442 + }, + { + "epoch": 0.04, + "learning_rate": 4.997622770030976e-06, + "loss": 1.2625, + "step": 1443 + }, + { + "epoch": 0.04, + "learning_rate": 4.9976121234532035e-06, + "loss": 1.2322, + "step": 1444 + }, + { + "epoch": 0.04, + "learning_rate": 4.9976014530993674e-06, + "loss": 1.2446, + "step": 1445 + }, + { + "epoch": 0.04, + "learning_rate": 4.997590758969569e-06, + "loss": 1.1074, + "step": 1446 + }, + { + "epoch": 0.04, + "learning_rate": 4.997580041063909e-06, + "loss": 1.0842, + "step": 1447 + }, + { + "epoch": 0.04, + "learning_rate": 4.9975692993824895e-06, + "loss": 1.1553, + "step": 1448 + }, + { + "epoch": 0.04, + "learning_rate": 4.997558533925413e-06, + "loss": 1.2311, + "step": 1449 + }, + { + "epoch": 0.04, + "learning_rate": 4.997547744692782e-06, + "loss": 1.1765, + "step": 1450 + }, + { + "epoch": 0.04, + "learning_rate": 4.9975369316847e-06, + "loss": 1.261, + "step": 1451 + }, + { + "epoch": 0.04, + "learning_rate": 4.9975260949012685e-06, + "loss": 1.0226, + "step": 1452 + }, + { + "epoch": 0.04, + "learning_rate": 4.997515234342593e-06, + "loss": 1.1461, + "step": 1453 + }, + { + "epoch": 0.04, + "learning_rate": 4.9975043500087735e-06, + "loss": 1.1948, + "step": 1454 + }, + { + "epoch": 0.04, + "learning_rate": 4.997493441899917e-06, + "loss": 1.2085, + "step": 1455 + }, + { + "epoch": 0.04, + "learning_rate": 4.9974825100161236e-06, + "loss": 1.0927, + "step": 1456 + }, + { + "epoch": 0.04, + "learning_rate": 4.997471554357501e-06, + "loss": 1.1628, + "step": 1457 + }, + { + "epoch": 0.04, + "learning_rate": 4.997460574924152e-06, + "loss": 1.1052, + "step": 1458 + }, + { + "epoch": 0.04, + "learning_rate": 4.997449571716181e-06, + "loss": 1.046, + "step": 1459 + }, + { + "epoch": 0.04, + "learning_rate": 4.997438544733693e-06, + "loss": 1.092, + "step": 1460 + }, + { + "epoch": 0.04, + "learning_rate": 4.997427493976793e-06, + "loss": 1.2162, + "step": 1461 + }, + { + "epoch": 0.04, + "learning_rate": 4.997416419445585e-06, + "loss": 1.1691, + "step": 1462 + }, + { + "epoch": 0.04, + "learning_rate": 4.997405321140177e-06, + "loss": 1.29, + "step": 1463 + }, + { + "epoch": 0.04, + "learning_rate": 4.9973941990606726e-06, + "loss": 1.1586, + "step": 1464 + }, + { + "epoch": 0.04, + "learning_rate": 4.9973830532071775e-06, + "loss": 1.1602, + "step": 1465 + }, + { + "epoch": 0.04, + "learning_rate": 4.997371883579799e-06, + "loss": 1.2015, + "step": 1466 + }, + { + "epoch": 0.04, + "learning_rate": 4.997360690178643e-06, + "loss": 1.1411, + "step": 1467 + }, + { + "epoch": 0.04, + "learning_rate": 4.9973494730038165e-06, + "loss": 1.2632, + "step": 1468 + }, + { + "epoch": 0.04, + "learning_rate": 4.997338232055425e-06, + "loss": 1.2042, + "step": 1469 + }, + { + "epoch": 0.04, + "learning_rate": 4.9973269673335765e-06, + "loss": 1.2416, + "step": 1470 + }, + { + "epoch": 0.04, + "learning_rate": 4.997315678838378e-06, + "loss": 1.2423, + "step": 1471 + }, + { + "epoch": 0.04, + "learning_rate": 4.9973043665699375e-06, + "loss": 1.2742, + "step": 1472 + }, + { + "epoch": 0.04, + "learning_rate": 4.997293030528362e-06, + "loss": 1.1768, + "step": 1473 + }, + { + "epoch": 0.04, + "learning_rate": 4.997281670713759e-06, + "loss": 1.2313, + "step": 1474 + }, + { + "epoch": 0.04, + "learning_rate": 4.997270287126238e-06, + "loss": 1.3273, + "step": 1475 + }, + { + "epoch": 0.04, + "learning_rate": 4.997258879765906e-06, + "loss": 1.0893, + "step": 1476 + }, + { + "epoch": 0.04, + "learning_rate": 4.997247448632873e-06, + "loss": 1.1846, + "step": 1477 + }, + { + "epoch": 0.04, + "learning_rate": 4.997235993727245e-06, + "loss": 1.1807, + "step": 1478 + }, + { + "epoch": 0.04, + "learning_rate": 4.997224515049135e-06, + "loss": 1.1299, + "step": 1479 + }, + { + "epoch": 0.04, + "learning_rate": 4.997213012598649e-06, + "loss": 1.1835, + "step": 1480 + }, + { + "epoch": 0.04, + "learning_rate": 4.997201486375899e-06, + "loss": 1.2907, + "step": 1481 + }, + { + "epoch": 0.04, + "learning_rate": 4.997189936380993e-06, + "loss": 1.1105, + "step": 1482 + }, + { + "epoch": 0.04, + "learning_rate": 4.9971783626140416e-06, + "loss": 1.2328, + "step": 1483 + }, + { + "epoch": 0.04, + "learning_rate": 4.997166765075155e-06, + "loss": 1.1407, + "step": 1484 + }, + { + "epoch": 0.04, + "learning_rate": 4.997155143764444e-06, + "loss": 1.0615, + "step": 1485 + }, + { + "epoch": 0.04, + "learning_rate": 4.997143498682017e-06, + "loss": 1.2443, + "step": 1486 + }, + { + "epoch": 0.04, + "learning_rate": 4.997131829827988e-06, + "loss": 1.2174, + "step": 1487 + }, + { + "epoch": 0.04, + "learning_rate": 4.997120137202466e-06, + "loss": 1.1293, + "step": 1488 + }, + { + "epoch": 0.04, + "learning_rate": 4.9971084208055635e-06, + "loss": 1.2218, + "step": 1489 + }, + { + "epoch": 0.04, + "learning_rate": 4.997096680637391e-06, + "loss": 1.1495, + "step": 1490 + }, + { + "epoch": 0.04, + "learning_rate": 4.997084916698061e-06, + "loss": 1.1042, + "step": 1491 + }, + { + "epoch": 0.04, + "learning_rate": 4.997073128987685e-06, + "loss": 1.2842, + "step": 1492 + }, + { + "epoch": 0.04, + "learning_rate": 4.997061317506376e-06, + "loss": 1.1063, + "step": 1493 + }, + { + "epoch": 0.05, + "learning_rate": 4.997049482254246e-06, + "loss": 1.1703, + "step": 1494 + }, + { + "epoch": 0.05, + "learning_rate": 4.997037623231406e-06, + "loss": 1.0982, + "step": 1495 + }, + { + "epoch": 0.05, + "learning_rate": 4.9970257404379715e-06, + "loss": 1.2062, + "step": 1496 + }, + { + "epoch": 0.05, + "learning_rate": 4.9970138338740544e-06, + "loss": 1.1735, + "step": 1497 + }, + { + "epoch": 0.05, + "learning_rate": 4.997001903539769e-06, + "loss": 1.1236, + "step": 1498 + }, + { + "epoch": 0.05, + "learning_rate": 4.996989949435227e-06, + "loss": 1.2139, + "step": 1499 + }, + { + "epoch": 0.05, + "learning_rate": 4.996977971560544e-06, + "loss": 1.0888, + "step": 1500 + }, + { + "epoch": 0.05, + "learning_rate": 4.996965969915833e-06, + "loss": 1.1982, + "step": 1501 + }, + { + "epoch": 0.05, + "learning_rate": 4.9969539445012084e-06, + "loss": 1.2223, + "step": 1502 + }, + { + "epoch": 0.05, + "learning_rate": 4.996941895316785e-06, + "loss": 1.0839, + "step": 1503 + }, + { + "epoch": 0.05, + "learning_rate": 4.996929822362677e-06, + "loss": 1.1498, + "step": 1504 + }, + { + "epoch": 0.05, + "learning_rate": 4.996917725639e-06, + "loss": 1.1985, + "step": 1505 + }, + { + "epoch": 0.05, + "learning_rate": 4.996905605145869e-06, + "loss": 1.1567, + "step": 1506 + }, + { + "epoch": 0.05, + "learning_rate": 4.9968934608833986e-06, + "loss": 1.1472, + "step": 1507 + }, + { + "epoch": 0.05, + "learning_rate": 4.996881292851705e-06, + "loss": 1.1729, + "step": 1508 + }, + { + "epoch": 0.05, + "learning_rate": 4.996869101050905e-06, + "loss": 1.1501, + "step": 1509 + }, + { + "epoch": 0.05, + "learning_rate": 4.996856885481113e-06, + "loss": 1.0624, + "step": 1510 + }, + { + "epoch": 0.05, + "learning_rate": 4.996844646142446e-06, + "loss": 1.1618, + "step": 1511 + }, + { + "epoch": 0.05, + "learning_rate": 4.99683238303502e-06, + "loss": 1.2357, + "step": 1512 + }, + { + "epoch": 0.05, + "learning_rate": 4.996820096158953e-06, + "loss": 1.1534, + "step": 1513 + }, + { + "epoch": 0.05, + "learning_rate": 4.996807785514361e-06, + "loss": 1.2262, + "step": 1514 + }, + { + "epoch": 0.05, + "learning_rate": 4.996795451101361e-06, + "loss": 1.191, + "step": 1515 + }, + { + "epoch": 0.05, + "learning_rate": 4.996783092920071e-06, + "loss": 1.2784, + "step": 1516 + }, + { + "epoch": 0.05, + "learning_rate": 4.996770710970609e-06, + "loss": 1.18, + "step": 1517 + }, + { + "epoch": 0.05, + "learning_rate": 4.996758305253092e-06, + "loss": 1.1997, + "step": 1518 + }, + { + "epoch": 0.05, + "learning_rate": 4.996745875767638e-06, + "loss": 1.1383, + "step": 1519 + }, + { + "epoch": 0.05, + "learning_rate": 4.996733422514366e-06, + "loss": 1.2999, + "step": 1520 + }, + { + "epoch": 0.05, + "learning_rate": 4.996720945493394e-06, + "loss": 1.1683, + "step": 1521 + }, + { + "epoch": 0.05, + "learning_rate": 4.996708444704842e-06, + "loss": 1.1771, + "step": 1522 + }, + { + "epoch": 0.05, + "learning_rate": 4.9966959201488275e-06, + "loss": 1.2676, + "step": 1523 + }, + { + "epoch": 0.05, + "learning_rate": 4.99668337182547e-06, + "loss": 1.1324, + "step": 1524 + }, + { + "epoch": 0.05, + "learning_rate": 4.99667079973489e-06, + "loss": 1.2147, + "step": 1525 + }, + { + "epoch": 0.05, + "learning_rate": 4.996658203877205e-06, + "loss": 1.2349, + "step": 1526 + }, + { + "epoch": 0.05, + "learning_rate": 4.996645584252538e-06, + "loss": 1.224, + "step": 1527 + }, + { + "epoch": 0.05, + "learning_rate": 4.996632940861006e-06, + "loss": 1.2042, + "step": 1528 + }, + { + "epoch": 0.05, + "learning_rate": 4.9966202737027315e-06, + "loss": 1.3643, + "step": 1529 + }, + { + "epoch": 0.05, + "learning_rate": 4.996607582777835e-06, + "loss": 1.2596, + "step": 1530 + }, + { + "epoch": 0.05, + "learning_rate": 4.996594868086436e-06, + "loss": 1.2344, + "step": 1531 + }, + { + "epoch": 0.05, + "learning_rate": 4.996582129628656e-06, + "loss": 1.2437, + "step": 1532 + }, + { + "epoch": 0.05, + "learning_rate": 4.996569367404617e-06, + "loss": 1.1772, + "step": 1533 + }, + { + "epoch": 0.05, + "learning_rate": 4.99655658141444e-06, + "loss": 1.1131, + "step": 1534 + }, + { + "epoch": 0.05, + "learning_rate": 4.996543771658246e-06, + "loss": 1.1116, + "step": 1535 + }, + { + "epoch": 0.05, + "learning_rate": 4.996530938136159e-06, + "loss": 1.0788, + "step": 1536 + }, + { + "epoch": 0.05, + "learning_rate": 4.996518080848299e-06, + "loss": 1.2013, + "step": 1537 + }, + { + "epoch": 0.05, + "learning_rate": 4.996505199794789e-06, + "loss": 1.0881, + "step": 1538 + }, + { + "epoch": 0.05, + "learning_rate": 4.996492294975753e-06, + "loss": 1.1772, + "step": 1539 + }, + { + "epoch": 0.05, + "learning_rate": 4.996479366391312e-06, + "loss": 1.15, + "step": 1540 + }, + { + "epoch": 0.05, + "learning_rate": 4.99646641404159e-06, + "loss": 1.1144, + "step": 1541 + }, + { + "epoch": 0.05, + "learning_rate": 4.996453437926709e-06, + "loss": 1.1946, + "step": 1542 + }, + { + "epoch": 0.05, + "learning_rate": 4.996440438046795e-06, + "loss": 1.1885, + "step": 1543 + }, + { + "epoch": 0.05, + "learning_rate": 4.9964274144019695e-06, + "loss": 1.3342, + "step": 1544 + }, + { + "epoch": 0.05, + "learning_rate": 4.9964143669923575e-06, + "loss": 1.1249, + "step": 1545 + }, + { + "epoch": 0.05, + "learning_rate": 4.996401295818083e-06, + "loss": 1.1367, + "step": 1546 + }, + { + "epoch": 0.05, + "learning_rate": 4.996388200879271e-06, + "loss": 1.2043, + "step": 1547 + }, + { + "epoch": 0.05, + "learning_rate": 4.996375082176045e-06, + "loss": 1.2315, + "step": 1548 + }, + { + "epoch": 0.05, + "learning_rate": 4.996361939708531e-06, + "loss": 1.2769, + "step": 1549 + }, + { + "epoch": 0.05, + "learning_rate": 4.996348773476854e-06, + "loss": 1.1766, + "step": 1550 + }, + { + "epoch": 0.05, + "learning_rate": 4.9963355834811375e-06, + "loss": 1.1169, + "step": 1551 + }, + { + "epoch": 0.05, + "learning_rate": 4.996322369721509e-06, + "loss": 1.174, + "step": 1552 + }, + { + "epoch": 0.05, + "learning_rate": 4.996309132198095e-06, + "loss": 1.1461, + "step": 1553 + }, + { + "epoch": 0.05, + "learning_rate": 4.996295870911019e-06, + "loss": 1.354, + "step": 1554 + }, + { + "epoch": 0.05, + "learning_rate": 4.996282585860409e-06, + "loss": 1.1774, + "step": 1555 + }, + { + "epoch": 0.05, + "learning_rate": 4.996269277046391e-06, + "loss": 1.1967, + "step": 1556 + }, + { + "epoch": 0.05, + "learning_rate": 4.996255944469092e-06, + "loss": 1.2192, + "step": 1557 + }, + { + "epoch": 0.05, + "learning_rate": 4.9962425881286385e-06, + "loss": 1.1819, + "step": 1558 + }, + { + "epoch": 0.05, + "learning_rate": 4.9962292080251575e-06, + "loss": 1.1674, + "step": 1559 + }, + { + "epoch": 0.05, + "learning_rate": 4.996215804158777e-06, + "loss": 1.1873, + "step": 1560 + }, + { + "epoch": 0.05, + "learning_rate": 4.996202376529625e-06, + "loss": 1.3192, + "step": 1561 + }, + { + "epoch": 0.05, + "learning_rate": 4.996188925137827e-06, + "loss": 1.1459, + "step": 1562 + }, + { + "epoch": 0.05, + "learning_rate": 4.9961754499835136e-06, + "loss": 1.1735, + "step": 1563 + }, + { + "epoch": 0.05, + "learning_rate": 4.9961619510668125e-06, + "loss": 1.166, + "step": 1564 + }, + { + "epoch": 0.05, + "learning_rate": 4.996148428387851e-06, + "loss": 1.0241, + "step": 1565 + }, + { + "epoch": 0.05, + "learning_rate": 4.996134881946759e-06, + "loss": 1.2385, + "step": 1566 + }, + { + "epoch": 0.05, + "learning_rate": 4.996121311743665e-06, + "loss": 1.2433, + "step": 1567 + }, + { + "epoch": 0.05, + "learning_rate": 4.996107717778698e-06, + "loss": 1.1202, + "step": 1568 + }, + { + "epoch": 0.05, + "learning_rate": 4.996094100051988e-06, + "loss": 1.1934, + "step": 1569 + }, + { + "epoch": 0.05, + "learning_rate": 4.996080458563664e-06, + "loss": 1.1459, + "step": 1570 + }, + { + "epoch": 0.05, + "learning_rate": 4.9960667933138575e-06, + "loss": 1.0416, + "step": 1571 + }, + { + "epoch": 0.05, + "learning_rate": 4.996053104302696e-06, + "loss": 1.1928, + "step": 1572 + }, + { + "epoch": 0.05, + "learning_rate": 4.996039391530312e-06, + "loss": 1.1469, + "step": 1573 + }, + { + "epoch": 0.05, + "learning_rate": 4.9960256549968335e-06, + "loss": 1.1815, + "step": 1574 + }, + { + "epoch": 0.05, + "learning_rate": 4.996011894702394e-06, + "loss": 1.2447, + "step": 1575 + }, + { + "epoch": 0.05, + "learning_rate": 4.995998110647123e-06, + "loss": 1.1324, + "step": 1576 + }, + { + "epoch": 0.05, + "learning_rate": 4.995984302831153e-06, + "loss": 1.1459, + "step": 1577 + }, + { + "epoch": 0.05, + "learning_rate": 4.995970471254613e-06, + "loss": 1.1298, + "step": 1578 + }, + { + "epoch": 0.05, + "learning_rate": 4.995956615917637e-06, + "loss": 1.2235, + "step": 1579 + }, + { + "epoch": 0.05, + "learning_rate": 4.995942736820357e-06, + "loss": 1.1102, + "step": 1580 + }, + { + "epoch": 0.05, + "learning_rate": 4.9959288339629034e-06, + "loss": 1.1386, + "step": 1581 + }, + { + "epoch": 0.05, + "learning_rate": 4.99591490734541e-06, + "loss": 1.0818, + "step": 1582 + }, + { + "epoch": 0.05, + "learning_rate": 4.9959009569680074e-06, + "loss": 1.1465, + "step": 1583 + }, + { + "epoch": 0.05, + "learning_rate": 4.995886982830831e-06, + "loss": 1.1124, + "step": 1584 + }, + { + "epoch": 0.05, + "learning_rate": 4.995872984934012e-06, + "loss": 1.271, + "step": 1585 + }, + { + "epoch": 0.05, + "learning_rate": 4.995858963277685e-06, + "loss": 1.1163, + "step": 1586 + }, + { + "epoch": 0.05, + "learning_rate": 4.995844917861981e-06, + "loss": 1.1763, + "step": 1587 + }, + { + "epoch": 0.05, + "learning_rate": 4.9958308486870375e-06, + "loss": 1.2415, + "step": 1588 + }, + { + "epoch": 0.05, + "learning_rate": 4.995816755752985e-06, + "loss": 1.181, + "step": 1589 + }, + { + "epoch": 0.05, + "learning_rate": 4.995802639059959e-06, + "loss": 1.1247, + "step": 1590 + }, + { + "epoch": 0.05, + "learning_rate": 4.995788498608094e-06, + "loss": 1.1912, + "step": 1591 + }, + { + "epoch": 0.05, + "learning_rate": 4.995774334397525e-06, + "loss": 1.1967, + "step": 1592 + }, + { + "epoch": 0.05, + "learning_rate": 4.995760146428387e-06, + "loss": 1.1281, + "step": 1593 + }, + { + "epoch": 0.05, + "learning_rate": 4.995745934700813e-06, + "loss": 1.1555, + "step": 1594 + }, + { + "epoch": 0.05, + "learning_rate": 4.995731699214941e-06, + "loss": 1.1896, + "step": 1595 + }, + { + "epoch": 0.05, + "learning_rate": 4.9957174399709045e-06, + "loss": 1.192, + "step": 1596 + }, + { + "epoch": 0.05, + "learning_rate": 4.995703156968839e-06, + "loss": 1.051, + "step": 1597 + }, + { + "epoch": 0.05, + "learning_rate": 4.995688850208882e-06, + "loss": 1.2188, + "step": 1598 + }, + { + "epoch": 0.05, + "learning_rate": 4.99567451969117e-06, + "loss": 1.1842, + "step": 1599 + }, + { + "epoch": 0.05, + "learning_rate": 4.995660165415838e-06, + "loss": 1.1573, + "step": 1600 + }, + { + "epoch": 0.05, + "learning_rate": 4.9956457873830235e-06, + "loss": 1.239, + "step": 1601 + }, + { + "epoch": 0.05, + "learning_rate": 4.995631385592862e-06, + "loss": 1.1345, + "step": 1602 + }, + { + "epoch": 0.05, + "learning_rate": 4.995616960045493e-06, + "loss": 1.0983, + "step": 1603 + }, + { + "epoch": 0.05, + "learning_rate": 4.995602510741051e-06, + "loss": 1.2007, + "step": 1604 + }, + { + "epoch": 0.05, + "learning_rate": 4.995588037679676e-06, + "loss": 1.1747, + "step": 1605 + }, + { + "epoch": 0.05, + "learning_rate": 4.995573540861505e-06, + "loss": 1.1755, + "step": 1606 + }, + { + "epoch": 0.05, + "learning_rate": 4.995559020286676e-06, + "loss": 1.1733, + "step": 1607 + }, + { + "epoch": 0.05, + "learning_rate": 4.995544475955326e-06, + "loss": 1.1702, + "step": 1608 + }, + { + "epoch": 0.05, + "learning_rate": 4.995529907867595e-06, + "loss": 1.2209, + "step": 1609 + }, + { + "epoch": 0.05, + "learning_rate": 4.99551531602362e-06, + "loss": 1.278, + "step": 1610 + }, + { + "epoch": 0.05, + "learning_rate": 4.995500700423543e-06, + "loss": 1.1365, + "step": 1611 + }, + { + "epoch": 0.05, + "learning_rate": 4.9954860610675e-06, + "loss": 1.1733, + "step": 1612 + }, + { + "epoch": 0.05, + "learning_rate": 4.995471397955632e-06, + "loss": 1.0359, + "step": 1613 + }, + { + "epoch": 0.05, + "learning_rate": 4.995456711088078e-06, + "loss": 1.116, + "step": 1614 + }, + { + "epoch": 0.05, + "learning_rate": 4.995442000464978e-06, + "loss": 1.1791, + "step": 1615 + }, + { + "epoch": 0.05, + "learning_rate": 4.995427266086472e-06, + "loss": 1.1511, + "step": 1616 + }, + { + "epoch": 0.05, + "learning_rate": 4.9954125079527005e-06, + "loss": 1.2079, + "step": 1617 + }, + { + "epoch": 0.05, + "learning_rate": 4.995397726063804e-06, + "loss": 1.2311, + "step": 1618 + }, + { + "epoch": 0.05, + "learning_rate": 4.995382920419922e-06, + "loss": 1.3351, + "step": 1619 + }, + { + "epoch": 0.05, + "learning_rate": 4.995368091021198e-06, + "loss": 1.1236, + "step": 1620 + }, + { + "epoch": 0.05, + "learning_rate": 4.99535323786777e-06, + "loss": 1.0858, + "step": 1621 + }, + { + "epoch": 0.05, + "learning_rate": 4.995338360959782e-06, + "loss": 1.1331, + "step": 1622 + }, + { + "epoch": 0.05, + "learning_rate": 4.995323460297373e-06, + "loss": 1.2081, + "step": 1623 + }, + { + "epoch": 0.05, + "learning_rate": 4.995308535880688e-06, + "loss": 1.2941, + "step": 1624 + }, + { + "epoch": 0.05, + "learning_rate": 4.995293587709868e-06, + "loss": 1.1794, + "step": 1625 + }, + { + "epoch": 0.05, + "learning_rate": 4.995278615785053e-06, + "loss": 1.1582, + "step": 1626 + }, + { + "epoch": 0.05, + "learning_rate": 4.995263620106389e-06, + "loss": 1.1793, + "step": 1627 + }, + { + "epoch": 0.05, + "learning_rate": 4.995248600674016e-06, + "loss": 1.1071, + "step": 1628 + }, + { + "epoch": 0.05, + "learning_rate": 4.995233557488079e-06, + "loss": 1.2351, + "step": 1629 + }, + { + "epoch": 0.05, + "learning_rate": 4.995218490548719e-06, + "loss": 1.1041, + "step": 1630 + }, + { + "epoch": 0.05, + "learning_rate": 4.995203399856081e-06, + "loss": 1.2623, + "step": 1631 + }, + { + "epoch": 0.05, + "learning_rate": 4.995188285410309e-06, + "loss": 1.1351, + "step": 1632 + }, + { + "epoch": 0.05, + "learning_rate": 4.995173147211546e-06, + "loss": 1.1996, + "step": 1633 + }, + { + "epoch": 0.05, + "learning_rate": 4.995157985259936e-06, + "loss": 1.137, + "step": 1634 + }, + { + "epoch": 0.05, + "learning_rate": 4.9951427995556246e-06, + "loss": 1.1227, + "step": 1635 + }, + { + "epoch": 0.05, + "learning_rate": 4.995127590098755e-06, + "loss": 1.1649, + "step": 1636 + }, + { + "epoch": 0.05, + "learning_rate": 4.995112356889472e-06, + "loss": 1.1418, + "step": 1637 + }, + { + "epoch": 0.05, + "learning_rate": 4.995097099927922e-06, + "loss": 1.227, + "step": 1638 + }, + { + "epoch": 0.05, + "learning_rate": 4.995081819214248e-06, + "loss": 1.1496, + "step": 1639 + }, + { + "epoch": 0.05, + "learning_rate": 4.995066514748598e-06, + "loss": 1.0347, + "step": 1640 + }, + { + "epoch": 0.05, + "learning_rate": 4.9950511865311155e-06, + "loss": 1.2484, + "step": 1641 + }, + { + "epoch": 0.05, + "learning_rate": 4.995035834561948e-06, + "loss": 1.1472, + "step": 1642 + }, + { + "epoch": 0.05, + "learning_rate": 4.995020458841241e-06, + "loss": 1.2468, + "step": 1643 + }, + { + "epoch": 0.05, + "learning_rate": 4.99500505936914e-06, + "loss": 1.1393, + "step": 1644 + }, + { + "epoch": 0.05, + "learning_rate": 4.9949896361457936e-06, + "loss": 1.0506, + "step": 1645 + }, + { + "epoch": 0.05, + "learning_rate": 4.994974189171346e-06, + "loss": 1.1703, + "step": 1646 + }, + { + "epoch": 0.05, + "learning_rate": 4.9949587184459484e-06, + "loss": 1.2708, + "step": 1647 + }, + { + "epoch": 0.05, + "learning_rate": 4.9949432239697435e-06, + "loss": 1.1866, + "step": 1648 + }, + { + "epoch": 0.05, + "learning_rate": 4.99492770574288e-06, + "loss": 1.3478, + "step": 1649 + }, + { + "epoch": 0.05, + "learning_rate": 4.994912163765508e-06, + "loss": 1.2264, + "step": 1650 + }, + { + "epoch": 0.05, + "learning_rate": 4.9948965980377726e-06, + "loss": 1.2232, + "step": 1651 + }, + { + "epoch": 0.05, + "learning_rate": 4.994881008559824e-06, + "loss": 1.067, + "step": 1652 + }, + { + "epoch": 0.05, + "learning_rate": 4.994865395331809e-06, + "loss": 1.0826, + "step": 1653 + }, + { + "epoch": 0.05, + "learning_rate": 4.994849758353878e-06, + "loss": 1.1506, + "step": 1654 + }, + { + "epoch": 0.05, + "learning_rate": 4.994834097626178e-06, + "loss": 1.2198, + "step": 1655 + }, + { + "epoch": 0.05, + "learning_rate": 4.99481841314886e-06, + "loss": 1.2283, + "step": 1656 + }, + { + "epoch": 0.05, + "learning_rate": 4.994802704922071e-06, + "loss": 1.1685, + "step": 1657 + }, + { + "epoch": 0.05, + "learning_rate": 4.994786972945963e-06, + "loss": 1.2269, + "step": 1658 + }, + { + "epoch": 0.05, + "learning_rate": 4.994771217220683e-06, + "loss": 1.0861, + "step": 1659 + }, + { + "epoch": 0.05, + "learning_rate": 4.9947554377463835e-06, + "loss": 1.1929, + "step": 1660 + }, + { + "epoch": 0.05, + "learning_rate": 4.994739634523213e-06, + "loss": 1.1861, + "step": 1661 + }, + { + "epoch": 0.05, + "learning_rate": 4.994723807551324e-06, + "loss": 1.1339, + "step": 1662 + }, + { + "epoch": 0.05, + "learning_rate": 4.994707956830865e-06, + "loss": 1.1885, + "step": 1663 + }, + { + "epoch": 0.05, + "learning_rate": 4.9946920823619885e-06, + "loss": 1.1979, + "step": 1664 + }, + { + "epoch": 0.05, + "learning_rate": 4.994676184144844e-06, + "loss": 1.1755, + "step": 1665 + }, + { + "epoch": 0.05, + "learning_rate": 4.9946602621795835e-06, + "loss": 1.1328, + "step": 1666 + }, + { + "epoch": 0.05, + "learning_rate": 4.994644316466359e-06, + "loss": 1.1513, + "step": 1667 + }, + { + "epoch": 0.05, + "learning_rate": 4.994628347005323e-06, + "loss": 1.1221, + "step": 1668 + }, + { + "epoch": 0.05, + "learning_rate": 4.994612353796626e-06, + "loss": 1.2172, + "step": 1669 + }, + { + "epoch": 0.05, + "learning_rate": 4.994596336840421e-06, + "loss": 1.1649, + "step": 1670 + }, + { + "epoch": 0.05, + "learning_rate": 4.9945802961368594e-06, + "loss": 1.2111, + "step": 1671 + }, + { + "epoch": 0.05, + "learning_rate": 4.994564231686096e-06, + "loss": 1.2229, + "step": 1672 + }, + { + "epoch": 0.05, + "learning_rate": 4.9945481434882815e-06, + "loss": 1.1837, + "step": 1673 + }, + { + "epoch": 0.05, + "learning_rate": 4.994532031543571e-06, + "loss": 1.2053, + "step": 1674 + }, + { + "epoch": 0.05, + "learning_rate": 4.994515895852117e-06, + "loss": 1.1487, + "step": 1675 + }, + { + "epoch": 0.05, + "learning_rate": 4.994499736414072e-06, + "loss": 1.1232, + "step": 1676 + }, + { + "epoch": 0.05, + "learning_rate": 4.994483553229592e-06, + "loss": 1.191, + "step": 1677 + }, + { + "epoch": 0.05, + "learning_rate": 4.994467346298829e-06, + "loss": 1.072, + "step": 1678 + }, + { + "epoch": 0.05, + "learning_rate": 4.994451115621939e-06, + "loss": 1.1729, + "step": 1679 + }, + { + "epoch": 0.05, + "learning_rate": 4.994434861199076e-06, + "loss": 1.2803, + "step": 1680 + }, + { + "epoch": 0.05, + "learning_rate": 4.994418583030393e-06, + "loss": 1.2723, + "step": 1681 + }, + { + "epoch": 0.05, + "learning_rate": 4.994402281116048e-06, + "loss": 1.1328, + "step": 1682 + }, + { + "epoch": 0.05, + "learning_rate": 4.994385955456193e-06, + "loss": 1.1125, + "step": 1683 + }, + { + "epoch": 0.05, + "learning_rate": 4.994369606050987e-06, + "loss": 1.0543, + "step": 1684 + }, + { + "epoch": 0.05, + "learning_rate": 4.994353232900583e-06, + "loss": 1.2303, + "step": 1685 + }, + { + "epoch": 0.05, + "learning_rate": 4.994336836005137e-06, + "loss": 1.2257, + "step": 1686 + }, + { + "epoch": 0.05, + "learning_rate": 4.994320415364806e-06, + "loss": 1.3856, + "step": 1687 + }, + { + "epoch": 0.05, + "learning_rate": 4.994303970979746e-06, + "loss": 1.15, + "step": 1688 + }, + { + "epoch": 0.05, + "learning_rate": 4.994287502850113e-06, + "loss": 1.0637, + "step": 1689 + }, + { + "epoch": 0.05, + "learning_rate": 4.994271010976065e-06, + "loss": 1.0891, + "step": 1690 + }, + { + "epoch": 0.05, + "learning_rate": 4.9942544953577575e-06, + "loss": 1.1115, + "step": 1691 + }, + { + "epoch": 0.05, + "learning_rate": 4.994237955995349e-06, + "loss": 1.3015, + "step": 1692 + }, + { + "epoch": 0.05, + "learning_rate": 4.994221392888997e-06, + "loss": 1.225, + "step": 1693 + }, + { + "epoch": 0.05, + "learning_rate": 4.994204806038857e-06, + "loss": 1.3075, + "step": 1694 + }, + { + "epoch": 0.05, + "learning_rate": 4.99418819544509e-06, + "loss": 1.1508, + "step": 1695 + }, + { + "epoch": 0.05, + "learning_rate": 4.994171561107852e-06, + "loss": 1.152, + "step": 1696 + }, + { + "epoch": 0.05, + "learning_rate": 4.9941549030273015e-06, + "loss": 1.137, + "step": 1697 + }, + { + "epoch": 0.05, + "learning_rate": 4.9941382212035986e-06, + "loss": 1.2516, + "step": 1698 + }, + { + "epoch": 0.05, + "learning_rate": 4.9941215156369006e-06, + "loss": 1.2577, + "step": 1699 + }, + { + "epoch": 0.05, + "learning_rate": 4.994104786327367e-06, + "loss": 1.2245, + "step": 1700 + }, + { + "epoch": 0.05, + "learning_rate": 4.994088033275156e-06, + "loss": 1.1021, + "step": 1701 + }, + { + "epoch": 0.05, + "learning_rate": 4.9940712564804296e-06, + "loss": 1.1862, + "step": 1702 + }, + { + "epoch": 0.05, + "learning_rate": 4.9940544559433455e-06, + "loss": 1.1258, + "step": 1703 + }, + { + "epoch": 0.05, + "learning_rate": 4.9940376316640634e-06, + "loss": 1.2409, + "step": 1704 + }, + { + "epoch": 0.05, + "learning_rate": 4.994020783642746e-06, + "loss": 1.3036, + "step": 1705 + }, + { + "epoch": 0.05, + "learning_rate": 4.99400391187955e-06, + "loss": 1.2081, + "step": 1706 + }, + { + "epoch": 0.05, + "learning_rate": 4.99398701637464e-06, + "loss": 1.1615, + "step": 1707 + }, + { + "epoch": 0.05, + "learning_rate": 4.993970097128172e-06, + "loss": 1.2204, + "step": 1708 + }, + { + "epoch": 0.05, + "learning_rate": 4.993953154140312e-06, + "loss": 1.2557, + "step": 1709 + }, + { + "epoch": 0.05, + "learning_rate": 4.993936187411218e-06, + "loss": 1.1786, + "step": 1710 + }, + { + "epoch": 0.05, + "learning_rate": 4.993919196941054e-06, + "loss": 1.2738, + "step": 1711 + }, + { + "epoch": 0.05, + "learning_rate": 4.993902182729979e-06, + "loss": 1.1138, + "step": 1712 + }, + { + "epoch": 0.05, + "learning_rate": 4.9938851447781565e-06, + "loss": 1.2151, + "step": 1713 + }, + { + "epoch": 0.05, + "learning_rate": 4.993868083085749e-06, + "loss": 1.1438, + "step": 1714 + }, + { + "epoch": 0.05, + "learning_rate": 4.993850997652918e-06, + "loss": 1.0769, + "step": 1715 + }, + { + "epoch": 0.05, + "learning_rate": 4.993833888479827e-06, + "loss": 1.0342, + "step": 1716 + }, + { + "epoch": 0.05, + "learning_rate": 4.993816755566638e-06, + "loss": 1.1973, + "step": 1717 + }, + { + "epoch": 0.05, + "learning_rate": 4.993799598913515e-06, + "loss": 1.2147, + "step": 1718 + }, + { + "epoch": 0.05, + "learning_rate": 4.993782418520621e-06, + "loss": 1.0717, + "step": 1719 + }, + { + "epoch": 0.05, + "learning_rate": 4.993765214388119e-06, + "loss": 1.1673, + "step": 1720 + }, + { + "epoch": 0.05, + "learning_rate": 4.993747986516173e-06, + "loss": 1.2903, + "step": 1721 + }, + { + "epoch": 0.05, + "learning_rate": 4.993730734904947e-06, + "loss": 1.0559, + "step": 1722 + }, + { + "epoch": 0.05, + "learning_rate": 4.993713459554606e-06, + "loss": 1.1838, + "step": 1723 + }, + { + "epoch": 0.05, + "learning_rate": 4.993696160465313e-06, + "loss": 1.1482, + "step": 1724 + }, + { + "epoch": 0.05, + "learning_rate": 4.993678837637235e-06, + "loss": 1.1609, + "step": 1725 + }, + { + "epoch": 0.05, + "learning_rate": 4.993661491070535e-06, + "loss": 1.1902, + "step": 1726 + }, + { + "epoch": 0.05, + "learning_rate": 4.993644120765379e-06, + "loss": 1.2123, + "step": 1727 + }, + { + "epoch": 0.05, + "learning_rate": 4.993626726721931e-06, + "loss": 1.1949, + "step": 1728 + }, + { + "epoch": 0.05, + "learning_rate": 4.993609308940357e-06, + "loss": 1.223, + "step": 1729 + }, + { + "epoch": 0.05, + "learning_rate": 4.993591867420825e-06, + "loss": 1.1504, + "step": 1730 + }, + { + "epoch": 0.05, + "learning_rate": 4.993574402163498e-06, + "loss": 1.2003, + "step": 1731 + }, + { + "epoch": 0.05, + "learning_rate": 4.993556913168545e-06, + "loss": 1.1251, + "step": 1732 + }, + { + "epoch": 0.05, + "learning_rate": 4.993539400436129e-06, + "loss": 1.2101, + "step": 1733 + }, + { + "epoch": 0.05, + "learning_rate": 4.9935218639664205e-06, + "loss": 1.1796, + "step": 1734 + }, + { + "epoch": 0.05, + "learning_rate": 4.993504303759585e-06, + "loss": 1.1869, + "step": 1735 + }, + { + "epoch": 0.05, + "learning_rate": 4.993486719815789e-06, + "loss": 1.136, + "step": 1736 + }, + { + "epoch": 0.05, + "learning_rate": 4.9934691121351995e-06, + "loss": 1.2129, + "step": 1737 + }, + { + "epoch": 0.05, + "learning_rate": 4.993451480717986e-06, + "loss": 1.0723, + "step": 1738 + }, + { + "epoch": 0.05, + "learning_rate": 4.993433825564315e-06, + "loss": 1.2408, + "step": 1739 + }, + { + "epoch": 0.05, + "learning_rate": 4.9934161466743545e-06, + "loss": 1.1537, + "step": 1740 + }, + { + "epoch": 0.05, + "learning_rate": 4.993398444048274e-06, + "loss": 1.0949, + "step": 1741 + }, + { + "epoch": 0.05, + "learning_rate": 4.99338071768624e-06, + "loss": 1.2535, + "step": 1742 + }, + { + "epoch": 0.05, + "learning_rate": 4.993362967588423e-06, + "loss": 1.1711, + "step": 1743 + }, + { + "epoch": 0.05, + "learning_rate": 4.993345193754992e-06, + "loss": 1.1674, + "step": 1744 + }, + { + "epoch": 0.05, + "learning_rate": 4.993327396186115e-06, + "loss": 1.1352, + "step": 1745 + }, + { + "epoch": 0.05, + "learning_rate": 4.993309574881962e-06, + "loss": 1.1139, + "step": 1746 + }, + { + "epoch": 0.05, + "learning_rate": 4.993291729842703e-06, + "loss": 1.1443, + "step": 1747 + }, + { + "epoch": 0.05, + "learning_rate": 4.993273861068507e-06, + "loss": 1.1875, + "step": 1748 + }, + { + "epoch": 0.05, + "learning_rate": 4.993255968559545e-06, + "loss": 1.3621, + "step": 1749 + }, + { + "epoch": 0.05, + "learning_rate": 4.993238052315987e-06, + "loss": 1.3691, + "step": 1750 + }, + { + "epoch": 0.05, + "learning_rate": 4.9932201123380034e-06, + "loss": 1.1616, + "step": 1751 + }, + { + "epoch": 0.05, + "learning_rate": 4.9932021486257656e-06, + "loss": 1.1288, + "step": 1752 + }, + { + "epoch": 0.05, + "learning_rate": 4.993184161179443e-06, + "loss": 1.1696, + "step": 1753 + }, + { + "epoch": 0.05, + "learning_rate": 4.993166149999209e-06, + "loss": 1.0894, + "step": 1754 + }, + { + "epoch": 0.05, + "learning_rate": 4.993148115085233e-06, + "loss": 1.2091, + "step": 1755 + }, + { + "epoch": 0.05, + "learning_rate": 4.9931300564376885e-06, + "loss": 1.0378, + "step": 1756 + }, + { + "epoch": 0.05, + "learning_rate": 4.993111974056746e-06, + "loss": 1.2112, + "step": 1757 + }, + { + "epoch": 0.05, + "learning_rate": 4.993093867942579e-06, + "loss": 1.2089, + "step": 1758 + }, + { + "epoch": 0.05, + "learning_rate": 4.9930757380953585e-06, + "loss": 1.1425, + "step": 1759 + }, + { + "epoch": 0.05, + "learning_rate": 4.993057584515259e-06, + "loss": 1.2323, + "step": 1760 + }, + { + "epoch": 0.05, + "learning_rate": 4.99303940720245e-06, + "loss": 1.2281, + "step": 1761 + }, + { + "epoch": 0.05, + "learning_rate": 4.993021206157107e-06, + "loss": 1.3446, + "step": 1762 + }, + { + "epoch": 0.05, + "learning_rate": 4.993002981379404e-06, + "loss": 1.0708, + "step": 1763 + }, + { + "epoch": 0.05, + "learning_rate": 4.992984732869512e-06, + "loss": 1.13, + "step": 1764 + }, + { + "epoch": 0.05, + "learning_rate": 4.992966460627606e-06, + "loss": 1.0885, + "step": 1765 + }, + { + "epoch": 0.05, + "learning_rate": 4.992948164653861e-06, + "loss": 1.155, + "step": 1766 + }, + { + "epoch": 0.05, + "learning_rate": 4.992929844948449e-06, + "loss": 1.1599, + "step": 1767 + }, + { + "epoch": 0.05, + "learning_rate": 4.992911501511546e-06, + "loss": 1.0884, + "step": 1768 + }, + { + "epoch": 0.05, + "learning_rate": 4.992893134343327e-06, + "loss": 1.2465, + "step": 1769 + }, + { + "epoch": 0.05, + "learning_rate": 4.992874743443965e-06, + "loss": 1.1279, + "step": 1770 + }, + { + "epoch": 0.05, + "learning_rate": 4.992856328813636e-06, + "loss": 1.0395, + "step": 1771 + }, + { + "epoch": 0.05, + "learning_rate": 4.992837890452515e-06, + "loss": 1.1788, + "step": 1772 + }, + { + "epoch": 0.05, + "learning_rate": 4.992819428360779e-06, + "loss": 1.0602, + "step": 1773 + }, + { + "epoch": 0.05, + "learning_rate": 4.992800942538603e-06, + "loss": 1.2147, + "step": 1774 + }, + { + "epoch": 0.05, + "learning_rate": 4.99278243298616e-06, + "loss": 1.1048, + "step": 1775 + }, + { + "epoch": 0.05, + "learning_rate": 4.9927638997036314e-06, + "loss": 1.2137, + "step": 1776 + }, + { + "epoch": 0.05, + "learning_rate": 4.99274534269119e-06, + "loss": 1.1358, + "step": 1777 + }, + { + "epoch": 0.05, + "learning_rate": 4.992726761949014e-06, + "loss": 1.1248, + "step": 1778 + }, + { + "epoch": 0.05, + "learning_rate": 4.99270815747728e-06, + "loss": 1.3333, + "step": 1779 + }, + { + "epoch": 0.05, + "learning_rate": 4.992689529276163e-06, + "loss": 1.2406, + "step": 1780 + }, + { + "epoch": 0.05, + "learning_rate": 4.992670877345844e-06, + "loss": 1.2061, + "step": 1781 + }, + { + "epoch": 0.05, + "learning_rate": 4.992652201686498e-06, + "loss": 1.2119, + "step": 1782 + }, + { + "epoch": 0.05, + "learning_rate": 4.992633502298304e-06, + "loss": 1.1481, + "step": 1783 + }, + { + "epoch": 0.05, + "learning_rate": 4.992614779181439e-06, + "loss": 1.1063, + "step": 1784 + }, + { + "epoch": 0.05, + "learning_rate": 4.992596032336083e-06, + "loss": 1.0818, + "step": 1785 + }, + { + "epoch": 0.05, + "learning_rate": 4.992577261762412e-06, + "loss": 1.1601, + "step": 1786 + }, + { + "epoch": 0.05, + "learning_rate": 4.992558467460605e-06, + "loss": 1.1558, + "step": 1787 + }, + { + "epoch": 0.05, + "learning_rate": 4.992539649430844e-06, + "loss": 1.2151, + "step": 1788 + }, + { + "epoch": 0.05, + "learning_rate": 4.992520807673305e-06, + "loss": 1.1699, + "step": 1789 + }, + { + "epoch": 0.05, + "learning_rate": 4.992501942188168e-06, + "loss": 1.1133, + "step": 1790 + }, + { + "epoch": 0.05, + "learning_rate": 4.992483052975614e-06, + "loss": 1.1204, + "step": 1791 + }, + { + "epoch": 0.05, + "learning_rate": 4.992464140035821e-06, + "loss": 1.2202, + "step": 1792 + }, + { + "epoch": 0.05, + "learning_rate": 4.99244520336897e-06, + "loss": 1.1898, + "step": 1793 + }, + { + "epoch": 0.05, + "learning_rate": 4.9924262429752415e-06, + "loss": 1.226, + "step": 1794 + }, + { + "epoch": 0.05, + "learning_rate": 4.992407258854814e-06, + "loss": 1.1675, + "step": 1795 + }, + { + "epoch": 0.05, + "learning_rate": 4.992388251007871e-06, + "loss": 1.1712, + "step": 1796 + }, + { + "epoch": 0.05, + "learning_rate": 4.992369219434592e-06, + "loss": 1.1633, + "step": 1797 + }, + { + "epoch": 0.05, + "learning_rate": 4.992350164135159e-06, + "loss": 1.182, + "step": 1798 + }, + { + "epoch": 0.05, + "learning_rate": 4.992331085109751e-06, + "loss": 1.1582, + "step": 1799 + }, + { + "epoch": 0.05, + "learning_rate": 4.992311982358554e-06, + "loss": 1.1177, + "step": 1800 + }, + { + "epoch": 0.05, + "learning_rate": 4.992292855881746e-06, + "loss": 1.0875, + "step": 1801 + }, + { + "epoch": 0.05, + "learning_rate": 4.9922737056795104e-06, + "loss": 1.1392, + "step": 1802 + }, + { + "epoch": 0.05, + "learning_rate": 4.992254531752029e-06, + "loss": 1.2073, + "step": 1803 + }, + { + "epoch": 0.05, + "learning_rate": 4.992235334099485e-06, + "loss": 1.1397, + "step": 1804 + }, + { + "epoch": 0.05, + "learning_rate": 4.992216112722061e-06, + "loss": 1.2868, + "step": 1805 + }, + { + "epoch": 0.05, + "learning_rate": 4.99219686761994e-06, + "loss": 1.0015, + "step": 1806 + }, + { + "epoch": 0.05, + "learning_rate": 4.992177598793305e-06, + "loss": 1.1962, + "step": 1807 + }, + { + "epoch": 0.05, + "learning_rate": 4.99215830624234e-06, + "loss": 1.1972, + "step": 1808 + }, + { + "epoch": 0.05, + "learning_rate": 4.992138989967228e-06, + "loss": 1.157, + "step": 1809 + }, + { + "epoch": 0.05, + "learning_rate": 4.992119649968152e-06, + "loss": 1.0169, + "step": 1810 + }, + { + "epoch": 0.05, + "learning_rate": 4.992100286245299e-06, + "loss": 1.1111, + "step": 1811 + }, + { + "epoch": 0.05, + "learning_rate": 4.99208089879885e-06, + "loss": 1.2236, + "step": 1812 + }, + { + "epoch": 0.05, + "learning_rate": 4.992061487628991e-06, + "loss": 1.0386, + "step": 1813 + }, + { + "epoch": 0.05, + "learning_rate": 4.992042052735908e-06, + "loss": 1.1586, + "step": 1814 + }, + { + "epoch": 0.05, + "learning_rate": 4.992022594119784e-06, + "loss": 1.2238, + "step": 1815 + }, + { + "epoch": 0.05, + "learning_rate": 4.992003111780806e-06, + "loss": 1.0806, + "step": 1816 + }, + { + "epoch": 0.05, + "learning_rate": 4.991983605719158e-06, + "loss": 1.1262, + "step": 1817 + }, + { + "epoch": 0.05, + "learning_rate": 4.991964075935025e-06, + "loss": 1.2547, + "step": 1818 + }, + { + "epoch": 0.05, + "learning_rate": 4.991944522428595e-06, + "loss": 1.24, + "step": 1819 + }, + { + "epoch": 0.05, + "learning_rate": 4.9919249452000545e-06, + "loss": 1.2107, + "step": 1820 + }, + { + "epoch": 0.05, + "learning_rate": 4.991905344249588e-06, + "loss": 1.208, + "step": 1821 + }, + { + "epoch": 0.05, + "learning_rate": 4.9918857195773825e-06, + "loss": 1.1254, + "step": 1822 + }, + { + "epoch": 0.05, + "learning_rate": 4.991866071183626e-06, + "loss": 1.1178, + "step": 1823 + }, + { + "epoch": 0.05, + "learning_rate": 4.991846399068503e-06, + "loss": 1.2797, + "step": 1824 + }, + { + "epoch": 0.05, + "learning_rate": 4.991826703232203e-06, + "loss": 1.1245, + "step": 1825 + }, + { + "epoch": 0.06, + "learning_rate": 4.991806983674914e-06, + "loss": 1.1855, + "step": 1826 + }, + { + "epoch": 0.06, + "learning_rate": 4.991787240396822e-06, + "loss": 1.0915, + "step": 1827 + }, + { + "epoch": 0.06, + "learning_rate": 4.991767473398115e-06, + "loss": 1.0463, + "step": 1828 + }, + { + "epoch": 0.06, + "learning_rate": 4.9917476826789816e-06, + "loss": 1.0316, + "step": 1829 + }, + { + "epoch": 0.06, + "learning_rate": 4.991727868239611e-06, + "loss": 1.184, + "step": 1830 + }, + { + "epoch": 0.06, + "learning_rate": 4.991708030080191e-06, + "loss": 1.1977, + "step": 1831 + }, + { + "epoch": 0.06, + "learning_rate": 4.99168816820091e-06, + "loss": 1.1993, + "step": 1832 + }, + { + "epoch": 0.06, + "learning_rate": 4.991668282601958e-06, + "loss": 1.0783, + "step": 1833 + }, + { + "epoch": 0.06, + "learning_rate": 4.991648373283525e-06, + "loss": 1.192, + "step": 1834 + }, + { + "epoch": 0.06, + "learning_rate": 4.991628440245798e-06, + "loss": 1.2295, + "step": 1835 + }, + { + "epoch": 0.06, + "learning_rate": 4.991608483488969e-06, + "loss": 1.1897, + "step": 1836 + }, + { + "epoch": 0.06, + "learning_rate": 4.991588503013227e-06, + "loss": 1.1386, + "step": 1837 + }, + { + "epoch": 0.06, + "learning_rate": 4.991568498818763e-06, + "loss": 1.142, + "step": 1838 + }, + { + "epoch": 0.06, + "learning_rate": 4.9915484709057665e-06, + "loss": 1.1813, + "step": 1839 + }, + { + "epoch": 0.06, + "learning_rate": 4.991528419274429e-06, + "loss": 1.1105, + "step": 1840 + }, + { + "epoch": 0.06, + "learning_rate": 4.99150834392494e-06, + "loss": 1.2478, + "step": 1841 + }, + { + "epoch": 0.06, + "learning_rate": 4.991488244857492e-06, + "loss": 1.2432, + "step": 1842 + }, + { + "epoch": 0.06, + "learning_rate": 4.991468122072276e-06, + "loss": 1.282, + "step": 1843 + }, + { + "epoch": 0.06, + "learning_rate": 4.9914479755694825e-06, + "loss": 1.217, + "step": 1844 + }, + { + "epoch": 0.06, + "learning_rate": 4.9914278053493055e-06, + "loss": 1.0934, + "step": 1845 + }, + { + "epoch": 0.06, + "learning_rate": 4.991407611411935e-06, + "loss": 1.1908, + "step": 1846 + }, + { + "epoch": 0.06, + "learning_rate": 4.991387393757564e-06, + "loss": 1.1635, + "step": 1847 + }, + { + "epoch": 0.06, + "learning_rate": 4.991367152386385e-06, + "loss": 1.1462, + "step": 1848 + }, + { + "epoch": 0.06, + "learning_rate": 4.9913468872985905e-06, + "loss": 1.1096, + "step": 1849 + }, + { + "epoch": 0.06, + "learning_rate": 4.991326598494373e-06, + "loss": 1.2751, + "step": 1850 + }, + { + "epoch": 0.06, + "learning_rate": 4.991306285973927e-06, + "loss": 1.1738, + "step": 1851 + }, + { + "epoch": 0.06, + "learning_rate": 4.991285949737445e-06, + "loss": 1.0478, + "step": 1852 + }, + { + "epoch": 0.06, + "learning_rate": 4.99126558978512e-06, + "loss": 1.1918, + "step": 1853 + }, + { + "epoch": 0.06, + "learning_rate": 4.991245206117147e-06, + "loss": 1.2594, + "step": 1854 + }, + { + "epoch": 0.06, + "learning_rate": 4.9912247987337195e-06, + "loss": 1.0857, + "step": 1855 + }, + { + "epoch": 0.06, + "learning_rate": 4.991204367635031e-06, + "loss": 1.3604, + "step": 1856 + }, + { + "epoch": 0.06, + "learning_rate": 4.991183912821277e-06, + "loss": 1.2059, + "step": 1857 + }, + { + "epoch": 0.06, + "learning_rate": 4.991163434292652e-06, + "loss": 1.1129, + "step": 1858 + }, + { + "epoch": 0.06, + "learning_rate": 4.991142932049351e-06, + "loss": 1.1208, + "step": 1859 + }, + { + "epoch": 0.06, + "learning_rate": 4.991122406091569e-06, + "loss": 1.1471, + "step": 1860 + }, + { + "epoch": 0.06, + "learning_rate": 4.991101856419502e-06, + "loss": 1.1185, + "step": 1861 + }, + { + "epoch": 0.06, + "learning_rate": 4.991081283033345e-06, + "loss": 1.1464, + "step": 1862 + }, + { + "epoch": 0.06, + "learning_rate": 4.991060685933293e-06, + "loss": 1.0615, + "step": 1863 + }, + { + "epoch": 0.06, + "learning_rate": 4.9910400651195436e-06, + "loss": 1.207, + "step": 1864 + }, + { + "epoch": 0.06, + "learning_rate": 4.991019420592293e-06, + "loss": 1.1184, + "step": 1865 + }, + { + "epoch": 0.06, + "learning_rate": 4.990998752351735e-06, + "loss": 1.1034, + "step": 1866 + }, + { + "epoch": 0.06, + "learning_rate": 4.990978060398071e-06, + "loss": 1.1022, + "step": 1867 + }, + { + "epoch": 0.06, + "learning_rate": 4.9909573447314955e-06, + "loss": 1.2406, + "step": 1868 + }, + { + "epoch": 0.06, + "learning_rate": 4.990936605352204e-06, + "loss": 1.2224, + "step": 1869 + }, + { + "epoch": 0.06, + "learning_rate": 4.990915842260398e-06, + "loss": 1.1685, + "step": 1870 + }, + { + "epoch": 0.06, + "learning_rate": 4.990895055456271e-06, + "loss": 1.0631, + "step": 1871 + }, + { + "epoch": 0.06, + "learning_rate": 4.990874244940023e-06, + "loss": 1.1515, + "step": 1872 + }, + { + "epoch": 0.06, + "learning_rate": 4.9908534107118525e-06, + "loss": 1.2278, + "step": 1873 + }, + { + "epoch": 0.06, + "learning_rate": 4.990832552771957e-06, + "loss": 1.2804, + "step": 1874 + }, + { + "epoch": 0.06, + "learning_rate": 4.990811671120535e-06, + "loss": 1.2511, + "step": 1875 + }, + { + "epoch": 0.06, + "learning_rate": 4.990790765757785e-06, + "loss": 1.1488, + "step": 1876 + }, + { + "epoch": 0.06, + "learning_rate": 4.990769836683907e-06, + "loss": 1.0787, + "step": 1877 + }, + { + "epoch": 0.06, + "learning_rate": 4.9907488838991e-06, + "loss": 1.0507, + "step": 1878 + }, + { + "epoch": 0.06, + "learning_rate": 4.990727907403563e-06, + "loss": 1.2288, + "step": 1879 + }, + { + "epoch": 0.06, + "learning_rate": 4.990706907197497e-06, + "loss": 1.215, + "step": 1880 + }, + { + "epoch": 0.06, + "learning_rate": 4.990685883281099e-06, + "loss": 1.152, + "step": 1881 + }, + { + "epoch": 0.06, + "learning_rate": 4.990664835654572e-06, + "loss": 1.2483, + "step": 1882 + }, + { + "epoch": 0.06, + "learning_rate": 4.990643764318115e-06, + "loss": 1.264, + "step": 1883 + }, + { + "epoch": 0.06, + "learning_rate": 4.990622669271928e-06, + "loss": 1.1669, + "step": 1884 + }, + { + "epoch": 0.06, + "learning_rate": 4.990601550516214e-06, + "loss": 1.2172, + "step": 1885 + }, + { + "epoch": 0.06, + "learning_rate": 4.990580408051173e-06, + "loss": 1.194, + "step": 1886 + }, + { + "epoch": 0.06, + "learning_rate": 4.990559241877005e-06, + "loss": 1.2091, + "step": 1887 + }, + { + "epoch": 0.06, + "learning_rate": 4.990538051993913e-06, + "loss": 1.1351, + "step": 1888 + }, + { + "epoch": 0.06, + "learning_rate": 4.990516838402099e-06, + "loss": 1.1061, + "step": 1889 + }, + { + "epoch": 0.06, + "learning_rate": 4.990495601101762e-06, + "loss": 1.1444, + "step": 1890 + }, + { + "epoch": 0.06, + "learning_rate": 4.990474340093108e-06, + "loss": 1.147, + "step": 1891 + }, + { + "epoch": 0.06, + "learning_rate": 4.990453055376337e-06, + "loss": 1.1416, + "step": 1892 + }, + { + "epoch": 0.06, + "learning_rate": 4.990431746951654e-06, + "loss": 1.3163, + "step": 1893 + }, + { + "epoch": 0.06, + "learning_rate": 4.990410414819258e-06, + "loss": 1.1438, + "step": 1894 + }, + { + "epoch": 0.06, + "learning_rate": 4.990389058979356e-06, + "loss": 1.2422, + "step": 1895 + }, + { + "epoch": 0.06, + "learning_rate": 4.9903676794321484e-06, + "loss": 1.2457, + "step": 1896 + }, + { + "epoch": 0.06, + "learning_rate": 4.99034627617784e-06, + "loss": 1.1146, + "step": 1897 + }, + { + "epoch": 0.06, + "learning_rate": 4.990324849216635e-06, + "loss": 1.1113, + "step": 1898 + }, + { + "epoch": 0.06, + "learning_rate": 4.990303398548736e-06, + "loss": 1.1888, + "step": 1899 + }, + { + "epoch": 0.06, + "learning_rate": 4.990281924174349e-06, + "loss": 1.1556, + "step": 1900 + }, + { + "epoch": 0.06, + "learning_rate": 4.990260426093677e-06, + "loss": 1.1411, + "step": 1901 + }, + { + "epoch": 0.06, + "learning_rate": 4.9902389043069255e-06, + "loss": 1.1866, + "step": 1902 + }, + { + "epoch": 0.06, + "learning_rate": 4.990217358814298e-06, + "loss": 1.1622, + "step": 1903 + }, + { + "epoch": 0.06, + "learning_rate": 4.990195789616001e-06, + "loss": 1.1802, + "step": 1904 + }, + { + "epoch": 0.06, + "learning_rate": 4.99017419671224e-06, + "loss": 1.1766, + "step": 1905 + }, + { + "epoch": 0.06, + "learning_rate": 4.990152580103219e-06, + "loss": 1.1871, + "step": 1906 + }, + { + "epoch": 0.06, + "learning_rate": 4.9901309397891454e-06, + "loss": 1.0873, + "step": 1907 + }, + { + "epoch": 0.06, + "learning_rate": 4.990109275770225e-06, + "loss": 1.1981, + "step": 1908 + }, + { + "epoch": 0.06, + "learning_rate": 4.990087588046662e-06, + "loss": 1.1417, + "step": 1909 + }, + { + "epoch": 0.06, + "learning_rate": 4.990065876618666e-06, + "loss": 1.1264, + "step": 1910 + }, + { + "epoch": 0.06, + "learning_rate": 4.990044141486441e-06, + "loss": 1.3105, + "step": 1911 + }, + { + "epoch": 0.06, + "learning_rate": 4.990022382650196e-06, + "loss": 1.0682, + "step": 1912 + }, + { + "epoch": 0.06, + "learning_rate": 4.9900006001101364e-06, + "loss": 1.1171, + "step": 1913 + }, + { + "epoch": 0.06, + "learning_rate": 4.989978793866472e-06, + "loss": 1.0682, + "step": 1914 + }, + { + "epoch": 0.06, + "learning_rate": 4.989956963919406e-06, + "loss": 1.0899, + "step": 1915 + }, + { + "epoch": 0.06, + "learning_rate": 4.989935110269151e-06, + "loss": 1.2227, + "step": 1916 + }, + { + "epoch": 0.06, + "learning_rate": 4.989913232915912e-06, + "loss": 1.2773, + "step": 1917 + }, + { + "epoch": 0.06, + "learning_rate": 4.989891331859897e-06, + "loss": 1.1799, + "step": 1918 + }, + { + "epoch": 0.06, + "learning_rate": 4.989869407101318e-06, + "loss": 1.1683, + "step": 1919 + }, + { + "epoch": 0.06, + "learning_rate": 4.98984745864038e-06, + "loss": 1.238, + "step": 1920 + }, + { + "epoch": 0.06, + "learning_rate": 4.989825486477294e-06, + "loss": 1.2238, + "step": 1921 + }, + { + "epoch": 0.06, + "learning_rate": 4.989803490612268e-06, + "loss": 1.2483, + "step": 1922 + }, + { + "epoch": 0.06, + "learning_rate": 4.989781471045513e-06, + "loss": 1.1865, + "step": 1923 + }, + { + "epoch": 0.06, + "learning_rate": 4.989759427777237e-06, + "loss": 1.1711, + "step": 1924 + }, + { + "epoch": 0.06, + "learning_rate": 4.989737360807649e-06, + "loss": 1.175, + "step": 1925 + }, + { + "epoch": 0.06, + "learning_rate": 4.989715270136961e-06, + "loss": 1.175, + "step": 1926 + }, + { + "epoch": 0.06, + "learning_rate": 4.989693155765384e-06, + "loss": 1.0892, + "step": 1927 + }, + { + "epoch": 0.06, + "learning_rate": 4.989671017693126e-06, + "loss": 1.0696, + "step": 1928 + }, + { + "epoch": 0.06, + "learning_rate": 4.9896488559204e-06, + "loss": 1.2998, + "step": 1929 + }, + { + "epoch": 0.06, + "learning_rate": 4.989626670447415e-06, + "loss": 1.2631, + "step": 1930 + }, + { + "epoch": 0.06, + "learning_rate": 4.989604461274384e-06, + "loss": 1.3171, + "step": 1931 + }, + { + "epoch": 0.06, + "learning_rate": 4.989582228401517e-06, + "loss": 1.16, + "step": 1932 + }, + { + "epoch": 0.06, + "learning_rate": 4.989559971829026e-06, + "loss": 1.1606, + "step": 1933 + }, + { + "epoch": 0.06, + "learning_rate": 4.989537691557124e-06, + "loss": 1.0742, + "step": 1934 + }, + { + "epoch": 0.06, + "learning_rate": 4.989515387586022e-06, + "loss": 1.1476, + "step": 1935 + }, + { + "epoch": 0.06, + "learning_rate": 4.989493059915931e-06, + "loss": 1.2321, + "step": 1936 + }, + { + "epoch": 0.06, + "learning_rate": 4.989470708547066e-06, + "loss": 1.2372, + "step": 1937 + }, + { + "epoch": 0.06, + "learning_rate": 4.989448333479639e-06, + "loss": 1.1469, + "step": 1938 + }, + { + "epoch": 0.06, + "learning_rate": 4.989425934713863e-06, + "loss": 1.0983, + "step": 1939 + }, + { + "epoch": 0.06, + "learning_rate": 4.989403512249951e-06, + "loss": 1.1199, + "step": 1940 + }, + { + "epoch": 0.06, + "learning_rate": 4.989381066088116e-06, + "loss": 1.1314, + "step": 1941 + }, + { + "epoch": 0.06, + "learning_rate": 4.989358596228572e-06, + "loss": 1.2166, + "step": 1942 + }, + { + "epoch": 0.06, + "learning_rate": 4.989336102671533e-06, + "loss": 1.1805, + "step": 1943 + }, + { + "epoch": 0.06, + "learning_rate": 4.989313585417215e-06, + "loss": 1.2549, + "step": 1944 + }, + { + "epoch": 0.06, + "learning_rate": 4.989291044465829e-06, + "loss": 1.2523, + "step": 1945 + }, + { + "epoch": 0.06, + "learning_rate": 4.989268479817591e-06, + "loss": 1.1691, + "step": 1946 + }, + { + "epoch": 0.06, + "learning_rate": 4.989245891472717e-06, + "loss": 1.1789, + "step": 1947 + }, + { + "epoch": 0.06, + "learning_rate": 4.98922327943142e-06, + "loss": 1.1942, + "step": 1948 + }, + { + "epoch": 0.06, + "learning_rate": 4.989200643693917e-06, + "loss": 1.1624, + "step": 1949 + }, + { + "epoch": 0.06, + "learning_rate": 4.989177984260422e-06, + "loss": 1.1586, + "step": 1950 + }, + { + "epoch": 0.06, + "learning_rate": 4.989155301131152e-06, + "loss": 1.1024, + "step": 1951 + }, + { + "epoch": 0.06, + "learning_rate": 4.9891325943063215e-06, + "loss": 1.2128, + "step": 1952 + }, + { + "epoch": 0.06, + "learning_rate": 4.989109863786148e-06, + "loss": 1.1095, + "step": 1953 + }, + { + "epoch": 0.06, + "learning_rate": 4.9890871095708485e-06, + "loss": 1.0652, + "step": 1954 + }, + { + "epoch": 0.06, + "learning_rate": 4.989064331660637e-06, + "loss": 1.2979, + "step": 1955 + }, + { + "epoch": 0.06, + "learning_rate": 4.989041530055733e-06, + "loss": 1.1725, + "step": 1956 + }, + { + "epoch": 0.06, + "learning_rate": 4.989018704756351e-06, + "loss": 1.0879, + "step": 1957 + }, + { + "epoch": 0.06, + "learning_rate": 4.988995855762711e-06, + "loss": 1.1053, + "step": 1958 + }, + { + "epoch": 0.06, + "learning_rate": 4.9889729830750284e-06, + "loss": 1.1122, + "step": 1959 + }, + { + "epoch": 0.06, + "learning_rate": 4.988950086693521e-06, + "loss": 1.2218, + "step": 1960 + }, + { + "epoch": 0.06, + "learning_rate": 4.988927166618409e-06, + "loss": 1.1768, + "step": 1961 + }, + { + "epoch": 0.06, + "learning_rate": 4.988904222849909e-06, + "loss": 1.3022, + "step": 1962 + }, + { + "epoch": 0.06, + "learning_rate": 4.9888812553882385e-06, + "loss": 1.1634, + "step": 1963 + }, + { + "epoch": 0.06, + "learning_rate": 4.9888582642336185e-06, + "loss": 1.2872, + "step": 1964 + }, + { + "epoch": 0.06, + "learning_rate": 4.9888352493862655e-06, + "loss": 1.0566, + "step": 1965 + }, + { + "epoch": 0.06, + "learning_rate": 4.988812210846399e-06, + "loss": 1.1961, + "step": 1966 + }, + { + "epoch": 0.06, + "learning_rate": 4.98878914861424e-06, + "loss": 1.2167, + "step": 1967 + }, + { + "epoch": 0.06, + "learning_rate": 4.988766062690006e-06, + "loss": 1.2092, + "step": 1968 + }, + { + "epoch": 0.06, + "learning_rate": 4.9887429530739185e-06, + "loss": 1.1915, + "step": 1969 + }, + { + "epoch": 0.06, + "learning_rate": 4.9887198197661966e-06, + "loss": 1.2217, + "step": 1970 + }, + { + "epoch": 0.06, + "learning_rate": 4.9886966627670605e-06, + "loss": 1.1559, + "step": 1971 + }, + { + "epoch": 0.06, + "learning_rate": 4.988673482076731e-06, + "loss": 1.0035, + "step": 1972 + }, + { + "epoch": 0.06, + "learning_rate": 4.988650277695429e-06, + "loss": 1.1774, + "step": 1973 + }, + { + "epoch": 0.06, + "learning_rate": 4.988627049623373e-06, + "loss": 1.1968, + "step": 1974 + }, + { + "epoch": 0.06, + "learning_rate": 4.988603797860788e-06, + "loss": 1.0595, + "step": 1975 + }, + { + "epoch": 0.06, + "learning_rate": 4.988580522407893e-06, + "loss": 1.1901, + "step": 1976 + }, + { + "epoch": 0.06, + "learning_rate": 4.988557223264909e-06, + "loss": 1.1543, + "step": 1977 + }, + { + "epoch": 0.06, + "learning_rate": 4.98853390043206e-06, + "loss": 1.2415, + "step": 1978 + }, + { + "epoch": 0.06, + "learning_rate": 4.988510553909566e-06, + "loss": 1.2595, + "step": 1979 + }, + { + "epoch": 0.06, + "learning_rate": 4.98848718369765e-06, + "loss": 1.178, + "step": 1980 + }, + { + "epoch": 0.06, + "learning_rate": 4.988463789796535e-06, + "loss": 1.2241, + "step": 1981 + }, + { + "epoch": 0.06, + "learning_rate": 4.988440372206443e-06, + "loss": 1.2849, + "step": 1982 + }, + { + "epoch": 0.06, + "learning_rate": 4.988416930927597e-06, + "loss": 1.158, + "step": 1983 + }, + { + "epoch": 0.06, + "learning_rate": 4.988393465960221e-06, + "loss": 1.1897, + "step": 1984 + }, + { + "epoch": 0.06, + "learning_rate": 4.9883699773045365e-06, + "loss": 1.2605, + "step": 1985 + }, + { + "epoch": 0.06, + "learning_rate": 4.988346464960769e-06, + "loss": 1.14, + "step": 1986 + }, + { + "epoch": 0.06, + "learning_rate": 4.988322928929141e-06, + "loss": 1.0616, + "step": 1987 + }, + { + "epoch": 0.06, + "learning_rate": 4.988299369209878e-06, + "loss": 1.113, + "step": 1988 + }, + { + "epoch": 0.06, + "learning_rate": 4.988275785803203e-06, + "loss": 1.1251, + "step": 1989 + }, + { + "epoch": 0.06, + "learning_rate": 4.988252178709341e-06, + "loss": 1.2095, + "step": 1990 + }, + { + "epoch": 0.06, + "learning_rate": 4.988228547928516e-06, + "loss": 1.1732, + "step": 1991 + }, + { + "epoch": 0.06, + "learning_rate": 4.988204893460954e-06, + "loss": 1.2094, + "step": 1992 + }, + { + "epoch": 0.06, + "learning_rate": 4.98818121530688e-06, + "loss": 1.3403, + "step": 1993 + }, + { + "epoch": 0.06, + "learning_rate": 4.98815751346652e-06, + "loss": 1.1157, + "step": 1994 + }, + { + "epoch": 0.06, + "learning_rate": 4.988133787940097e-06, + "loss": 1.0797, + "step": 1995 + }, + { + "epoch": 0.06, + "learning_rate": 4.98811003872784e-06, + "loss": 1.1405, + "step": 1996 + }, + { + "epoch": 0.06, + "learning_rate": 4.988086265829973e-06, + "loss": 1.0806, + "step": 1997 + }, + { + "epoch": 0.06, + "learning_rate": 4.988062469246724e-06, + "loss": 1.1907, + "step": 1998 + }, + { + "epoch": 0.06, + "learning_rate": 4.988038648978317e-06, + "loss": 1.2792, + "step": 1999 + }, + { + "epoch": 0.06, + "learning_rate": 4.988014805024981e-06, + "loss": 1.185, + "step": 2000 + }, + { + "epoch": 0.06, + "learning_rate": 4.987990937386942e-06, + "loss": 1.0763, + "step": 2001 + }, + { + "epoch": 0.06, + "learning_rate": 4.987967046064429e-06, + "loss": 1.0901, + "step": 2002 + }, + { + "epoch": 0.06, + "learning_rate": 4.987943131057668e-06, + "loss": 1.1668, + "step": 2003 + }, + { + "epoch": 0.06, + "learning_rate": 4.987919192366885e-06, + "loss": 1.1404, + "step": 2004 + }, + { + "epoch": 0.06, + "learning_rate": 4.98789522999231e-06, + "loss": 1.1703, + "step": 2005 + }, + { + "epoch": 0.06, + "learning_rate": 4.9878712439341716e-06, + "loss": 1.2279, + "step": 2006 + }, + { + "epoch": 0.06, + "learning_rate": 4.987847234192696e-06, + "loss": 1.2134, + "step": 2007 + }, + { + "epoch": 0.06, + "learning_rate": 4.987823200768113e-06, + "loss": 1.1408, + "step": 2008 + }, + { + "epoch": 0.06, + "learning_rate": 4.987799143660652e-06, + "loss": 1.1118, + "step": 2009 + }, + { + "epoch": 0.06, + "learning_rate": 4.987775062870541e-06, + "loss": 1.1886, + "step": 2010 + }, + { + "epoch": 0.06, + "learning_rate": 4.987750958398009e-06, + "loss": 1.2009, + "step": 2011 + }, + { + "epoch": 0.06, + "learning_rate": 4.987726830243287e-06, + "loss": 1.0886, + "step": 2012 + }, + { + "epoch": 0.06, + "learning_rate": 4.987702678406603e-06, + "loss": 1.1173, + "step": 2013 + }, + { + "epoch": 0.06, + "learning_rate": 4.987678502888188e-06, + "loss": 1.149, + "step": 2014 + }, + { + "epoch": 0.06, + "learning_rate": 4.9876543036882715e-06, + "loss": 1.1453, + "step": 2015 + }, + { + "epoch": 0.06, + "learning_rate": 4.9876300808070845e-06, + "loss": 1.1866, + "step": 2016 + }, + { + "epoch": 0.06, + "learning_rate": 4.987605834244856e-06, + "loss": 1.2305, + "step": 2017 + }, + { + "epoch": 0.06, + "learning_rate": 4.987581564001819e-06, + "loss": 1.2609, + "step": 2018 + }, + { + "epoch": 0.06, + "learning_rate": 4.987557270078204e-06, + "loss": 1.0944, + "step": 2019 + }, + { + "epoch": 0.06, + "learning_rate": 4.987532952474241e-06, + "loss": 1.2349, + "step": 2020 + }, + { + "epoch": 0.06, + "learning_rate": 4.987508611190162e-06, + "loss": 1.1116, + "step": 2021 + }, + { + "epoch": 0.06, + "learning_rate": 4.987484246226201e-06, + "loss": 1.1808, + "step": 2022 + }, + { + "epoch": 0.06, + "learning_rate": 4.987459857582586e-06, + "loss": 1.0766, + "step": 2023 + }, + { + "epoch": 0.06, + "learning_rate": 4.9874354452595525e-06, + "loss": 1.3002, + "step": 2024 + }, + { + "epoch": 0.06, + "learning_rate": 4.987411009257331e-06, + "loss": 1.2611, + "step": 2025 + }, + { + "epoch": 0.06, + "learning_rate": 4.9873865495761545e-06, + "loss": 1.122, + "step": 2026 + }, + { + "epoch": 0.06, + "learning_rate": 4.987362066216256e-06, + "loss": 1.1747, + "step": 2027 + }, + { + "epoch": 0.06, + "learning_rate": 4.9873375591778685e-06, + "loss": 1.1384, + "step": 2028 + }, + { + "epoch": 0.06, + "learning_rate": 4.987313028461226e-06, + "loss": 1.2748, + "step": 2029 + }, + { + "epoch": 0.06, + "learning_rate": 4.987288474066561e-06, + "loss": 1.1407, + "step": 2030 + }, + { + "epoch": 0.06, + "learning_rate": 4.987263895994108e-06, + "loss": 1.0835, + "step": 2031 + }, + { + "epoch": 0.06, + "learning_rate": 4.9872392942440995e-06, + "loss": 1.1104, + "step": 2032 + }, + { + "epoch": 0.06, + "learning_rate": 4.987214668816772e-06, + "loss": 1.1531, + "step": 2033 + }, + { + "epoch": 0.06, + "learning_rate": 4.987190019712358e-06, + "loss": 1.1643, + "step": 2034 + }, + { + "epoch": 0.06, + "learning_rate": 4.987165346931093e-06, + "loss": 1.2318, + "step": 2035 + }, + { + "epoch": 0.06, + "learning_rate": 4.987140650473213e-06, + "loss": 1.1873, + "step": 2036 + }, + { + "epoch": 0.06, + "learning_rate": 4.9871159303389504e-06, + "loss": 1.1844, + "step": 2037 + }, + { + "epoch": 0.06, + "learning_rate": 4.987091186528542e-06, + "loss": 1.2528, + "step": 2038 + }, + { + "epoch": 0.06, + "learning_rate": 4.987066419042223e-06, + "loss": 1.2693, + "step": 2039 + }, + { + "epoch": 0.06, + "learning_rate": 4.987041627880232e-06, + "loss": 1.1809, + "step": 2040 + }, + { + "epoch": 0.06, + "learning_rate": 4.9870168130427995e-06, + "loss": 1.2167, + "step": 2041 + }, + { + "epoch": 0.06, + "learning_rate": 4.986991974530166e-06, + "loss": 1.2649, + "step": 2042 + }, + { + "epoch": 0.06, + "learning_rate": 4.986967112342566e-06, + "loss": 1.2572, + "step": 2043 + }, + { + "epoch": 0.06, + "learning_rate": 4.986942226480238e-06, + "loss": 1.1671, + "step": 2044 + }, + { + "epoch": 0.06, + "learning_rate": 4.986917316943418e-06, + "loss": 1.175, + "step": 2045 + }, + { + "epoch": 0.06, + "learning_rate": 4.986892383732342e-06, + "loss": 1.1857, + "step": 2046 + }, + { + "epoch": 0.06, + "learning_rate": 4.986867426847248e-06, + "loss": 1.1923, + "step": 2047 + }, + { + "epoch": 0.06, + "learning_rate": 4.986842446288374e-06, + "loss": 1.1912, + "step": 2048 + }, + { + "epoch": 0.06, + "learning_rate": 4.986817442055958e-06, + "loss": 1.1512, + "step": 2049 + }, + { + "epoch": 0.06, + "learning_rate": 4.9867924141502374e-06, + "loss": 1.1989, + "step": 2050 + }, + { + "epoch": 0.06, + "learning_rate": 4.986767362571451e-06, + "loss": 1.1809, + "step": 2051 + }, + { + "epoch": 0.06, + "learning_rate": 4.986742287319837e-06, + "loss": 1.1304, + "step": 2052 + }, + { + "epoch": 0.06, + "learning_rate": 4.986717188395633e-06, + "loss": 1.0994, + "step": 2053 + }, + { + "epoch": 0.06, + "learning_rate": 4.98669206579908e-06, + "loss": 1.1455, + "step": 2054 + }, + { + "epoch": 0.06, + "learning_rate": 4.986666919530416e-06, + "loss": 1.2406, + "step": 2055 + }, + { + "epoch": 0.06, + "learning_rate": 4.986641749589881e-06, + "loss": 1.1901, + "step": 2056 + }, + { + "epoch": 0.06, + "learning_rate": 4.986616555977714e-06, + "loss": 1.251, + "step": 2057 + }, + { + "epoch": 0.06, + "learning_rate": 4.986591338694154e-06, + "loss": 1.1047, + "step": 2058 + }, + { + "epoch": 0.06, + "learning_rate": 4.986566097739443e-06, + "loss": 1.1118, + "step": 2059 + }, + { + "epoch": 0.06, + "learning_rate": 4.98654083311382e-06, + "loss": 1.0846, + "step": 2060 + }, + { + "epoch": 0.06, + "learning_rate": 4.986515544817525e-06, + "loss": 1.1268, + "step": 2061 + }, + { + "epoch": 0.06, + "learning_rate": 4.986490232850801e-06, + "loss": 1.1962, + "step": 2062 + }, + { + "epoch": 0.06, + "learning_rate": 4.9864648972138865e-06, + "loss": 1.1804, + "step": 2063 + }, + { + "epoch": 0.06, + "learning_rate": 4.986439537907024e-06, + "loss": 1.1846, + "step": 2064 + }, + { + "epoch": 0.06, + "learning_rate": 4.986414154930455e-06, + "loss": 1.0468, + "step": 2065 + }, + { + "epoch": 0.06, + "learning_rate": 4.986388748284421e-06, + "loss": 1.1806, + "step": 2066 + }, + { + "epoch": 0.06, + "learning_rate": 4.9863633179691624e-06, + "loss": 1.2271, + "step": 2067 + }, + { + "epoch": 0.06, + "learning_rate": 4.986337863984924e-06, + "loss": 1.2532, + "step": 2068 + }, + { + "epoch": 0.06, + "learning_rate": 4.986312386331945e-06, + "loss": 1.1546, + "step": 2069 + }, + { + "epoch": 0.06, + "learning_rate": 4.986286885010471e-06, + "loss": 1.2103, + "step": 2070 + }, + { + "epoch": 0.06, + "learning_rate": 4.986261360020742e-06, + "loss": 1.1544, + "step": 2071 + }, + { + "epoch": 0.06, + "learning_rate": 4.986235811363003e-06, + "loss": 1.1726, + "step": 2072 + }, + { + "epoch": 0.06, + "learning_rate": 4.986210239037496e-06, + "loss": 1.0778, + "step": 2073 + }, + { + "epoch": 0.06, + "learning_rate": 4.986184643044465e-06, + "loss": 1.0168, + "step": 2074 + }, + { + "epoch": 0.06, + "learning_rate": 4.986159023384154e-06, + "loss": 1.1907, + "step": 2075 + }, + { + "epoch": 0.06, + "learning_rate": 4.986133380056807e-06, + "loss": 1.2898, + "step": 2076 + }, + { + "epoch": 0.06, + "learning_rate": 4.986107713062667e-06, + "loss": 1.1855, + "step": 2077 + }, + { + "epoch": 0.06, + "learning_rate": 4.986082022401978e-06, + "loss": 1.1355, + "step": 2078 + }, + { + "epoch": 0.06, + "learning_rate": 4.986056308074987e-06, + "loss": 1.1967, + "step": 2079 + }, + { + "epoch": 0.06, + "learning_rate": 4.986030570081936e-06, + "loss": 1.1772, + "step": 2080 + }, + { + "epoch": 0.06, + "learning_rate": 4.986004808423072e-06, + "loss": 1.2101, + "step": 2081 + }, + { + "epoch": 0.06, + "learning_rate": 4.9859790230986396e-06, + "loss": 1.0864, + "step": 2082 + }, + { + "epoch": 0.06, + "learning_rate": 4.985953214108884e-06, + "loss": 1.0322, + "step": 2083 + }, + { + "epoch": 0.06, + "learning_rate": 4.985927381454051e-06, + "loss": 1.1594, + "step": 2084 + }, + { + "epoch": 0.06, + "learning_rate": 4.985901525134386e-06, + "loss": 1.2071, + "step": 2085 + }, + { + "epoch": 0.06, + "learning_rate": 4.985875645150137e-06, + "loss": 1.2257, + "step": 2086 + }, + { + "epoch": 0.06, + "learning_rate": 4.985849741501548e-06, + "loss": 1.1998, + "step": 2087 + }, + { + "epoch": 0.06, + "learning_rate": 4.985823814188868e-06, + "loss": 1.1614, + "step": 2088 + }, + { + "epoch": 0.06, + "learning_rate": 4.985797863212342e-06, + "loss": 1.3022, + "step": 2089 + }, + { + "epoch": 0.06, + "learning_rate": 4.985771888572216e-06, + "loss": 1.0962, + "step": 2090 + }, + { + "epoch": 0.06, + "learning_rate": 4.9857458902687405e-06, + "loss": 1.2693, + "step": 2091 + }, + { + "epoch": 0.06, + "learning_rate": 4.98571986830216e-06, + "loss": 1.3082, + "step": 2092 + }, + { + "epoch": 0.06, + "learning_rate": 4.985693822672725e-06, + "loss": 1.138, + "step": 2093 + }, + { + "epoch": 0.06, + "learning_rate": 4.985667753380681e-06, + "loss": 1.2204, + "step": 2094 + }, + { + "epoch": 0.06, + "learning_rate": 4.985641660426278e-06, + "loss": 1.1172, + "step": 2095 + }, + { + "epoch": 0.06, + "learning_rate": 4.985615543809763e-06, + "loss": 1.2186, + "step": 2096 + }, + { + "epoch": 0.06, + "learning_rate": 4.985589403531384e-06, + "loss": 1.1763, + "step": 2097 + }, + { + "epoch": 0.06, + "learning_rate": 4.985563239591394e-06, + "loss": 1.2863, + "step": 2098 + }, + { + "epoch": 0.06, + "learning_rate": 4.985537051990036e-06, + "loss": 1.1529, + "step": 2099 + }, + { + "epoch": 0.06, + "learning_rate": 4.9855108407275635e-06, + "loss": 1.0938, + "step": 2100 + }, + { + "epoch": 0.06, + "learning_rate": 4.985484605804225e-06, + "loss": 1.1229, + "step": 2101 + }, + { + "epoch": 0.06, + "learning_rate": 4.98545834722027e-06, + "loss": 1.1588, + "step": 2102 + }, + { + "epoch": 0.06, + "learning_rate": 4.985432064975948e-06, + "loss": 1.1784, + "step": 2103 + }, + { + "epoch": 0.06, + "learning_rate": 4.985405759071511e-06, + "loss": 1.1328, + "step": 2104 + }, + { + "epoch": 0.06, + "learning_rate": 4.985379429507206e-06, + "loss": 1.1092, + "step": 2105 + }, + { + "epoch": 0.06, + "learning_rate": 4.985353076283288e-06, + "loss": 1.2693, + "step": 2106 + }, + { + "epoch": 0.06, + "learning_rate": 4.985326699400005e-06, + "loss": 1.2052, + "step": 2107 + }, + { + "epoch": 0.06, + "learning_rate": 4.9853002988576085e-06, + "loss": 1.123, + "step": 2108 + }, + { + "epoch": 0.06, + "learning_rate": 4.985273874656351e-06, + "loss": 1.1243, + "step": 2109 + }, + { + "epoch": 0.06, + "learning_rate": 4.985247426796482e-06, + "loss": 1.2427, + "step": 2110 + }, + { + "epoch": 0.06, + "learning_rate": 4.9852209552782554e-06, + "loss": 1.1003, + "step": 2111 + }, + { + "epoch": 0.06, + "learning_rate": 4.985194460101922e-06, + "loss": 1.1159, + "step": 2112 + }, + { + "epoch": 0.06, + "learning_rate": 4.985167941267733e-06, + "loss": 1.1535, + "step": 2113 + }, + { + "epoch": 0.06, + "learning_rate": 4.9851413987759435e-06, + "loss": 1.1869, + "step": 2114 + }, + { + "epoch": 0.06, + "learning_rate": 4.985114832626805e-06, + "loss": 1.2016, + "step": 2115 + }, + { + "epoch": 0.06, + "learning_rate": 4.985088242820569e-06, + "loss": 1.1417, + "step": 2116 + }, + { + "epoch": 0.06, + "learning_rate": 4.985061629357491e-06, + "loss": 1.1628, + "step": 2117 + }, + { + "epoch": 0.06, + "learning_rate": 4.985034992237823e-06, + "loss": 1.1791, + "step": 2118 + }, + { + "epoch": 0.06, + "learning_rate": 4.985008331461817e-06, + "loss": 1.1371, + "step": 2119 + }, + { + "epoch": 0.06, + "learning_rate": 4.984981647029731e-06, + "loss": 1.2222, + "step": 2120 + }, + { + "epoch": 0.06, + "learning_rate": 4.984954938941815e-06, + "loss": 1.183, + "step": 2121 + }, + { + "epoch": 0.06, + "learning_rate": 4.984928207198325e-06, + "loss": 1.2257, + "step": 2122 + }, + { + "epoch": 0.06, + "learning_rate": 4.984901451799515e-06, + "loss": 1.2455, + "step": 2123 + }, + { + "epoch": 0.06, + "learning_rate": 4.98487467274564e-06, + "loss": 1.1484, + "step": 2124 + }, + { + "epoch": 0.06, + "learning_rate": 4.9848478700369555e-06, + "loss": 1.1837, + "step": 2125 + }, + { + "epoch": 0.06, + "learning_rate": 4.984821043673715e-06, + "loss": 1.2218, + "step": 2126 + }, + { + "epoch": 0.06, + "learning_rate": 4.984794193656176e-06, + "loss": 1.1821, + "step": 2127 + }, + { + "epoch": 0.06, + "learning_rate": 4.984767319984593e-06, + "loss": 1.1774, + "step": 2128 + }, + { + "epoch": 0.06, + "learning_rate": 4.984740422659221e-06, + "loss": 1.0772, + "step": 2129 + }, + { + "epoch": 0.06, + "learning_rate": 4.984713501680317e-06, + "loss": 1.2188, + "step": 2130 + }, + { + "epoch": 0.06, + "learning_rate": 4.984686557048137e-06, + "loss": 1.2906, + "step": 2131 + }, + { + "epoch": 0.06, + "learning_rate": 4.984659588762938e-06, + "loss": 1.145, + "step": 2132 + }, + { + "epoch": 0.06, + "learning_rate": 4.984632596824977e-06, + "loss": 1.1139, + "step": 2133 + }, + { + "epoch": 0.06, + "learning_rate": 4.98460558123451e-06, + "loss": 1.2003, + "step": 2134 + }, + { + "epoch": 0.06, + "learning_rate": 4.984578541991794e-06, + "loss": 1.1884, + "step": 2135 + }, + { + "epoch": 0.06, + "learning_rate": 4.9845514790970864e-06, + "loss": 1.1524, + "step": 2136 + }, + { + "epoch": 0.06, + "learning_rate": 4.984524392550646e-06, + "loss": 1.298, + "step": 2137 + }, + { + "epoch": 0.06, + "learning_rate": 4.9844972823527295e-06, + "loss": 1.1504, + "step": 2138 + }, + { + "epoch": 0.06, + "learning_rate": 4.984470148503596e-06, + "loss": 1.1605, + "step": 2139 + }, + { + "epoch": 0.06, + "learning_rate": 4.984442991003503e-06, + "loss": 1.2095, + "step": 2140 + }, + { + "epoch": 0.06, + "learning_rate": 4.98441580985271e-06, + "loss": 1.197, + "step": 2141 + }, + { + "epoch": 0.06, + "learning_rate": 4.984388605051474e-06, + "loss": 1.1713, + "step": 2142 + }, + { + "epoch": 0.06, + "learning_rate": 4.984361376600056e-06, + "loss": 1.2595, + "step": 2143 + }, + { + "epoch": 0.06, + "learning_rate": 4.984334124498714e-06, + "loss": 1.2227, + "step": 2144 + }, + { + "epoch": 0.06, + "learning_rate": 4.984306848747707e-06, + "loss": 1.1718, + "step": 2145 + }, + { + "epoch": 0.06, + "learning_rate": 4.9842795493472955e-06, + "loss": 1.2222, + "step": 2146 + }, + { + "epoch": 0.06, + "learning_rate": 4.984252226297739e-06, + "loss": 1.1146, + "step": 2147 + }, + { + "epoch": 0.06, + "learning_rate": 4.9842248795992985e-06, + "loss": 1.1503, + "step": 2148 + }, + { + "epoch": 0.06, + "learning_rate": 4.984197509252233e-06, + "loss": 1.2391, + "step": 2149 + }, + { + "epoch": 0.06, + "learning_rate": 4.984170115256803e-06, + "loss": 1.3014, + "step": 2150 + }, + { + "epoch": 0.06, + "learning_rate": 4.984142697613271e-06, + "loss": 1.168, + "step": 2151 + }, + { + "epoch": 0.06, + "learning_rate": 4.984115256321897e-06, + "loss": 1.1166, + "step": 2152 + }, + { + "epoch": 0.06, + "learning_rate": 4.984087791382941e-06, + "loss": 1.1064, + "step": 2153 + }, + { + "epoch": 0.06, + "learning_rate": 4.984060302796666e-06, + "loss": 1.0186, + "step": 2154 + }, + { + "epoch": 0.06, + "learning_rate": 4.984032790563334e-06, + "loss": 1.1801, + "step": 2155 + }, + { + "epoch": 0.06, + "learning_rate": 4.9840052546832065e-06, + "loss": 1.2991, + "step": 2156 + }, + { + "epoch": 0.06, + "learning_rate": 4.9839776951565445e-06, + "loss": 1.1566, + "step": 2157 + }, + { + "epoch": 0.07, + "learning_rate": 4.983950111983611e-06, + "loss": 1.1339, + "step": 2158 + }, + { + "epoch": 0.07, + "learning_rate": 4.983922505164669e-06, + "loss": 1.0595, + "step": 2159 + }, + { + "epoch": 0.07, + "learning_rate": 4.983894874699981e-06, + "loss": 1.1186, + "step": 2160 + }, + { + "epoch": 0.07, + "learning_rate": 4.98386722058981e-06, + "loss": 1.0469, + "step": 2161 + }, + { + "epoch": 0.07, + "learning_rate": 4.98383954283442e-06, + "loss": 1.2512, + "step": 2162 + }, + { + "epoch": 0.07, + "learning_rate": 4.983811841434073e-06, + "loss": 1.1202, + "step": 2163 + }, + { + "epoch": 0.07, + "learning_rate": 4.983784116389034e-06, + "loss": 1.1533, + "step": 2164 + }, + { + "epoch": 0.07, + "learning_rate": 4.983756367699566e-06, + "loss": 1.1595, + "step": 2165 + }, + { + "epoch": 0.07, + "learning_rate": 4.983728595365933e-06, + "loss": 1.2346, + "step": 2166 + }, + { + "epoch": 0.07, + "learning_rate": 4.983700799388401e-06, + "loss": 1.2028, + "step": 2167 + }, + { + "epoch": 0.07, + "learning_rate": 4.983672979767234e-06, + "loss": 1.2991, + "step": 2168 + }, + { + "epoch": 0.07, + "learning_rate": 4.983645136502696e-06, + "loss": 1.1478, + "step": 2169 + }, + { + "epoch": 0.07, + "learning_rate": 4.983617269595052e-06, + "loss": 1.1696, + "step": 2170 + }, + { + "epoch": 0.07, + "learning_rate": 4.983589379044568e-06, + "loss": 1.0733, + "step": 2171 + }, + { + "epoch": 0.07, + "learning_rate": 4.9835614648515095e-06, + "loss": 1.1381, + "step": 2172 + }, + { + "epoch": 0.07, + "learning_rate": 4.983533527016142e-06, + "loss": 1.2355, + "step": 2173 + }, + { + "epoch": 0.07, + "learning_rate": 4.983505565538731e-06, + "loss": 1.0709, + "step": 2174 + }, + { + "epoch": 0.07, + "learning_rate": 4.983477580419543e-06, + "loss": 1.2024, + "step": 2175 + }, + { + "epoch": 0.07, + "learning_rate": 4.983449571658845e-06, + "loss": 1.0659, + "step": 2176 + }, + { + "epoch": 0.07, + "learning_rate": 4.983421539256903e-06, + "loss": 1.2184, + "step": 2177 + }, + { + "epoch": 0.07, + "learning_rate": 4.983393483213984e-06, + "loss": 1.1708, + "step": 2178 + }, + { + "epoch": 0.07, + "learning_rate": 4.983365403530355e-06, + "loss": 1.0844, + "step": 2179 + }, + { + "epoch": 0.07, + "learning_rate": 4.9833373002062834e-06, + "loss": 1.0958, + "step": 2180 + }, + { + "epoch": 0.07, + "learning_rate": 4.983309173242037e-06, + "loss": 1.1794, + "step": 2181 + }, + { + "epoch": 0.07, + "learning_rate": 4.983281022637882e-06, + "loss": 1.2211, + "step": 2182 + }, + { + "epoch": 0.07, + "learning_rate": 4.983252848394089e-06, + "loss": 1.179, + "step": 2183 + }, + { + "epoch": 0.07, + "learning_rate": 4.983224650510925e-06, + "loss": 1.1646, + "step": 2184 + }, + { + "epoch": 0.07, + "learning_rate": 4.983196428988658e-06, + "loss": 1.0979, + "step": 2185 + }, + { + "epoch": 0.07, + "learning_rate": 4.9831681838275566e-06, + "loss": 1.1389, + "step": 2186 + }, + { + "epoch": 0.07, + "learning_rate": 4.98313991502789e-06, + "loss": 1.1805, + "step": 2187 + }, + { + "epoch": 0.07, + "learning_rate": 4.983111622589928e-06, + "loss": 1.1697, + "step": 2188 + }, + { + "epoch": 0.07, + "learning_rate": 4.983083306513938e-06, + "loss": 1.2897, + "step": 2189 + }, + { + "epoch": 0.07, + "learning_rate": 4.983054966800192e-06, + "loss": 1.1979, + "step": 2190 + }, + { + "epoch": 0.07, + "learning_rate": 4.983026603448958e-06, + "loss": 1.2167, + "step": 2191 + }, + { + "epoch": 0.07, + "learning_rate": 4.982998216460507e-06, + "loss": 1.1815, + "step": 2192 + }, + { + "epoch": 0.07, + "learning_rate": 4.9829698058351084e-06, + "loss": 1.1493, + "step": 2193 + }, + { + "epoch": 0.07, + "learning_rate": 4.9829413715730335e-06, + "loss": 1.0162, + "step": 2194 + }, + { + "epoch": 0.07, + "learning_rate": 4.982912913674552e-06, + "loss": 1.1607, + "step": 2195 + }, + { + "epoch": 0.07, + "learning_rate": 4.982884432139936e-06, + "loss": 1.1155, + "step": 2196 + }, + { + "epoch": 0.07, + "learning_rate": 4.982855926969456e-06, + "loss": 1.1547, + "step": 2197 + }, + { + "epoch": 0.07, + "learning_rate": 4.982827398163383e-06, + "loss": 1.1292, + "step": 2198 + }, + { + "epoch": 0.07, + "learning_rate": 4.982798845721989e-06, + "loss": 1.2045, + "step": 2199 + }, + { + "epoch": 0.07, + "learning_rate": 4.982770269645546e-06, + "loss": 1.2064, + "step": 2200 + }, + { + "epoch": 0.07, + "learning_rate": 4.982741669934326e-06, + "loss": 1.1305, + "step": 2201 + }, + { + "epoch": 0.07, + "learning_rate": 4.9827130465886e-06, + "loss": 1.1995, + "step": 2202 + }, + { + "epoch": 0.07, + "learning_rate": 4.982684399608642e-06, + "loss": 1.1302, + "step": 2203 + }, + { + "epoch": 0.07, + "learning_rate": 4.982655728994725e-06, + "loss": 1.1677, + "step": 2204 + }, + { + "epoch": 0.07, + "learning_rate": 4.98262703474712e-06, + "loss": 1.1941, + "step": 2205 + }, + { + "epoch": 0.07, + "learning_rate": 4.982598316866102e-06, + "loss": 1.1013, + "step": 2206 + }, + { + "epoch": 0.07, + "learning_rate": 4.982569575351943e-06, + "loss": 1.178, + "step": 2207 + }, + { + "epoch": 0.07, + "learning_rate": 4.982540810204917e-06, + "loss": 1.1371, + "step": 2208 + }, + { + "epoch": 0.07, + "learning_rate": 4.9825120214253e-06, + "loss": 1.0938, + "step": 2209 + }, + { + "epoch": 0.07, + "learning_rate": 4.982483209013363e-06, + "loss": 1.0757, + "step": 2210 + }, + { + "epoch": 0.07, + "learning_rate": 4.982454372969382e-06, + "loss": 1.3065, + "step": 2211 + }, + { + "epoch": 0.07, + "learning_rate": 4.98242551329363e-06, + "loss": 1.1896, + "step": 2212 + }, + { + "epoch": 0.07, + "learning_rate": 4.982396629986384e-06, + "loss": 1.2227, + "step": 2213 + }, + { + "epoch": 0.07, + "learning_rate": 4.9823677230479165e-06, + "loss": 1.1848, + "step": 2214 + }, + { + "epoch": 0.07, + "learning_rate": 4.982338792478504e-06, + "loss": 1.1598, + "step": 2215 + }, + { + "epoch": 0.07, + "learning_rate": 4.9823098382784215e-06, + "loss": 1.1686, + "step": 2216 + }, + { + "epoch": 0.07, + "learning_rate": 4.982280860447946e-06, + "loss": 1.1176, + "step": 2217 + }, + { + "epoch": 0.07, + "learning_rate": 4.982251858987351e-06, + "loss": 1.2499, + "step": 2218 + }, + { + "epoch": 0.07, + "learning_rate": 4.982222833896914e-06, + "loss": 1.3091, + "step": 2219 + }, + { + "epoch": 0.07, + "learning_rate": 4.9821937851769114e-06, + "loss": 1.2134, + "step": 2220 + }, + { + "epoch": 0.07, + "learning_rate": 4.982164712827619e-06, + "loss": 1.1296, + "step": 2221 + }, + { + "epoch": 0.07, + "learning_rate": 4.9821356168493154e-06, + "loss": 1.0604, + "step": 2222 + }, + { + "epoch": 0.07, + "learning_rate": 4.982106497242275e-06, + "loss": 1.1205, + "step": 2223 + }, + { + "epoch": 0.07, + "learning_rate": 4.982077354006775e-06, + "loss": 1.2728, + "step": 2224 + }, + { + "epoch": 0.07, + "learning_rate": 4.9820481871430955e-06, + "loss": 1.1606, + "step": 2225 + }, + { + "epoch": 0.07, + "learning_rate": 4.982018996651513e-06, + "loss": 1.126, + "step": 2226 + }, + { + "epoch": 0.07, + "learning_rate": 4.981989782532305e-06, + "loss": 1.1188, + "step": 2227 + }, + { + "epoch": 0.07, + "learning_rate": 4.981960544785749e-06, + "loss": 1.1991, + "step": 2228 + }, + { + "epoch": 0.07, + "learning_rate": 4.981931283412124e-06, + "loss": 1.1779, + "step": 2229 + }, + { + "epoch": 0.07, + "learning_rate": 4.981901998411708e-06, + "loss": 1.1218, + "step": 2230 + }, + { + "epoch": 0.07, + "learning_rate": 4.981872689784781e-06, + "loss": 1.251, + "step": 2231 + }, + { + "epoch": 0.07, + "learning_rate": 4.9818433575316215e-06, + "loss": 1.1664, + "step": 2232 + }, + { + "epoch": 0.07, + "learning_rate": 4.981814001652508e-06, + "loss": 1.2229, + "step": 2233 + }, + { + "epoch": 0.07, + "learning_rate": 4.981784622147721e-06, + "loss": 1.0662, + "step": 2234 + }, + { + "epoch": 0.07, + "learning_rate": 4.981755219017539e-06, + "loss": 1.1852, + "step": 2235 + }, + { + "epoch": 0.07, + "learning_rate": 4.981725792262243e-06, + "loss": 1.1641, + "step": 2236 + }, + { + "epoch": 0.07, + "learning_rate": 4.981696341882113e-06, + "loss": 1.2478, + "step": 2237 + }, + { + "epoch": 0.07, + "learning_rate": 4.981666867877429e-06, + "loss": 1.142, + "step": 2238 + }, + { + "epoch": 0.07, + "learning_rate": 4.981637370248471e-06, + "loss": 1.1741, + "step": 2239 + }, + { + "epoch": 0.07, + "learning_rate": 4.981607848995521e-06, + "loss": 1.1471, + "step": 2240 + }, + { + "epoch": 0.07, + "learning_rate": 4.981578304118859e-06, + "loss": 1.1365, + "step": 2241 + }, + { + "epoch": 0.07, + "learning_rate": 4.981548735618767e-06, + "loss": 1.1511, + "step": 2242 + }, + { + "epoch": 0.07, + "learning_rate": 4.981519143495526e-06, + "loss": 1.1849, + "step": 2243 + }, + { + "epoch": 0.07, + "learning_rate": 4.981489527749418e-06, + "loss": 1.1671, + "step": 2244 + }, + { + "epoch": 0.07, + "learning_rate": 4.981459888380725e-06, + "loss": 1.0894, + "step": 2245 + }, + { + "epoch": 0.07, + "learning_rate": 4.981430225389729e-06, + "loss": 1.0164, + "step": 2246 + }, + { + "epoch": 0.07, + "learning_rate": 4.981400538776713e-06, + "loss": 1.1099, + "step": 2247 + }, + { + "epoch": 0.07, + "learning_rate": 4.981370828541957e-06, + "loss": 1.2375, + "step": 2248 + }, + { + "epoch": 0.07, + "learning_rate": 4.981341094685747e-06, + "loss": 0.9931, + "step": 2249 + }, + { + "epoch": 0.07, + "learning_rate": 4.981311337208365e-06, + "loss": 1.1268, + "step": 2250 + }, + { + "epoch": 0.07, + "learning_rate": 4.981281556110094e-06, + "loss": 1.1611, + "step": 2251 + }, + { + "epoch": 0.07, + "learning_rate": 4.9812517513912175e-06, + "loss": 1.1666, + "step": 2252 + }, + { + "epoch": 0.07, + "learning_rate": 4.9812219230520195e-06, + "loss": 1.1737, + "step": 2253 + }, + { + "epoch": 0.07, + "learning_rate": 4.981192071092783e-06, + "loss": 1.1603, + "step": 2254 + }, + { + "epoch": 0.07, + "learning_rate": 4.981162195513794e-06, + "loss": 1.2158, + "step": 2255 + }, + { + "epoch": 0.07, + "learning_rate": 4.981132296315335e-06, + "loss": 1.0555, + "step": 2256 + }, + { + "epoch": 0.07, + "learning_rate": 4.9811023734976925e-06, + "loss": 1.236, + "step": 2257 + }, + { + "epoch": 0.07, + "learning_rate": 4.9810724270611495e-06, + "loss": 1.0659, + "step": 2258 + }, + { + "epoch": 0.07, + "learning_rate": 4.981042457005992e-06, + "loss": 1.1522, + "step": 2259 + }, + { + "epoch": 0.07, + "learning_rate": 4.9810124633325056e-06, + "loss": 1.0778, + "step": 2260 + }, + { + "epoch": 0.07, + "learning_rate": 4.980982446040975e-06, + "loss": 1.1776, + "step": 2261 + }, + { + "epoch": 0.07, + "learning_rate": 4.980952405131687e-06, + "loss": 1.3334, + "step": 2262 + }, + { + "epoch": 0.07, + "learning_rate": 4.9809223406049265e-06, + "loss": 1.2162, + "step": 2263 + }, + { + "epoch": 0.07, + "learning_rate": 4.98089225246098e-06, + "loss": 1.0953, + "step": 2264 + }, + { + "epoch": 0.07, + "learning_rate": 4.980862140700135e-06, + "loss": 1.1263, + "step": 2265 + }, + { + "epoch": 0.07, + "learning_rate": 4.980832005322677e-06, + "loss": 1.2361, + "step": 2266 + }, + { + "epoch": 0.07, + "learning_rate": 4.980801846328892e-06, + "loss": 1.173, + "step": 2267 + }, + { + "epoch": 0.07, + "learning_rate": 4.980771663719069e-06, + "loss": 1.079, + "step": 2268 + }, + { + "epoch": 0.07, + "learning_rate": 4.9807414574934945e-06, + "loss": 1.1881, + "step": 2269 + }, + { + "epoch": 0.07, + "learning_rate": 4.980711227652456e-06, + "loss": 1.2231, + "step": 2270 + }, + { + "epoch": 0.07, + "learning_rate": 4.980680974196242e-06, + "loss": 1.0372, + "step": 2271 + }, + { + "epoch": 0.07, + "learning_rate": 4.980650697125139e-06, + "loss": 1.088, + "step": 2272 + }, + { + "epoch": 0.07, + "learning_rate": 4.9806203964394366e-06, + "loss": 1.2313, + "step": 2273 + }, + { + "epoch": 0.07, + "learning_rate": 4.980590072139423e-06, + "loss": 1.1939, + "step": 2274 + }, + { + "epoch": 0.07, + "learning_rate": 4.9805597242253855e-06, + "loss": 1.1375, + "step": 2275 + }, + { + "epoch": 0.07, + "learning_rate": 4.980529352697615e-06, + "loss": 1.234, + "step": 2276 + }, + { + "epoch": 0.07, + "learning_rate": 4.980498957556399e-06, + "loss": 1.1048, + "step": 2277 + }, + { + "epoch": 0.07, + "learning_rate": 4.980468538802028e-06, + "loss": 1.032, + "step": 2278 + }, + { + "epoch": 0.07, + "learning_rate": 4.980438096434792e-06, + "loss": 1.1368, + "step": 2279 + }, + { + "epoch": 0.07, + "learning_rate": 4.980407630454978e-06, + "loss": 1.131, + "step": 2280 + }, + { + "epoch": 0.07, + "learning_rate": 4.9803771408628795e-06, + "loss": 1.1523, + "step": 2281 + }, + { + "epoch": 0.07, + "learning_rate": 4.980346627658785e-06, + "loss": 1.0834, + "step": 2282 + }, + { + "epoch": 0.07, + "learning_rate": 4.980316090842985e-06, + "loss": 1.1167, + "step": 2283 + }, + { + "epoch": 0.07, + "learning_rate": 4.9802855304157714e-06, + "loss": 1.2216, + "step": 2284 + }, + { + "epoch": 0.07, + "learning_rate": 4.980254946377432e-06, + "loss": 1.1779, + "step": 2285 + }, + { + "epoch": 0.07, + "learning_rate": 4.980224338728261e-06, + "loss": 1.1528, + "step": 2286 + }, + { + "epoch": 0.07, + "learning_rate": 4.980193707468549e-06, + "loss": 1.2634, + "step": 2287 + }, + { + "epoch": 0.07, + "learning_rate": 4.980163052598588e-06, + "loss": 1.0626, + "step": 2288 + }, + { + "epoch": 0.07, + "learning_rate": 4.980132374118668e-06, + "loss": 1.2542, + "step": 2289 + }, + { + "epoch": 0.07, + "learning_rate": 4.980101672029084e-06, + "loss": 1.2521, + "step": 2290 + }, + { + "epoch": 0.07, + "learning_rate": 4.9800709463301246e-06, + "loss": 1.2335, + "step": 2291 + }, + { + "epoch": 0.07, + "learning_rate": 4.980040197022085e-06, + "loss": 1.1328, + "step": 2292 + }, + { + "epoch": 0.07, + "learning_rate": 4.9800094241052575e-06, + "loss": 1.2114, + "step": 2293 + }, + { + "epoch": 0.07, + "learning_rate": 4.979978627579934e-06, + "loss": 1.1594, + "step": 2294 + }, + { + "epoch": 0.07, + "learning_rate": 4.979947807446409e-06, + "loss": 1.1752, + "step": 2295 + }, + { + "epoch": 0.07, + "learning_rate": 4.979916963704975e-06, + "loss": 1.137, + "step": 2296 + }, + { + "epoch": 0.07, + "learning_rate": 4.979886096355926e-06, + "loss": 1.1866, + "step": 2297 + }, + { + "epoch": 0.07, + "learning_rate": 4.979855205399555e-06, + "loss": 1.1406, + "step": 2298 + }, + { + "epoch": 0.07, + "learning_rate": 4.979824290836158e-06, + "loss": 1.165, + "step": 2299 + }, + { + "epoch": 0.07, + "learning_rate": 4.979793352666027e-06, + "loss": 1.1973, + "step": 2300 + }, + { + "epoch": 0.07, + "learning_rate": 4.979762390889459e-06, + "loss": 1.274, + "step": 2301 + }, + { + "epoch": 0.07, + "learning_rate": 4.979731405506746e-06, + "loss": 1.1204, + "step": 2302 + }, + { + "epoch": 0.07, + "learning_rate": 4.979700396518184e-06, + "loss": 1.156, + "step": 2303 + }, + { + "epoch": 0.07, + "learning_rate": 4.97966936392407e-06, + "loss": 1.0836, + "step": 2304 + }, + { + "epoch": 0.07, + "learning_rate": 4.979638307724697e-06, + "loss": 1.1205, + "step": 2305 + }, + { + "epoch": 0.07, + "learning_rate": 4.979607227920361e-06, + "loss": 1.1871, + "step": 2306 + }, + { + "epoch": 0.07, + "learning_rate": 4.97957612451136e-06, + "loss": 1.1699, + "step": 2307 + }, + { + "epoch": 0.07, + "learning_rate": 4.979544997497987e-06, + "loss": 1.1917, + "step": 2308 + }, + { + "epoch": 0.07, + "learning_rate": 4.979513846880541e-06, + "loss": 1.1547, + "step": 2309 + }, + { + "epoch": 0.07, + "learning_rate": 4.979482672659316e-06, + "loss": 1.1471, + "step": 2310 + }, + { + "epoch": 0.07, + "learning_rate": 4.97945147483461e-06, + "loss": 1.0533, + "step": 2311 + }, + { + "epoch": 0.07, + "learning_rate": 4.979420253406721e-06, + "loss": 1.2097, + "step": 2312 + }, + { + "epoch": 0.07, + "learning_rate": 4.9793890083759455e-06, + "loss": 1.1167, + "step": 2313 + }, + { + "epoch": 0.07, + "learning_rate": 4.9793577397425805e-06, + "loss": 1.1902, + "step": 2314 + }, + { + "epoch": 0.07, + "learning_rate": 4.979326447506924e-06, + "loss": 1.2245, + "step": 2315 + }, + { + "epoch": 0.07, + "learning_rate": 4.979295131669274e-06, + "loss": 1.1899, + "step": 2316 + }, + { + "epoch": 0.07, + "learning_rate": 4.979263792229928e-06, + "loss": 1.1754, + "step": 2317 + }, + { + "epoch": 0.07, + "learning_rate": 4.979232429189184e-06, + "loss": 1.2415, + "step": 2318 + }, + { + "epoch": 0.07, + "learning_rate": 4.979201042547342e-06, + "loss": 1.1138, + "step": 2319 + }, + { + "epoch": 0.07, + "learning_rate": 4.979169632304701e-06, + "loss": 1.1331, + "step": 2320 + }, + { + "epoch": 0.07, + "learning_rate": 4.979138198461559e-06, + "loss": 1.1368, + "step": 2321 + }, + { + "epoch": 0.07, + "learning_rate": 4.979106741018214e-06, + "loss": 1.1993, + "step": 2322 + }, + { + "epoch": 0.07, + "learning_rate": 4.979075259974968e-06, + "loss": 1.1702, + "step": 2323 + }, + { + "epoch": 0.07, + "learning_rate": 4.979043755332119e-06, + "loss": 1.213, + "step": 2324 + }, + { + "epoch": 0.07, + "learning_rate": 4.979012227089967e-06, + "loss": 1.1058, + "step": 2325 + }, + { + "epoch": 0.07, + "learning_rate": 4.978980675248814e-06, + "loss": 1.1371, + "step": 2326 + }, + { + "epoch": 0.07, + "learning_rate": 4.978949099808957e-06, + "loss": 1.1645, + "step": 2327 + }, + { + "epoch": 0.07, + "learning_rate": 4.9789175007706994e-06, + "loss": 1.2356, + "step": 2328 + }, + { + "epoch": 0.07, + "learning_rate": 4.978885878134341e-06, + "loss": 1.1613, + "step": 2329 + }, + { + "epoch": 0.07, + "learning_rate": 4.978854231900183e-06, + "loss": 1.2551, + "step": 2330 + }, + { + "epoch": 0.07, + "learning_rate": 4.978822562068526e-06, + "loss": 1.1619, + "step": 2331 + }, + { + "epoch": 0.07, + "learning_rate": 4.978790868639673e-06, + "loss": 1.0833, + "step": 2332 + }, + { + "epoch": 0.07, + "learning_rate": 4.978759151613925e-06, + "loss": 1.1229, + "step": 2333 + }, + { + "epoch": 0.07, + "learning_rate": 4.978727410991582e-06, + "loss": 1.1117, + "step": 2334 + }, + { + "epoch": 0.07, + "learning_rate": 4.978695646772949e-06, + "loss": 1.0671, + "step": 2335 + }, + { + "epoch": 0.07, + "learning_rate": 4.9786638589583266e-06, + "loss": 1.0976, + "step": 2336 + }, + { + "epoch": 0.07, + "learning_rate": 4.978632047548018e-06, + "loss": 1.2671, + "step": 2337 + }, + { + "epoch": 0.07, + "learning_rate": 4.978600212542327e-06, + "loss": 1.0799, + "step": 2338 + }, + { + "epoch": 0.07, + "learning_rate": 4.978568353941555e-06, + "loss": 1.1379, + "step": 2339 + }, + { + "epoch": 0.07, + "learning_rate": 4.978536471746007e-06, + "loss": 1.1131, + "step": 2340 + }, + { + "epoch": 0.07, + "learning_rate": 4.978504565955985e-06, + "loss": 1.1287, + "step": 2341 + }, + { + "epoch": 0.07, + "learning_rate": 4.978472636571793e-06, + "loss": 1.2994, + "step": 2342 + }, + { + "epoch": 0.07, + "learning_rate": 4.978440683593735e-06, + "loss": 1.1185, + "step": 2343 + }, + { + "epoch": 0.07, + "learning_rate": 4.978408707022115e-06, + "loss": 1.1789, + "step": 2344 + }, + { + "epoch": 0.07, + "learning_rate": 4.9783767068572385e-06, + "loss": 1.0994, + "step": 2345 + }, + { + "epoch": 0.07, + "learning_rate": 4.9783446830994085e-06, + "loss": 1.2245, + "step": 2346 + }, + { + "epoch": 0.07, + "learning_rate": 4.978312635748932e-06, + "loss": 1.1163, + "step": 2347 + }, + { + "epoch": 0.07, + "learning_rate": 4.9782805648061116e-06, + "loss": 1.1753, + "step": 2348 + }, + { + "epoch": 0.07, + "learning_rate": 4.9782484702712546e-06, + "loss": 1.1606, + "step": 2349 + }, + { + "epoch": 0.07, + "learning_rate": 4.978216352144666e-06, + "loss": 1.0797, + "step": 2350 + }, + { + "epoch": 0.07, + "learning_rate": 4.97818421042665e-06, + "loss": 1.0815, + "step": 2351 + }, + { + "epoch": 0.07, + "learning_rate": 4.9781520451175144e-06, + "loss": 1.1744, + "step": 2352 + }, + { + "epoch": 0.07, + "learning_rate": 4.978119856217565e-06, + "loss": 1.2491, + "step": 2353 + }, + { + "epoch": 0.07, + "learning_rate": 4.978087643727108e-06, + "loss": 1.0422, + "step": 2354 + }, + { + "epoch": 0.07, + "learning_rate": 4.978055407646451e-06, + "loss": 1.111, + "step": 2355 + }, + { + "epoch": 0.07, + "learning_rate": 4.978023147975899e-06, + "loss": 1.1661, + "step": 2356 + }, + { + "epoch": 0.07, + "learning_rate": 4.97799086471576e-06, + "loss": 1.2323, + "step": 2357 + }, + { + "epoch": 0.07, + "learning_rate": 4.977958557866342e-06, + "loss": 1.2089, + "step": 2358 + }, + { + "epoch": 0.07, + "learning_rate": 4.977926227427951e-06, + "loss": 1.1785, + "step": 2359 + }, + { + "epoch": 0.07, + "learning_rate": 4.977893873400898e-06, + "loss": 1.2303, + "step": 2360 + }, + { + "epoch": 0.07, + "learning_rate": 4.977861495785487e-06, + "loss": 1.067, + "step": 2361 + }, + { + "epoch": 0.07, + "learning_rate": 4.9778290945820276e-06, + "loss": 1.2122, + "step": 2362 + }, + { + "epoch": 0.07, + "learning_rate": 4.977796669790829e-06, + "loss": 1.1307, + "step": 2363 + }, + { + "epoch": 0.07, + "learning_rate": 4.977764221412199e-06, + "loss": 1.2812, + "step": 2364 + }, + { + "epoch": 0.07, + "learning_rate": 4.977731749446448e-06, + "loss": 1.1005, + "step": 2365 + }, + { + "epoch": 0.07, + "learning_rate": 4.977699253893883e-06, + "loss": 1.1333, + "step": 2366 + }, + { + "epoch": 0.07, + "learning_rate": 4.977666734754814e-06, + "loss": 1.1681, + "step": 2367 + }, + { + "epoch": 0.07, + "learning_rate": 4.977634192029553e-06, + "loss": 1.1792, + "step": 2368 + }, + { + "epoch": 0.07, + "learning_rate": 4.977601625718407e-06, + "loss": 1.1215, + "step": 2369 + }, + { + "epoch": 0.07, + "learning_rate": 4.977569035821686e-06, + "loss": 1.1732, + "step": 2370 + }, + { + "epoch": 0.07, + "learning_rate": 4.977536422339701e-06, + "loss": 1.1243, + "step": 2371 + }, + { + "epoch": 0.07, + "learning_rate": 4.977503785272764e-06, + "loss": 1.2002, + "step": 2372 + }, + { + "epoch": 0.07, + "learning_rate": 4.977471124621183e-06, + "loss": 1.0992, + "step": 2373 + }, + { + "epoch": 0.07, + "learning_rate": 4.977438440385269e-06, + "loss": 1.1509, + "step": 2374 + }, + { + "epoch": 0.07, + "learning_rate": 4.977405732565336e-06, + "loss": 1.1221, + "step": 2375 + }, + { + "epoch": 0.07, + "learning_rate": 4.9773730011616924e-06, + "loss": 1.2218, + "step": 2376 + }, + { + "epoch": 0.07, + "learning_rate": 4.9773402461746525e-06, + "loss": 1.1924, + "step": 2377 + }, + { + "epoch": 0.07, + "learning_rate": 4.9773074676045256e-06, + "loss": 1.1934, + "step": 2378 + }, + { + "epoch": 0.07, + "learning_rate": 4.977274665451625e-06, + "loss": 1.2609, + "step": 2379 + }, + { + "epoch": 0.07, + "learning_rate": 4.9772418397162614e-06, + "loss": 1.2697, + "step": 2380 + }, + { + "epoch": 0.07, + "learning_rate": 4.977208990398749e-06, + "loss": 1.2703, + "step": 2381 + }, + { + "epoch": 0.07, + "learning_rate": 4.977176117499401e-06, + "loss": 1.106, + "step": 2382 + }, + { + "epoch": 0.07, + "learning_rate": 4.97714322101853e-06, + "loss": 1.1057, + "step": 2383 + }, + { + "epoch": 0.07, + "learning_rate": 4.977110300956447e-06, + "loss": 1.1178, + "step": 2384 + }, + { + "epoch": 0.07, + "learning_rate": 4.9770773573134675e-06, + "loss": 1.1903, + "step": 2385 + }, + { + "epoch": 0.07, + "learning_rate": 4.977044390089905e-06, + "loss": 1.1535, + "step": 2386 + }, + { + "epoch": 0.07, + "learning_rate": 4.977011399286072e-06, + "loss": 1.2194, + "step": 2387 + }, + { + "epoch": 0.07, + "learning_rate": 4.976978384902284e-06, + "loss": 1.1818, + "step": 2388 + }, + { + "epoch": 0.07, + "learning_rate": 4.976945346938855e-06, + "loss": 1.1967, + "step": 2389 + }, + { + "epoch": 0.07, + "learning_rate": 4.976912285396099e-06, + "loss": 1.1846, + "step": 2390 + }, + { + "epoch": 0.07, + "learning_rate": 4.976879200274332e-06, + "loss": 1.1074, + "step": 2391 + }, + { + "epoch": 0.07, + "learning_rate": 4.976846091573866e-06, + "loss": 1.1339, + "step": 2392 + }, + { + "epoch": 0.07, + "learning_rate": 4.9768129592950195e-06, + "loss": 1.2009, + "step": 2393 + }, + { + "epoch": 0.07, + "learning_rate": 4.976779803438106e-06, + "loss": 1.1778, + "step": 2394 + }, + { + "epoch": 0.07, + "learning_rate": 4.976746624003441e-06, + "loss": 1.2021, + "step": 2395 + }, + { + "epoch": 0.07, + "learning_rate": 4.976713420991341e-06, + "loss": 1.1251, + "step": 2396 + }, + { + "epoch": 0.07, + "learning_rate": 4.976680194402124e-06, + "loss": 1.1, + "step": 2397 + }, + { + "epoch": 0.07, + "learning_rate": 4.976646944236102e-06, + "loss": 1.1834, + "step": 2398 + }, + { + "epoch": 0.07, + "learning_rate": 4.9766136704935955e-06, + "loss": 1.2394, + "step": 2399 + }, + { + "epoch": 0.07, + "learning_rate": 4.976580373174919e-06, + "loss": 1.1287, + "step": 2400 + }, + { + "epoch": 0.07, + "learning_rate": 4.97654705228039e-06, + "loss": 1.1708, + "step": 2401 + }, + { + "epoch": 0.07, + "learning_rate": 4.976513707810326e-06, + "loss": 1.0304, + "step": 2402 + }, + { + "epoch": 0.07, + "learning_rate": 4.976480339765044e-06, + "loss": 1.1447, + "step": 2403 + }, + { + "epoch": 0.07, + "learning_rate": 4.976446948144862e-06, + "loss": 1.2693, + "step": 2404 + }, + { + "epoch": 0.07, + "learning_rate": 4.976413532950098e-06, + "loss": 1.2212, + "step": 2405 + }, + { + "epoch": 0.07, + "learning_rate": 4.976380094181069e-06, + "loss": 1.2423, + "step": 2406 + }, + { + "epoch": 0.07, + "learning_rate": 4.9763466318380954e-06, + "loss": 1.0923, + "step": 2407 + }, + { + "epoch": 0.07, + "learning_rate": 4.976313145921494e-06, + "loss": 1.2371, + "step": 2408 + }, + { + "epoch": 0.07, + "learning_rate": 4.976279636431583e-06, + "loss": 1.165, + "step": 2409 + }, + { + "epoch": 0.07, + "learning_rate": 4.976246103368685e-06, + "loss": 1.255, + "step": 2410 + }, + { + "epoch": 0.07, + "learning_rate": 4.976212546733115e-06, + "loss": 1.3843, + "step": 2411 + }, + { + "epoch": 0.07, + "learning_rate": 4.9761789665251935e-06, + "loss": 1.1589, + "step": 2412 + }, + { + "epoch": 0.07, + "learning_rate": 4.976145362745241e-06, + "loss": 1.1118, + "step": 2413 + }, + { + "epoch": 0.07, + "learning_rate": 4.9761117353935785e-06, + "loss": 1.1894, + "step": 2414 + }, + { + "epoch": 0.07, + "learning_rate": 4.9760780844705245e-06, + "loss": 1.1779, + "step": 2415 + }, + { + "epoch": 0.07, + "learning_rate": 4.976044409976399e-06, + "loss": 1.0919, + "step": 2416 + }, + { + "epoch": 0.07, + "learning_rate": 4.976010711911523e-06, + "loss": 1.2932, + "step": 2417 + }, + { + "epoch": 0.07, + "learning_rate": 4.975976990276219e-06, + "loss": 1.2516, + "step": 2418 + }, + { + "epoch": 0.07, + "learning_rate": 4.975943245070805e-06, + "loss": 1.0366, + "step": 2419 + }, + { + "epoch": 0.07, + "learning_rate": 4.9759094762956045e-06, + "loss": 1.1572, + "step": 2420 + }, + { + "epoch": 0.07, + "learning_rate": 4.975875683950938e-06, + "loss": 1.0662, + "step": 2421 + }, + { + "epoch": 0.07, + "learning_rate": 4.975841868037128e-06, + "loss": 1.1621, + "step": 2422 + }, + { + "epoch": 0.07, + "learning_rate": 4.9758080285544955e-06, + "loss": 1.1382, + "step": 2423 + }, + { + "epoch": 0.07, + "learning_rate": 4.975774165503362e-06, + "loss": 1.2424, + "step": 2424 + }, + { + "epoch": 0.07, + "learning_rate": 4.975740278884051e-06, + "loss": 1.1293, + "step": 2425 + }, + { + "epoch": 0.07, + "learning_rate": 4.975706368696886e-06, + "loss": 1.1731, + "step": 2426 + }, + { + "epoch": 0.07, + "learning_rate": 4.975672434942188e-06, + "loss": 1.134, + "step": 2427 + }, + { + "epoch": 0.07, + "learning_rate": 4.975638477620281e-06, + "loss": 1.1519, + "step": 2428 + }, + { + "epoch": 0.07, + "learning_rate": 4.975604496731488e-06, + "loss": 1.2087, + "step": 2429 + }, + { + "epoch": 0.07, + "learning_rate": 4.975570492276133e-06, + "loss": 1.2567, + "step": 2430 + }, + { + "epoch": 0.07, + "learning_rate": 4.975536464254538e-06, + "loss": 1.1942, + "step": 2431 + }, + { + "epoch": 0.07, + "learning_rate": 4.975502412667029e-06, + "loss": 1.0864, + "step": 2432 + }, + { + "epoch": 0.07, + "learning_rate": 4.975468337513929e-06, + "loss": 1.1124, + "step": 2433 + }, + { + "epoch": 0.07, + "learning_rate": 4.975434238795563e-06, + "loss": 1.0667, + "step": 2434 + }, + { + "epoch": 0.07, + "learning_rate": 4.975400116512255e-06, + "loss": 1.1107, + "step": 2435 + }, + { + "epoch": 0.07, + "learning_rate": 4.975365970664329e-06, + "loss": 1.1589, + "step": 2436 + }, + { + "epoch": 0.07, + "learning_rate": 4.975331801252113e-06, + "loss": 1.2238, + "step": 2437 + }, + { + "epoch": 0.07, + "learning_rate": 4.975297608275929e-06, + "loss": 1.176, + "step": 2438 + }, + { + "epoch": 0.07, + "learning_rate": 4.975263391736104e-06, + "loss": 1.1591, + "step": 2439 + }, + { + "epoch": 0.07, + "learning_rate": 4.975229151632965e-06, + "loss": 1.1592, + "step": 2440 + }, + { + "epoch": 0.07, + "learning_rate": 4.975194887966835e-06, + "loss": 1.153, + "step": 2441 + }, + { + "epoch": 0.07, + "learning_rate": 4.975160600738042e-06, + "loss": 1.1093, + "step": 2442 + }, + { + "epoch": 0.07, + "learning_rate": 4.975126289946913e-06, + "loss": 1.2509, + "step": 2443 + }, + { + "epoch": 0.07, + "learning_rate": 4.975091955593773e-06, + "loss": 1.1122, + "step": 2444 + }, + { + "epoch": 0.07, + "learning_rate": 4.9750575976789505e-06, + "loss": 1.1119, + "step": 2445 + }, + { + "epoch": 0.07, + "learning_rate": 4.975023216202771e-06, + "loss": 1.0353, + "step": 2446 + }, + { + "epoch": 0.07, + "learning_rate": 4.974988811165563e-06, + "loss": 1.1084, + "step": 2447 + }, + { + "epoch": 0.07, + "learning_rate": 4.974954382567652e-06, + "loss": 1.1622, + "step": 2448 + }, + { + "epoch": 0.07, + "learning_rate": 4.974919930409369e-06, + "loss": 1.1669, + "step": 2449 + }, + { + "epoch": 0.07, + "learning_rate": 4.9748854546910395e-06, + "loss": 1.0735, + "step": 2450 + }, + { + "epoch": 0.07, + "learning_rate": 4.9748509554129934e-06, + "loss": 1.241, + "step": 2451 + }, + { + "epoch": 0.07, + "learning_rate": 4.974816432575557e-06, + "loss": 1.157, + "step": 2452 + }, + { + "epoch": 0.07, + "learning_rate": 4.97478188617906e-06, + "loss": 1.1154, + "step": 2453 + }, + { + "epoch": 0.07, + "learning_rate": 4.974747316223832e-06, + "loss": 1.2094, + "step": 2454 + }, + { + "epoch": 0.07, + "learning_rate": 4.974712722710201e-06, + "loss": 1.1556, + "step": 2455 + }, + { + "epoch": 0.07, + "learning_rate": 4.974678105638497e-06, + "loss": 1.1713, + "step": 2456 + }, + { + "epoch": 0.07, + "learning_rate": 4.974643465009049e-06, + "loss": 1.1448, + "step": 2457 + }, + { + "epoch": 0.07, + "learning_rate": 4.974608800822187e-06, + "loss": 1.1714, + "step": 2458 + }, + { + "epoch": 0.07, + "learning_rate": 4.974574113078242e-06, + "loss": 1.2101, + "step": 2459 + }, + { + "epoch": 0.07, + "learning_rate": 4.974539401777542e-06, + "loss": 1.0562, + "step": 2460 + }, + { + "epoch": 0.07, + "learning_rate": 4.974504666920419e-06, + "loss": 1.2665, + "step": 2461 + }, + { + "epoch": 0.07, + "learning_rate": 4.974469908507204e-06, + "loss": 1.1498, + "step": 2462 + }, + { + "epoch": 0.07, + "learning_rate": 4.974435126538227e-06, + "loss": 1.092, + "step": 2463 + }, + { + "epoch": 0.07, + "learning_rate": 4.9744003210138185e-06, + "loss": 1.1398, + "step": 2464 + }, + { + "epoch": 0.07, + "learning_rate": 4.974365491934312e-06, + "loss": 1.1497, + "step": 2465 + }, + { + "epoch": 0.07, + "learning_rate": 4.974330639300036e-06, + "loss": 1.1255, + "step": 2466 + }, + { + "epoch": 0.07, + "learning_rate": 4.9742957631113255e-06, + "loss": 1.2872, + "step": 2467 + }, + { + "epoch": 0.07, + "learning_rate": 4.97426086336851e-06, + "loss": 1.2933, + "step": 2468 + }, + { + "epoch": 0.07, + "learning_rate": 4.9742259400719235e-06, + "loss": 1.1274, + "step": 2469 + }, + { + "epoch": 0.07, + "learning_rate": 4.974190993221897e-06, + "loss": 1.1566, + "step": 2470 + }, + { + "epoch": 0.07, + "learning_rate": 4.974156022818765e-06, + "loss": 1.1383, + "step": 2471 + }, + { + "epoch": 0.07, + "learning_rate": 4.974121028862858e-06, + "loss": 1.1602, + "step": 2472 + }, + { + "epoch": 0.07, + "learning_rate": 4.974086011354511e-06, + "loss": 1.1967, + "step": 2473 + }, + { + "epoch": 0.07, + "learning_rate": 4.974050970294056e-06, + "loss": 1.1019, + "step": 2474 + }, + { + "epoch": 0.07, + "learning_rate": 4.974015905681828e-06, + "loss": 1.1178, + "step": 2475 + }, + { + "epoch": 0.07, + "learning_rate": 4.97398081751816e-06, + "loss": 1.1069, + "step": 2476 + }, + { + "epoch": 0.07, + "learning_rate": 4.973945705803385e-06, + "loss": 1.1702, + "step": 2477 + }, + { + "epoch": 0.07, + "learning_rate": 4.9739105705378405e-06, + "loss": 1.1865, + "step": 2478 + }, + { + "epoch": 0.07, + "learning_rate": 4.973875411721858e-06, + "loss": 1.1039, + "step": 2479 + }, + { + "epoch": 0.07, + "learning_rate": 4.973840229355772e-06, + "loss": 1.2833, + "step": 2480 + }, + { + "epoch": 0.07, + "learning_rate": 4.973805023439919e-06, + "loss": 1.1337, + "step": 2481 + }, + { + "epoch": 0.07, + "learning_rate": 4.973769793974634e-06, + "loss": 1.2246, + "step": 2482 + }, + { + "epoch": 0.07, + "learning_rate": 4.973734540960252e-06, + "loss": 1.0942, + "step": 2483 + }, + { + "epoch": 0.07, + "learning_rate": 4.973699264397109e-06, + "loss": 1.1484, + "step": 2484 + }, + { + "epoch": 0.07, + "learning_rate": 4.97366396428554e-06, + "loss": 1.1165, + "step": 2485 + }, + { + "epoch": 0.07, + "learning_rate": 4.973628640625881e-06, + "loss": 1.2441, + "step": 2486 + }, + { + "epoch": 0.07, + "learning_rate": 4.973593293418469e-06, + "loss": 1.1199, + "step": 2487 + }, + { + "epoch": 0.07, + "learning_rate": 4.97355792266364e-06, + "loss": 1.1995, + "step": 2488 + }, + { + "epoch": 0.07, + "learning_rate": 4.973522528361731e-06, + "loss": 1.2446, + "step": 2489 + }, + { + "epoch": 0.08, + "learning_rate": 4.973487110513079e-06, + "loss": 1.1167, + "step": 2490 + }, + { + "epoch": 0.08, + "learning_rate": 4.97345166911802e-06, + "loss": 1.1309, + "step": 2491 + }, + { + "epoch": 0.08, + "learning_rate": 4.973416204176893e-06, + "loss": 1.2407, + "step": 2492 + }, + { + "epoch": 0.08, + "learning_rate": 4.973380715690036e-06, + "loss": 1.1092, + "step": 2493 + }, + { + "epoch": 0.08, + "learning_rate": 4.973345203657785e-06, + "loss": 1.1184, + "step": 2494 + }, + { + "epoch": 0.08, + "learning_rate": 4.9733096680804785e-06, + "loss": 1.1964, + "step": 2495 + }, + { + "epoch": 0.08, + "learning_rate": 4.973274108958455e-06, + "loss": 1.2279, + "step": 2496 + }, + { + "epoch": 0.08, + "learning_rate": 4.973238526292054e-06, + "loss": 1.1384, + "step": 2497 + }, + { + "epoch": 0.08, + "learning_rate": 4.973202920081612e-06, + "loss": 1.1202, + "step": 2498 + }, + { + "epoch": 0.08, + "learning_rate": 4.973167290327471e-06, + "loss": 1.1771, + "step": 2499 + }, + { + "epoch": 0.08, + "learning_rate": 4.973131637029967e-06, + "loss": 1.2191, + "step": 2500 + }, + { + "epoch": 0.08, + "learning_rate": 4.973095960189443e-06, + "loss": 1.0993, + "step": 2501 + }, + { + "epoch": 0.08, + "learning_rate": 4.9730602598062346e-06, + "loss": 1.1334, + "step": 2502 + }, + { + "epoch": 0.08, + "learning_rate": 4.973024535880684e-06, + "loss": 1.0573, + "step": 2503 + }, + { + "epoch": 0.08, + "learning_rate": 4.972988788413131e-06, + "loss": 1.2072, + "step": 2504 + }, + { + "epoch": 0.08, + "learning_rate": 4.972953017403917e-06, + "loss": 1.1862, + "step": 2505 + }, + { + "epoch": 0.08, + "learning_rate": 4.972917222853379e-06, + "loss": 1.1123, + "step": 2506 + }, + { + "epoch": 0.08, + "learning_rate": 4.972881404761861e-06, + "loss": 1.1371, + "step": 2507 + }, + { + "epoch": 0.08, + "learning_rate": 4.972845563129704e-06, + "loss": 1.1373, + "step": 2508 + }, + { + "epoch": 0.08, + "learning_rate": 4.972809697957247e-06, + "loss": 1.0532, + "step": 2509 + }, + { + "epoch": 0.08, + "learning_rate": 4.972773809244833e-06, + "loss": 1.0837, + "step": 2510 + }, + { + "epoch": 0.08, + "learning_rate": 4.972737896992804e-06, + "loss": 1.2242, + "step": 2511 + }, + { + "epoch": 0.08, + "learning_rate": 4.9727019612015e-06, + "loss": 1.2007, + "step": 2512 + }, + { + "epoch": 0.08, + "learning_rate": 4.9726660018712645e-06, + "loss": 1.1073, + "step": 2513 + }, + { + "epoch": 0.08, + "learning_rate": 4.9726300190024405e-06, + "loss": 1.2397, + "step": 2514 + }, + { + "epoch": 0.08, + "learning_rate": 4.972594012595369e-06, + "loss": 1.1414, + "step": 2515 + }, + { + "epoch": 0.08, + "learning_rate": 4.9725579826503924e-06, + "loss": 1.1888, + "step": 2516 + }, + { + "epoch": 0.08, + "learning_rate": 4.972521929167855e-06, + "loss": 1.1206, + "step": 2517 + }, + { + "epoch": 0.08, + "learning_rate": 4.9724858521481005e-06, + "loss": 1.1288, + "step": 2518 + }, + { + "epoch": 0.08, + "learning_rate": 4.972449751591471e-06, + "loss": 1.0701, + "step": 2519 + }, + { + "epoch": 0.08, + "learning_rate": 4.972413627498311e-06, + "loss": 1.0913, + "step": 2520 + }, + { + "epoch": 0.08, + "learning_rate": 4.972377479868963e-06, + "loss": 1.2262, + "step": 2521 + }, + { + "epoch": 0.08, + "learning_rate": 4.972341308703773e-06, + "loss": 1.2351, + "step": 2522 + }, + { + "epoch": 0.08, + "learning_rate": 4.972305114003084e-06, + "loss": 1.1095, + "step": 2523 + }, + { + "epoch": 0.08, + "learning_rate": 4.972268895767242e-06, + "loss": 1.3137, + "step": 2524 + }, + { + "epoch": 0.08, + "learning_rate": 4.9722326539965895e-06, + "loss": 1.3156, + "step": 2525 + }, + { + "epoch": 0.08, + "learning_rate": 4.972196388691473e-06, + "loss": 1.1651, + "step": 2526 + }, + { + "epoch": 0.08, + "learning_rate": 4.972160099852238e-06, + "loss": 1.2574, + "step": 2527 + }, + { + "epoch": 0.08, + "learning_rate": 4.9721237874792294e-06, + "loss": 1.2234, + "step": 2528 + }, + { + "epoch": 0.08, + "learning_rate": 4.972087451572793e-06, + "loss": 1.1858, + "step": 2529 + }, + { + "epoch": 0.08, + "learning_rate": 4.972051092133274e-06, + "loss": 1.1736, + "step": 2530 + }, + { + "epoch": 0.08, + "learning_rate": 4.972014709161021e-06, + "loss": 1.3253, + "step": 2531 + }, + { + "epoch": 0.08, + "learning_rate": 4.971978302656377e-06, + "loss": 1.1191, + "step": 2532 + }, + { + "epoch": 0.08, + "learning_rate": 4.97194187261969e-06, + "loss": 1.1828, + "step": 2533 + }, + { + "epoch": 0.08, + "learning_rate": 4.971905419051307e-06, + "loss": 1.1091, + "step": 2534 + }, + { + "epoch": 0.08, + "learning_rate": 4.971868941951575e-06, + "loss": 1.0854, + "step": 2535 + }, + { + "epoch": 0.08, + "learning_rate": 4.9718324413208415e-06, + "loss": 1.1924, + "step": 2536 + }, + { + "epoch": 0.08, + "learning_rate": 4.971795917159454e-06, + "loss": 1.1523, + "step": 2537 + }, + { + "epoch": 0.08, + "learning_rate": 4.971759369467759e-06, + "loss": 1.1993, + "step": 2538 + }, + { + "epoch": 0.08, + "learning_rate": 4.9717227982461055e-06, + "loss": 1.1239, + "step": 2539 + }, + { + "epoch": 0.08, + "learning_rate": 4.971686203494842e-06, + "loss": 1.2415, + "step": 2540 + }, + { + "epoch": 0.08, + "learning_rate": 4.971649585214315e-06, + "loss": 1.1077, + "step": 2541 + }, + { + "epoch": 0.08, + "learning_rate": 4.971612943404876e-06, + "loss": 1.2751, + "step": 2542 + }, + { + "epoch": 0.08, + "learning_rate": 4.971576278066871e-06, + "loss": 1.2079, + "step": 2543 + }, + { + "epoch": 0.08, + "learning_rate": 4.97153958920065e-06, + "loss": 1.0312, + "step": 2544 + }, + { + "epoch": 0.08, + "learning_rate": 4.971502876806563e-06, + "loss": 1.0806, + "step": 2545 + }, + { + "epoch": 0.08, + "learning_rate": 4.971466140884958e-06, + "loss": 1.1174, + "step": 2546 + }, + { + "epoch": 0.08, + "learning_rate": 4.9714293814361865e-06, + "loss": 1.2775, + "step": 2547 + }, + { + "epoch": 0.08, + "learning_rate": 4.971392598460598e-06, + "loss": 1.1641, + "step": 2548 + }, + { + "epoch": 0.08, + "learning_rate": 4.971355791958542e-06, + "loss": 1.2115, + "step": 2549 + }, + { + "epoch": 0.08, + "learning_rate": 4.971318961930368e-06, + "loss": 1.0908, + "step": 2550 + }, + { + "epoch": 0.08, + "learning_rate": 4.971282108376429e-06, + "loss": 1.1742, + "step": 2551 + }, + { + "epoch": 0.08, + "learning_rate": 4.971245231297074e-06, + "loss": 1.1703, + "step": 2552 + }, + { + "epoch": 0.08, + "learning_rate": 4.971208330692655e-06, + "loss": 1.1992, + "step": 2553 + }, + { + "epoch": 0.08, + "learning_rate": 4.971171406563522e-06, + "loss": 1.2034, + "step": 2554 + }, + { + "epoch": 0.08, + "learning_rate": 4.971134458910028e-06, + "loss": 1.2306, + "step": 2555 + }, + { + "epoch": 0.08, + "learning_rate": 4.971097487732524e-06, + "loss": 1.1556, + "step": 2556 + }, + { + "epoch": 0.08, + "learning_rate": 4.9710604930313625e-06, + "loss": 1.1992, + "step": 2557 + }, + { + "epoch": 0.08, + "learning_rate": 4.971023474806894e-06, + "loss": 1.1165, + "step": 2558 + }, + { + "epoch": 0.08, + "learning_rate": 4.970986433059473e-06, + "loss": 1.1194, + "step": 2559 + }, + { + "epoch": 0.08, + "learning_rate": 4.970949367789451e-06, + "loss": 1.0812, + "step": 2560 + }, + { + "epoch": 0.08, + "learning_rate": 4.9709122789971805e-06, + "loss": 1.1432, + "step": 2561 + }, + { + "epoch": 0.08, + "learning_rate": 4.970875166683017e-06, + "loss": 1.1439, + "step": 2562 + }, + { + "epoch": 0.08, + "learning_rate": 4.97083803084731e-06, + "loss": 1.0571, + "step": 2563 + }, + { + "epoch": 0.08, + "learning_rate": 4.970800871490415e-06, + "loss": 1.2118, + "step": 2564 + }, + { + "epoch": 0.08, + "learning_rate": 4.970763688612687e-06, + "loss": 1.1707, + "step": 2565 + }, + { + "epoch": 0.08, + "learning_rate": 4.970726482214478e-06, + "loss": 1.1771, + "step": 2566 + }, + { + "epoch": 0.08, + "learning_rate": 4.970689252296142e-06, + "loss": 1.3208, + "step": 2567 + }, + { + "epoch": 0.08, + "learning_rate": 4.970651998858036e-06, + "loss": 1.2413, + "step": 2568 + }, + { + "epoch": 0.08, + "learning_rate": 4.970614721900512e-06, + "loss": 1.0828, + "step": 2569 + }, + { + "epoch": 0.08, + "learning_rate": 4.970577421423925e-06, + "loss": 1.278, + "step": 2570 + }, + { + "epoch": 0.08, + "learning_rate": 4.970540097428632e-06, + "loss": 1.0607, + "step": 2571 + }, + { + "epoch": 0.08, + "learning_rate": 4.970502749914986e-06, + "loss": 1.1439, + "step": 2572 + }, + { + "epoch": 0.08, + "learning_rate": 4.970465378883345e-06, + "loss": 1.1781, + "step": 2573 + }, + { + "epoch": 0.08, + "learning_rate": 4.970427984334062e-06, + "loss": 1.1423, + "step": 2574 + }, + { + "epoch": 0.08, + "learning_rate": 4.970390566267495e-06, + "loss": 1.1765, + "step": 2575 + }, + { + "epoch": 0.08, + "learning_rate": 4.970353124684e-06, + "loss": 1.0581, + "step": 2576 + }, + { + "epoch": 0.08, + "learning_rate": 4.9703156595839325e-06, + "loss": 1.1124, + "step": 2577 + }, + { + "epoch": 0.08, + "learning_rate": 4.9702781709676495e-06, + "loss": 1.1677, + "step": 2578 + }, + { + "epoch": 0.08, + "learning_rate": 4.970240658835508e-06, + "loss": 1.1824, + "step": 2579 + }, + { + "epoch": 0.08, + "learning_rate": 4.970203123187866e-06, + "loss": 1.1627, + "step": 2580 + }, + { + "epoch": 0.08, + "learning_rate": 4.970165564025079e-06, + "loss": 1.1066, + "step": 2581 + }, + { + "epoch": 0.08, + "learning_rate": 4.970127981347507e-06, + "loss": 1.1246, + "step": 2582 + }, + { + "epoch": 0.08, + "learning_rate": 4.970090375155505e-06, + "loss": 1.1619, + "step": 2583 + }, + { + "epoch": 0.08, + "learning_rate": 4.9700527454494315e-06, + "loss": 1.0868, + "step": 2584 + }, + { + "epoch": 0.08, + "learning_rate": 4.970015092229647e-06, + "loss": 1.1823, + "step": 2585 + }, + { + "epoch": 0.08, + "learning_rate": 4.969977415496508e-06, + "loss": 1.1882, + "step": 2586 + }, + { + "epoch": 0.08, + "learning_rate": 4.9699397152503734e-06, + "loss": 1.1821, + "step": 2587 + }, + { + "epoch": 0.08, + "learning_rate": 4.9699019914916024e-06, + "loss": 1.1948, + "step": 2588 + }, + { + "epoch": 0.08, + "learning_rate": 4.969864244220554e-06, + "loss": 1.147, + "step": 2589 + }, + { + "epoch": 0.08, + "learning_rate": 4.9698264734375874e-06, + "loss": 1.139, + "step": 2590 + }, + { + "epoch": 0.08, + "learning_rate": 4.9697886791430625e-06, + "loss": 1.2021, + "step": 2591 + }, + { + "epoch": 0.08, + "learning_rate": 4.969750861337338e-06, + "loss": 1.224, + "step": 2592 + }, + { + "epoch": 0.08, + "learning_rate": 4.9697130200207754e-06, + "loss": 1.1225, + "step": 2593 + }, + { + "epoch": 0.08, + "learning_rate": 4.969675155193735e-06, + "loss": 1.1502, + "step": 2594 + }, + { + "epoch": 0.08, + "learning_rate": 4.969637266856576e-06, + "loss": 1.1721, + "step": 2595 + }, + { + "epoch": 0.08, + "learning_rate": 4.96959935500966e-06, + "loss": 1.1217, + "step": 2596 + }, + { + "epoch": 0.08, + "learning_rate": 4.969561419653347e-06, + "loss": 1.0771, + "step": 2597 + }, + { + "epoch": 0.08, + "learning_rate": 4.9695234607879986e-06, + "loss": 1.1263, + "step": 2598 + }, + { + "epoch": 0.08, + "learning_rate": 4.969485478413976e-06, + "loss": 1.2081, + "step": 2599 + }, + { + "epoch": 0.08, + "learning_rate": 4.969447472531641e-06, + "loss": 1.0327, + "step": 2600 + }, + { + "epoch": 0.08, + "learning_rate": 4.969409443141356e-06, + "loss": 1.2365, + "step": 2601 + }, + { + "epoch": 0.08, + "learning_rate": 4.969371390243483e-06, + "loss": 1.0519, + "step": 2602 + }, + { + "epoch": 0.08, + "learning_rate": 4.969333313838382e-06, + "loss": 1.2091, + "step": 2603 + }, + { + "epoch": 0.08, + "learning_rate": 4.969295213926418e-06, + "loss": 1.1888, + "step": 2604 + }, + { + "epoch": 0.08, + "learning_rate": 4.969257090507953e-06, + "loss": 1.1405, + "step": 2605 + }, + { + "epoch": 0.08, + "learning_rate": 4.9692189435833495e-06, + "loss": 1.1331, + "step": 2606 + }, + { + "epoch": 0.08, + "learning_rate": 4.969180773152971e-06, + "loss": 1.0916, + "step": 2607 + }, + { + "epoch": 0.08, + "learning_rate": 4.96914257921718e-06, + "loss": 1.2206, + "step": 2608 + }, + { + "epoch": 0.08, + "learning_rate": 4.969104361776342e-06, + "loss": 1.113, + "step": 2609 + }, + { + "epoch": 0.08, + "learning_rate": 4.9690661208308185e-06, + "loss": 1.0297, + "step": 2610 + }, + { + "epoch": 0.08, + "learning_rate": 4.9690278563809755e-06, + "loss": 1.1425, + "step": 2611 + }, + { + "epoch": 0.08, + "learning_rate": 4.968989568427176e-06, + "loss": 1.1799, + "step": 2612 + }, + { + "epoch": 0.08, + "learning_rate": 4.968951256969785e-06, + "loss": 1.151, + "step": 2613 + }, + { + "epoch": 0.08, + "learning_rate": 4.9689129220091675e-06, + "loss": 1.1987, + "step": 2614 + }, + { + "epoch": 0.08, + "learning_rate": 4.968874563545688e-06, + "loss": 1.1485, + "step": 2615 + }, + { + "epoch": 0.08, + "learning_rate": 4.9688361815797115e-06, + "loss": 1.222, + "step": 2616 + }, + { + "epoch": 0.08, + "learning_rate": 4.9687977761116035e-06, + "loss": 1.1161, + "step": 2617 + }, + { + "epoch": 0.08, + "learning_rate": 4.9687593471417296e-06, + "loss": 1.1352, + "step": 2618 + }, + { + "epoch": 0.08, + "learning_rate": 4.9687208946704555e-06, + "loss": 1.2532, + "step": 2619 + }, + { + "epoch": 0.08, + "learning_rate": 4.968682418698148e-06, + "loss": 1.236, + "step": 2620 + }, + { + "epoch": 0.08, + "learning_rate": 4.968643919225173e-06, + "loss": 1.0186, + "step": 2621 + }, + { + "epoch": 0.08, + "learning_rate": 4.968605396251896e-06, + "loss": 1.0884, + "step": 2622 + }, + { + "epoch": 0.08, + "learning_rate": 4.9685668497786855e-06, + "loss": 1.2299, + "step": 2623 + }, + { + "epoch": 0.08, + "learning_rate": 4.968528279805907e-06, + "loss": 1.1835, + "step": 2624 + }, + { + "epoch": 0.08, + "learning_rate": 4.968489686333928e-06, + "loss": 1.103, + "step": 2625 + }, + { + "epoch": 0.08, + "learning_rate": 4.9684510693631165e-06, + "loss": 1.0466, + "step": 2626 + }, + { + "epoch": 0.08, + "learning_rate": 4.9684124288938395e-06, + "loss": 1.2383, + "step": 2627 + }, + { + "epoch": 0.08, + "learning_rate": 4.968373764926465e-06, + "loss": 1.0576, + "step": 2628 + }, + { + "epoch": 0.08, + "learning_rate": 4.968335077461361e-06, + "loss": 1.0831, + "step": 2629 + }, + { + "epoch": 0.08, + "learning_rate": 4.968296366498896e-06, + "loss": 1.1729, + "step": 2630 + }, + { + "epoch": 0.08, + "learning_rate": 4.968257632039438e-06, + "loss": 1.1721, + "step": 2631 + }, + { + "epoch": 0.08, + "learning_rate": 4.968218874083356e-06, + "loss": 1.0349, + "step": 2632 + }, + { + "epoch": 0.08, + "learning_rate": 4.9681800926310196e-06, + "loss": 1.1046, + "step": 2633 + }, + { + "epoch": 0.08, + "learning_rate": 4.968141287682797e-06, + "loss": 1.1819, + "step": 2634 + }, + { + "epoch": 0.08, + "learning_rate": 4.968102459239058e-06, + "loss": 1.0283, + "step": 2635 + }, + { + "epoch": 0.08, + "learning_rate": 4.968063607300173e-06, + "loss": 1.2427, + "step": 2636 + }, + { + "epoch": 0.08, + "learning_rate": 4.96802473186651e-06, + "loss": 1.1804, + "step": 2637 + }, + { + "epoch": 0.08, + "learning_rate": 4.967985832938441e-06, + "loss": 1.2158, + "step": 2638 + }, + { + "epoch": 0.08, + "learning_rate": 4.967946910516336e-06, + "loss": 1.2183, + "step": 2639 + }, + { + "epoch": 0.08, + "learning_rate": 4.967907964600563e-06, + "loss": 1.1858, + "step": 2640 + }, + { + "epoch": 0.08, + "learning_rate": 4.967868995191497e-06, + "loss": 1.1481, + "step": 2641 + }, + { + "epoch": 0.08, + "learning_rate": 4.967830002289505e-06, + "loss": 1.0664, + "step": 2642 + }, + { + "epoch": 0.08, + "learning_rate": 4.967790985894961e-06, + "loss": 1.2611, + "step": 2643 + }, + { + "epoch": 0.08, + "learning_rate": 4.967751946008235e-06, + "loss": 1.1627, + "step": 2644 + }, + { + "epoch": 0.08, + "learning_rate": 4.967712882629699e-06, + "loss": 1.1399, + "step": 2645 + }, + { + "epoch": 0.08, + "learning_rate": 4.967673795759726e-06, + "loss": 1.2074, + "step": 2646 + }, + { + "epoch": 0.08, + "learning_rate": 4.967634685398685e-06, + "loss": 1.2109, + "step": 2647 + }, + { + "epoch": 0.08, + "learning_rate": 4.967595551546951e-06, + "loss": 1.2366, + "step": 2648 + }, + { + "epoch": 0.08, + "learning_rate": 4.967556394204896e-06, + "loss": 1.1979, + "step": 2649 + }, + { + "epoch": 0.08, + "learning_rate": 4.967517213372892e-06, + "loss": 1.1648, + "step": 2650 + }, + { + "epoch": 0.08, + "learning_rate": 4.967478009051313e-06, + "loss": 1.1372, + "step": 2651 + }, + { + "epoch": 0.08, + "learning_rate": 4.967438781240532e-06, + "loss": 1.1874, + "step": 2652 + }, + { + "epoch": 0.08, + "learning_rate": 4.967399529940922e-06, + "loss": 1.0513, + "step": 2653 + }, + { + "epoch": 0.08, + "learning_rate": 4.967360255152857e-06, + "loss": 1.0471, + "step": 2654 + }, + { + "epoch": 0.08, + "learning_rate": 4.96732095687671e-06, + "loss": 1.2137, + "step": 2655 + }, + { + "epoch": 0.08, + "learning_rate": 4.967281635112856e-06, + "loss": 1.2463, + "step": 2656 + }, + { + "epoch": 0.08, + "learning_rate": 4.967242289861669e-06, + "loss": 1.2393, + "step": 2657 + }, + { + "epoch": 0.08, + "learning_rate": 4.967202921123524e-06, + "loss": 1.1414, + "step": 2658 + }, + { + "epoch": 0.08, + "learning_rate": 4.9671635288987955e-06, + "loss": 1.1206, + "step": 2659 + }, + { + "epoch": 0.08, + "learning_rate": 4.9671241131878575e-06, + "loss": 1.178, + "step": 2660 + }, + { + "epoch": 0.08, + "learning_rate": 4.967084673991088e-06, + "loss": 1.1614, + "step": 2661 + }, + { + "epoch": 0.08, + "learning_rate": 4.967045211308859e-06, + "loss": 1.2672, + "step": 2662 + }, + { + "epoch": 0.08, + "learning_rate": 4.967005725141548e-06, + "loss": 1.1768, + "step": 2663 + }, + { + "epoch": 0.08, + "learning_rate": 4.966966215489532e-06, + "loss": 1.1965, + "step": 2664 + }, + { + "epoch": 0.08, + "learning_rate": 4.966926682353184e-06, + "loss": 1.065, + "step": 2665 + }, + { + "epoch": 0.08, + "learning_rate": 4.966887125732883e-06, + "loss": 1.2606, + "step": 2666 + }, + { + "epoch": 0.08, + "learning_rate": 4.9668475456290046e-06, + "loss": 1.2399, + "step": 2667 + }, + { + "epoch": 0.08, + "learning_rate": 4.966807942041925e-06, + "loss": 1.0883, + "step": 2668 + }, + { + "epoch": 0.08, + "learning_rate": 4.9667683149720225e-06, + "loss": 1.2025, + "step": 2669 + }, + { + "epoch": 0.08, + "learning_rate": 4.9667286644196735e-06, + "loss": 1.1801, + "step": 2670 + }, + { + "epoch": 0.08, + "learning_rate": 4.9666889903852555e-06, + "loss": 1.2102, + "step": 2671 + }, + { + "epoch": 0.08, + "learning_rate": 4.966649292869147e-06, + "loss": 1.1164, + "step": 2672 + }, + { + "epoch": 0.08, + "learning_rate": 4.966609571871724e-06, + "loss": 1.1183, + "step": 2673 + }, + { + "epoch": 0.08, + "learning_rate": 4.966569827393367e-06, + "loss": 1.1655, + "step": 2674 + }, + { + "epoch": 0.08, + "learning_rate": 4.966530059434452e-06, + "loss": 1.0982, + "step": 2675 + }, + { + "epoch": 0.08, + "learning_rate": 4.96649026799536e-06, + "loss": 1.0613, + "step": 2676 + }, + { + "epoch": 0.08, + "learning_rate": 4.966450453076468e-06, + "loss": 1.2664, + "step": 2677 + }, + { + "epoch": 0.08, + "learning_rate": 4.966410614678155e-06, + "loss": 1.0391, + "step": 2678 + }, + { + "epoch": 0.08, + "learning_rate": 4.966370752800802e-06, + "loss": 1.1491, + "step": 2679 + }, + { + "epoch": 0.08, + "learning_rate": 4.966330867444786e-06, + "loss": 1.1532, + "step": 2680 + }, + { + "epoch": 0.08, + "learning_rate": 4.966290958610489e-06, + "loss": 1.1063, + "step": 2681 + }, + { + "epoch": 0.08, + "learning_rate": 4.96625102629829e-06, + "loss": 1.1137, + "step": 2682 + }, + { + "epoch": 0.08, + "learning_rate": 4.9662110705085684e-06, + "loss": 1.1227, + "step": 2683 + }, + { + "epoch": 0.08, + "learning_rate": 4.966171091241705e-06, + "loss": 1.1021, + "step": 2684 + }, + { + "epoch": 0.08, + "learning_rate": 4.966131088498081e-06, + "loss": 1.2235, + "step": 2685 + }, + { + "epoch": 0.08, + "learning_rate": 4.9660910622780764e-06, + "loss": 1.1677, + "step": 2686 + }, + { + "epoch": 0.08, + "learning_rate": 4.966051012582073e-06, + "loss": 1.1419, + "step": 2687 + }, + { + "epoch": 0.08, + "learning_rate": 4.966010939410451e-06, + "loss": 1.1201, + "step": 2688 + }, + { + "epoch": 0.08, + "learning_rate": 4.965970842763594e-06, + "loss": 1.1387, + "step": 2689 + }, + { + "epoch": 0.08, + "learning_rate": 4.96593072264188e-06, + "loss": 1.1815, + "step": 2690 + }, + { + "epoch": 0.08, + "learning_rate": 4.965890579045695e-06, + "loss": 1.1275, + "step": 2691 + }, + { + "epoch": 0.08, + "learning_rate": 4.9658504119754185e-06, + "loss": 1.157, + "step": 2692 + }, + { + "epoch": 0.08, + "learning_rate": 4.965810221431434e-06, + "loss": 1.1127, + "step": 2693 + }, + { + "epoch": 0.08, + "learning_rate": 4.965770007414124e-06, + "loss": 1.1695, + "step": 2694 + }, + { + "epoch": 0.08, + "learning_rate": 4.96572976992387e-06, + "loss": 1.0901, + "step": 2695 + }, + { + "epoch": 0.08, + "learning_rate": 4.9656895089610565e-06, + "loss": 1.1124, + "step": 2696 + }, + { + "epoch": 0.08, + "learning_rate": 4.965649224526067e-06, + "loss": 1.2206, + "step": 2697 + }, + { + "epoch": 0.08, + "learning_rate": 4.9656089166192845e-06, + "loss": 1.2491, + "step": 2698 + }, + { + "epoch": 0.08, + "learning_rate": 4.965568585241092e-06, + "loss": 1.1542, + "step": 2699 + }, + { + "epoch": 0.08, + "learning_rate": 4.965528230391874e-06, + "loss": 1.116, + "step": 2700 + }, + { + "epoch": 0.08, + "learning_rate": 4.965487852072015e-06, + "loss": 1.0494, + "step": 2701 + }, + { + "epoch": 0.08, + "learning_rate": 4.965447450281899e-06, + "loss": 1.0958, + "step": 2702 + }, + { + "epoch": 0.08, + "learning_rate": 4.965407025021911e-06, + "loss": 1.1385, + "step": 2703 + }, + { + "epoch": 0.08, + "learning_rate": 4.965366576292435e-06, + "loss": 1.2639, + "step": 2704 + }, + { + "epoch": 0.08, + "learning_rate": 4.965326104093857e-06, + "loss": 1.1647, + "step": 2705 + }, + { + "epoch": 0.08, + "learning_rate": 4.965285608426561e-06, + "loss": 1.0934, + "step": 2706 + }, + { + "epoch": 0.08, + "learning_rate": 4.9652450892909345e-06, + "loss": 1.1693, + "step": 2707 + }, + { + "epoch": 0.08, + "learning_rate": 4.965204546687361e-06, + "loss": 1.1772, + "step": 2708 + }, + { + "epoch": 0.08, + "learning_rate": 4.965163980616228e-06, + "loss": 1.1815, + "step": 2709 + }, + { + "epoch": 0.08, + "learning_rate": 4.965123391077921e-06, + "loss": 1.1492, + "step": 2710 + }, + { + "epoch": 0.08, + "learning_rate": 4.965082778072826e-06, + "loss": 1.0486, + "step": 2711 + }, + { + "epoch": 0.08, + "learning_rate": 4.965042141601332e-06, + "loss": 1.1584, + "step": 2712 + }, + { + "epoch": 0.08, + "learning_rate": 4.965001481663823e-06, + "loss": 1.1807, + "step": 2713 + }, + { + "epoch": 0.08, + "learning_rate": 4.9649607982606865e-06, + "loss": 1.1685, + "step": 2714 + }, + { + "epoch": 0.08, + "learning_rate": 4.96492009139231e-06, + "loss": 1.0996, + "step": 2715 + }, + { + "epoch": 0.08, + "learning_rate": 4.964879361059083e-06, + "loss": 1.1992, + "step": 2716 + }, + { + "epoch": 0.08, + "learning_rate": 4.96483860726139e-06, + "loss": 1.0641, + "step": 2717 + }, + { + "epoch": 0.08, + "learning_rate": 4.964797829999622e-06, + "loss": 1.3025, + "step": 2718 + }, + { + "epoch": 0.08, + "learning_rate": 4.964757029274164e-06, + "loss": 1.0355, + "step": 2719 + }, + { + "epoch": 0.08, + "learning_rate": 4.964716205085408e-06, + "loss": 1.1327, + "step": 2720 + }, + { + "epoch": 0.08, + "learning_rate": 4.9646753574337405e-06, + "loss": 1.1056, + "step": 2721 + }, + { + "epoch": 0.08, + "learning_rate": 4.96463448631955e-06, + "loss": 1.1147, + "step": 2722 + }, + { + "epoch": 0.08, + "learning_rate": 4.9645935917432265e-06, + "loss": 1.2156, + "step": 2723 + }, + { + "epoch": 0.08, + "learning_rate": 4.964552673705159e-06, + "loss": 1.1366, + "step": 2724 + }, + { + "epoch": 0.08, + "learning_rate": 4.964511732205736e-06, + "loss": 1.1793, + "step": 2725 + }, + { + "epoch": 0.08, + "learning_rate": 4.96447076724535e-06, + "loss": 1.171, + "step": 2726 + }, + { + "epoch": 0.08, + "learning_rate": 4.964429778824388e-06, + "loss": 1.1721, + "step": 2727 + }, + { + "epoch": 0.08, + "learning_rate": 4.964388766943241e-06, + "loss": 1.0599, + "step": 2728 + }, + { + "epoch": 0.08, + "learning_rate": 4.964347731602301e-06, + "loss": 1.1729, + "step": 2729 + }, + { + "epoch": 0.08, + "learning_rate": 4.964306672801957e-06, + "loss": 1.1495, + "step": 2730 + }, + { + "epoch": 0.08, + "learning_rate": 4.964265590542601e-06, + "loss": 1.2222, + "step": 2731 + }, + { + "epoch": 0.08, + "learning_rate": 4.964224484824622e-06, + "loss": 1.1937, + "step": 2732 + }, + { + "epoch": 0.08, + "learning_rate": 4.964183355648414e-06, + "loss": 1.1004, + "step": 2733 + }, + { + "epoch": 0.08, + "learning_rate": 4.964142203014366e-06, + "loss": 1.126, + "step": 2734 + }, + { + "epoch": 0.08, + "learning_rate": 4.964101026922872e-06, + "loss": 1.1624, + "step": 2735 + }, + { + "epoch": 0.08, + "learning_rate": 4.964059827374323e-06, + "loss": 1.1232, + "step": 2736 + }, + { + "epoch": 0.08, + "learning_rate": 4.964018604369111e-06, + "loss": 1.1885, + "step": 2737 + }, + { + "epoch": 0.08, + "learning_rate": 4.963977357907628e-06, + "loss": 1.097, + "step": 2738 + }, + { + "epoch": 0.08, + "learning_rate": 4.963936087990267e-06, + "loss": 1.1998, + "step": 2739 + }, + { + "epoch": 0.08, + "learning_rate": 4.963894794617422e-06, + "loss": 1.1417, + "step": 2740 + }, + { + "epoch": 0.08, + "learning_rate": 4.963853477789486e-06, + "loss": 1.097, + "step": 2741 + }, + { + "epoch": 0.08, + "learning_rate": 4.96381213750685e-06, + "loss": 1.2522, + "step": 2742 + }, + { + "epoch": 0.08, + "learning_rate": 4.96377077376991e-06, + "loss": 1.2993, + "step": 2743 + }, + { + "epoch": 0.08, + "learning_rate": 4.963729386579058e-06, + "loss": 1.0817, + "step": 2744 + }, + { + "epoch": 0.08, + "learning_rate": 4.96368797593469e-06, + "loss": 1.0551, + "step": 2745 + }, + { + "epoch": 0.08, + "learning_rate": 4.9636465418371984e-06, + "loss": 1.1349, + "step": 2746 + }, + { + "epoch": 0.08, + "learning_rate": 4.963605084286978e-06, + "loss": 1.0811, + "step": 2747 + }, + { + "epoch": 0.08, + "learning_rate": 4.963563603284424e-06, + "loss": 1.1995, + "step": 2748 + }, + { + "epoch": 0.08, + "learning_rate": 4.963522098829931e-06, + "loss": 1.1502, + "step": 2749 + }, + { + "epoch": 0.08, + "learning_rate": 4.963480570923893e-06, + "loss": 1.243, + "step": 2750 + }, + { + "epoch": 0.08, + "learning_rate": 4.963439019566708e-06, + "loss": 1.1171, + "step": 2751 + }, + { + "epoch": 0.08, + "learning_rate": 4.963397444758769e-06, + "loss": 1.0053, + "step": 2752 + }, + { + "epoch": 0.08, + "learning_rate": 4.9633558465004736e-06, + "loss": 1.176, + "step": 2753 + }, + { + "epoch": 0.08, + "learning_rate": 4.963314224792216e-06, + "loss": 1.1128, + "step": 2754 + }, + { + "epoch": 0.08, + "learning_rate": 4.963272579634394e-06, + "loss": 1.1052, + "step": 2755 + }, + { + "epoch": 0.08, + "learning_rate": 4.9632309110274026e-06, + "loss": 1.2751, + "step": 2756 + }, + { + "epoch": 0.08, + "learning_rate": 4.96318921897164e-06, + "loss": 1.1329, + "step": 2757 + }, + { + "epoch": 0.08, + "learning_rate": 4.963147503467503e-06, + "loss": 1.2058, + "step": 2758 + }, + { + "epoch": 0.08, + "learning_rate": 4.963105764515387e-06, + "loss": 1.1125, + "step": 2759 + }, + { + "epoch": 0.08, + "learning_rate": 4.96306400211569e-06, + "loss": 1.2148, + "step": 2760 + }, + { + "epoch": 0.08, + "learning_rate": 4.963022216268811e-06, + "loss": 1.1965, + "step": 2761 + }, + { + "epoch": 0.08, + "learning_rate": 4.962980406975147e-06, + "loss": 1.1906, + "step": 2762 + }, + { + "epoch": 0.08, + "learning_rate": 4.962938574235095e-06, + "loss": 1.1367, + "step": 2763 + }, + { + "epoch": 0.08, + "learning_rate": 4.962896718049053e-06, + "loss": 1.1877, + "step": 2764 + }, + { + "epoch": 0.08, + "learning_rate": 4.9628548384174215e-06, + "loss": 1.144, + "step": 2765 + }, + { + "epoch": 0.08, + "learning_rate": 4.962812935340598e-06, + "loss": 1.1688, + "step": 2766 + }, + { + "epoch": 0.08, + "learning_rate": 4.962771008818982e-06, + "loss": 1.1544, + "step": 2767 + }, + { + "epoch": 0.08, + "learning_rate": 4.962729058852971e-06, + "loss": 1.214, + "step": 2768 + }, + { + "epoch": 0.08, + "learning_rate": 4.9626870854429665e-06, + "loss": 1.3304, + "step": 2769 + }, + { + "epoch": 0.08, + "learning_rate": 4.962645088589366e-06, + "loss": 1.1343, + "step": 2770 + }, + { + "epoch": 0.08, + "learning_rate": 4.9626030682925705e-06, + "loss": 1.2582, + "step": 2771 + }, + { + "epoch": 0.08, + "learning_rate": 4.962561024552981e-06, + "loss": 1.0654, + "step": 2772 + }, + { + "epoch": 0.08, + "learning_rate": 4.962518957370995e-06, + "loss": 1.2671, + "step": 2773 + }, + { + "epoch": 0.08, + "learning_rate": 4.962476866747015e-06, + "loss": 1.2588, + "step": 2774 + }, + { + "epoch": 0.08, + "learning_rate": 4.962434752681442e-06, + "loss": 1.2294, + "step": 2775 + }, + { + "epoch": 0.08, + "learning_rate": 4.962392615174676e-06, + "loss": 1.1812, + "step": 2776 + }, + { + "epoch": 0.08, + "learning_rate": 4.962350454227118e-06, + "loss": 1.2864, + "step": 2777 + }, + { + "epoch": 0.08, + "learning_rate": 4.962308269839169e-06, + "loss": 1.1523, + "step": 2778 + }, + { + "epoch": 0.08, + "learning_rate": 4.9622660620112315e-06, + "loss": 1.0493, + "step": 2779 + }, + { + "epoch": 0.08, + "learning_rate": 4.962223830743707e-06, + "loss": 1.1545, + "step": 2780 + }, + { + "epoch": 0.08, + "learning_rate": 4.962181576036997e-06, + "loss": 1.1458, + "step": 2781 + }, + { + "epoch": 0.08, + "learning_rate": 4.962139297891505e-06, + "loss": 1.1403, + "step": 2782 + }, + { + "epoch": 0.08, + "learning_rate": 4.962096996307633e-06, + "loss": 1.1707, + "step": 2783 + }, + { + "epoch": 0.08, + "learning_rate": 4.962054671285782e-06, + "loss": 1.0922, + "step": 2784 + }, + { + "epoch": 0.08, + "learning_rate": 4.962012322826357e-06, + "loss": 1.1339, + "step": 2785 + }, + { + "epoch": 0.08, + "learning_rate": 4.961969950929761e-06, + "loss": 1.0613, + "step": 2786 + }, + { + "epoch": 0.08, + "learning_rate": 4.961927555596397e-06, + "loss": 1.1302, + "step": 2787 + }, + { + "epoch": 0.08, + "learning_rate": 4.961885136826667e-06, + "loss": 1.2122, + "step": 2788 + }, + { + "epoch": 0.08, + "learning_rate": 4.9618426946209765e-06, + "loss": 1.1237, + "step": 2789 + }, + { + "epoch": 0.08, + "learning_rate": 4.961800228979729e-06, + "loss": 1.1555, + "step": 2790 + }, + { + "epoch": 0.08, + "learning_rate": 4.96175773990333e-06, + "loss": 1.1367, + "step": 2791 + }, + { + "epoch": 0.08, + "learning_rate": 4.961715227392183e-06, + "loss": 1.1972, + "step": 2792 + }, + { + "epoch": 0.08, + "learning_rate": 4.961672691446692e-06, + "loss": 1.1879, + "step": 2793 + }, + { + "epoch": 0.08, + "learning_rate": 4.9616301320672626e-06, + "loss": 1.2675, + "step": 2794 + }, + { + "epoch": 0.08, + "learning_rate": 4.9615875492543e-06, + "loss": 1.1414, + "step": 2795 + }, + { + "epoch": 0.08, + "learning_rate": 4.961544943008209e-06, + "loss": 1.1978, + "step": 2796 + }, + { + "epoch": 0.08, + "learning_rate": 4.961502313329397e-06, + "loss": 1.2128, + "step": 2797 + }, + { + "epoch": 0.08, + "learning_rate": 4.961459660218267e-06, + "loss": 1.2065, + "step": 2798 + }, + { + "epoch": 0.08, + "learning_rate": 4.9614169836752275e-06, + "loss": 1.1356, + "step": 2799 + }, + { + "epoch": 0.08, + "learning_rate": 4.961374283700683e-06, + "loss": 1.2502, + "step": 2800 + }, + { + "epoch": 0.08, + "learning_rate": 4.9613315602950414e-06, + "loss": 1.161, + "step": 2801 + }, + { + "epoch": 0.08, + "learning_rate": 4.961288813458708e-06, + "loss": 1.176, + "step": 2802 + }, + { + "epoch": 0.08, + "learning_rate": 4.961246043192091e-06, + "loss": 1.0763, + "step": 2803 + }, + { + "epoch": 0.08, + "learning_rate": 4.9612032494955976e-06, + "loss": 1.2213, + "step": 2804 + }, + { + "epoch": 0.08, + "learning_rate": 4.961160432369634e-06, + "loss": 1.2661, + "step": 2805 + }, + { + "epoch": 0.08, + "learning_rate": 4.961117591814608e-06, + "loss": 1.1155, + "step": 2806 + }, + { + "epoch": 0.08, + "learning_rate": 4.961074727830929e-06, + "loss": 1.2029, + "step": 2807 + }, + { + "epoch": 0.08, + "learning_rate": 4.9610318404190025e-06, + "loss": 1.1664, + "step": 2808 + }, + { + "epoch": 0.08, + "learning_rate": 4.960988929579239e-06, + "loss": 1.1469, + "step": 2809 + }, + { + "epoch": 0.08, + "learning_rate": 4.960945995312046e-06, + "loss": 1.1771, + "step": 2810 + }, + { + "epoch": 0.08, + "learning_rate": 4.960903037617833e-06, + "loss": 1.1181, + "step": 2811 + }, + { + "epoch": 0.08, + "learning_rate": 4.960860056497007e-06, + "loss": 1.1193, + "step": 2812 + }, + { + "epoch": 0.08, + "learning_rate": 4.960817051949979e-06, + "loss": 1.114, + "step": 2813 + }, + { + "epoch": 0.08, + "learning_rate": 4.960774023977159e-06, + "loss": 1.1881, + "step": 2814 + }, + { + "epoch": 0.08, + "learning_rate": 4.960730972578954e-06, + "loss": 1.1499, + "step": 2815 + }, + { + "epoch": 0.08, + "learning_rate": 4.9606878977557756e-06, + "loss": 1.172, + "step": 2816 + }, + { + "epoch": 0.08, + "learning_rate": 4.960644799508033e-06, + "loss": 1.1717, + "step": 2817 + }, + { + "epoch": 0.08, + "learning_rate": 4.960601677836138e-06, + "loss": 1.0978, + "step": 2818 + }, + { + "epoch": 0.08, + "learning_rate": 4.960558532740499e-06, + "loss": 1.2255, + "step": 2819 + }, + { + "epoch": 0.08, + "learning_rate": 4.960515364221528e-06, + "loss": 1.1669, + "step": 2820 + }, + { + "epoch": 0.08, + "learning_rate": 4.960472172279637e-06, + "loss": 1.1379, + "step": 2821 + }, + { + "epoch": 0.09, + "learning_rate": 4.960428956915236e-06, + "loss": 1.0958, + "step": 2822 + }, + { + "epoch": 0.09, + "learning_rate": 4.9603857181287355e-06, + "loss": 1.1822, + "step": 2823 + }, + { + "epoch": 0.09, + "learning_rate": 4.960342455920547e-06, + "loss": 1.152, + "step": 2824 + }, + { + "epoch": 0.09, + "learning_rate": 4.9602991702910845e-06, + "loss": 1.2315, + "step": 2825 + }, + { + "epoch": 0.09, + "learning_rate": 4.960255861240758e-06, + "loss": 1.2033, + "step": 2826 + }, + { + "epoch": 0.09, + "learning_rate": 4.960212528769982e-06, + "loss": 1.1248, + "step": 2827 + }, + { + "epoch": 0.09, + "learning_rate": 4.960169172879166e-06, + "loss": 1.132, + "step": 2828 + }, + { + "epoch": 0.09, + "learning_rate": 4.960125793568725e-06, + "loss": 1.199, + "step": 2829 + }, + { + "epoch": 0.09, + "learning_rate": 4.960082390839072e-06, + "loss": 1.0803, + "step": 2830 + }, + { + "epoch": 0.09, + "learning_rate": 4.960038964690618e-06, + "loss": 1.2107, + "step": 2831 + }, + { + "epoch": 0.09, + "learning_rate": 4.9599955151237785e-06, + "loss": 1.25, + "step": 2832 + }, + { + "epoch": 0.09, + "learning_rate": 4.959952042138967e-06, + "loss": 1.2112, + "step": 2833 + }, + { + "epoch": 0.09, + "learning_rate": 4.959908545736596e-06, + "loss": 1.2318, + "step": 2834 + }, + { + "epoch": 0.09, + "learning_rate": 4.959865025917081e-06, + "loss": 1.0996, + "step": 2835 + }, + { + "epoch": 0.09, + "learning_rate": 4.959821482680836e-06, + "loss": 1.2566, + "step": 2836 + }, + { + "epoch": 0.09, + "learning_rate": 4.959777916028274e-06, + "loss": 1.1031, + "step": 2837 + }, + { + "epoch": 0.09, + "learning_rate": 4.959734325959812e-06, + "loss": 1.1603, + "step": 2838 + }, + { + "epoch": 0.09, + "learning_rate": 4.9596907124758634e-06, + "loss": 1.1903, + "step": 2839 + }, + { + "epoch": 0.09, + "learning_rate": 4.9596470755768435e-06, + "loss": 1.1596, + "step": 2840 + }, + { + "epoch": 0.09, + "learning_rate": 4.959603415263168e-06, + "loss": 1.1747, + "step": 2841 + }, + { + "epoch": 0.09, + "learning_rate": 4.9595597315352525e-06, + "loss": 1.2148, + "step": 2842 + }, + { + "epoch": 0.09, + "learning_rate": 4.959516024393514e-06, + "loss": 1.0595, + "step": 2843 + }, + { + "epoch": 0.09, + "learning_rate": 4.959472293838367e-06, + "loss": 1.1208, + "step": 2844 + }, + { + "epoch": 0.09, + "learning_rate": 4.959428539870228e-06, + "loss": 1.1919, + "step": 2845 + }, + { + "epoch": 0.09, + "learning_rate": 4.959384762489514e-06, + "loss": 1.118, + "step": 2846 + }, + { + "epoch": 0.09, + "learning_rate": 4.959340961696641e-06, + "loss": 1.0518, + "step": 2847 + }, + { + "epoch": 0.09, + "learning_rate": 4.959297137492027e-06, + "loss": 1.1677, + "step": 2848 + }, + { + "epoch": 0.09, + "learning_rate": 4.959253289876089e-06, + "loss": 1.2476, + "step": 2849 + }, + { + "epoch": 0.09, + "learning_rate": 4.959209418849244e-06, + "loss": 1.1789, + "step": 2850 + }, + { + "epoch": 0.09, + "learning_rate": 4.959165524411909e-06, + "loss": 1.1125, + "step": 2851 + }, + { + "epoch": 0.09, + "learning_rate": 4.959121606564503e-06, + "loss": 1.1019, + "step": 2852 + }, + { + "epoch": 0.09, + "learning_rate": 4.9590776653074444e-06, + "loss": 1.1956, + "step": 2853 + }, + { + "epoch": 0.09, + "learning_rate": 4.95903370064115e-06, + "loss": 1.1256, + "step": 2854 + }, + { + "epoch": 0.09, + "learning_rate": 4.958989712566039e-06, + "loss": 1.095, + "step": 2855 + }, + { + "epoch": 0.09, + "learning_rate": 4.95894570108253e-06, + "loss": 1.201, + "step": 2856 + }, + { + "epoch": 0.09, + "learning_rate": 4.958901666191042e-06, + "loss": 1.1095, + "step": 2857 + }, + { + "epoch": 0.09, + "learning_rate": 4.958857607891996e-06, + "loss": 1.2328, + "step": 2858 + }, + { + "epoch": 0.09, + "learning_rate": 4.9588135261858085e-06, + "loss": 1.1558, + "step": 2859 + }, + { + "epoch": 0.09, + "learning_rate": 4.9587694210729005e-06, + "loss": 1.2471, + "step": 2860 + }, + { + "epoch": 0.09, + "learning_rate": 4.958725292553693e-06, + "loss": 1.2534, + "step": 2861 + }, + { + "epoch": 0.09, + "learning_rate": 4.958681140628604e-06, + "loss": 1.2735, + "step": 2862 + }, + { + "epoch": 0.09, + "learning_rate": 4.9586369652980535e-06, + "loss": 1.1358, + "step": 2863 + }, + { + "epoch": 0.09, + "learning_rate": 4.958592766562464e-06, + "loss": 1.1526, + "step": 2864 + }, + { + "epoch": 0.09, + "learning_rate": 4.958548544422257e-06, + "loss": 1.126, + "step": 2865 + }, + { + "epoch": 0.09, + "learning_rate": 4.958504298877851e-06, + "loss": 1.2223, + "step": 2866 + }, + { + "epoch": 0.09, + "learning_rate": 4.958460029929667e-06, + "loss": 1.0379, + "step": 2867 + }, + { + "epoch": 0.09, + "learning_rate": 4.958415737578128e-06, + "loss": 1.1637, + "step": 2868 + }, + { + "epoch": 0.09, + "learning_rate": 4.958371421823656e-06, + "loss": 1.2047, + "step": 2869 + }, + { + "epoch": 0.09, + "learning_rate": 4.958327082666672e-06, + "loss": 1.1865, + "step": 2870 + }, + { + "epoch": 0.09, + "learning_rate": 4.958282720107598e-06, + "loss": 1.1909, + "step": 2871 + }, + { + "epoch": 0.09, + "learning_rate": 4.958238334146856e-06, + "loss": 1.0002, + "step": 2872 + }, + { + "epoch": 0.09, + "learning_rate": 4.958193924784869e-06, + "loss": 1.1626, + "step": 2873 + }, + { + "epoch": 0.09, + "learning_rate": 4.95814949202206e-06, + "loss": 1.1014, + "step": 2874 + }, + { + "epoch": 0.09, + "learning_rate": 4.958105035858851e-06, + "loss": 1.1494, + "step": 2875 + }, + { + "epoch": 0.09, + "learning_rate": 4.9580605562956675e-06, + "loss": 1.2157, + "step": 2876 + }, + { + "epoch": 0.09, + "learning_rate": 4.95801605333293e-06, + "loss": 1.129, + "step": 2877 + }, + { + "epoch": 0.09, + "learning_rate": 4.957971526971064e-06, + "loss": 1.0671, + "step": 2878 + }, + { + "epoch": 0.09, + "learning_rate": 4.957926977210492e-06, + "loss": 1.1183, + "step": 2879 + }, + { + "epoch": 0.09, + "learning_rate": 4.957882404051641e-06, + "loss": 1.252, + "step": 2880 + }, + { + "epoch": 0.09, + "learning_rate": 4.957837807494932e-06, + "loss": 1.1669, + "step": 2881 + }, + { + "epoch": 0.09, + "learning_rate": 4.95779318754079e-06, + "loss": 1.1483, + "step": 2882 + }, + { + "epoch": 0.09, + "learning_rate": 4.957748544189642e-06, + "loss": 1.1284, + "step": 2883 + }, + { + "epoch": 0.09, + "learning_rate": 4.957703877441911e-06, + "loss": 1.2583, + "step": 2884 + }, + { + "epoch": 0.09, + "learning_rate": 4.957659187298022e-06, + "loss": 1.1362, + "step": 2885 + }, + { + "epoch": 0.09, + "learning_rate": 4.957614473758402e-06, + "loss": 1.3756, + "step": 2886 + }, + { + "epoch": 0.09, + "learning_rate": 4.957569736823476e-06, + "loss": 1.2623, + "step": 2887 + }, + { + "epoch": 0.09, + "learning_rate": 4.95752497649367e-06, + "loss": 1.2458, + "step": 2888 + }, + { + "epoch": 0.09, + "learning_rate": 4.957480192769408e-06, + "loss": 1.2186, + "step": 2889 + }, + { + "epoch": 0.09, + "learning_rate": 4.95743538565112e-06, + "loss": 1.1446, + "step": 2890 + }, + { + "epoch": 0.09, + "learning_rate": 4.95739055513923e-06, + "loss": 1.1368, + "step": 2891 + }, + { + "epoch": 0.09, + "learning_rate": 4.957345701234165e-06, + "loss": 1.0597, + "step": 2892 + }, + { + "epoch": 0.09, + "learning_rate": 4.9573008239363535e-06, + "loss": 1.0554, + "step": 2893 + }, + { + "epoch": 0.09, + "learning_rate": 4.957255923246221e-06, + "loss": 1.1425, + "step": 2894 + }, + { + "epoch": 0.09, + "learning_rate": 4.957210999164196e-06, + "loss": 1.1835, + "step": 2895 + }, + { + "epoch": 0.09, + "learning_rate": 4.957166051690705e-06, + "loss": 1.1287, + "step": 2896 + }, + { + "epoch": 0.09, + "learning_rate": 4.957121080826177e-06, + "loss": 1.1, + "step": 2897 + }, + { + "epoch": 0.09, + "learning_rate": 4.957076086571039e-06, + "loss": 1.0518, + "step": 2898 + }, + { + "epoch": 0.09, + "learning_rate": 4.957031068925721e-06, + "loss": 1.1307, + "step": 2899 + }, + { + "epoch": 0.09, + "learning_rate": 4.9569860278906504e-06, + "loss": 1.2936, + "step": 2900 + }, + { + "epoch": 0.09, + "learning_rate": 4.956940963466256e-06, + "loss": 1.1915, + "step": 2901 + }, + { + "epoch": 0.09, + "learning_rate": 4.956895875652967e-06, + "loss": 1.1116, + "step": 2902 + }, + { + "epoch": 0.09, + "learning_rate": 4.956850764451212e-06, + "loss": 1.1787, + "step": 2903 + }, + { + "epoch": 0.09, + "learning_rate": 4.956805629861421e-06, + "loss": 1.124, + "step": 2904 + }, + { + "epoch": 0.09, + "learning_rate": 4.9567604718840246e-06, + "loss": 1.1401, + "step": 2905 + }, + { + "epoch": 0.09, + "learning_rate": 4.956715290519452e-06, + "loss": 1.1183, + "step": 2906 + }, + { + "epoch": 0.09, + "learning_rate": 4.956670085768132e-06, + "loss": 1.1266, + "step": 2907 + }, + { + "epoch": 0.09, + "learning_rate": 4.956624857630496e-06, + "loss": 1.0953, + "step": 2908 + }, + { + "epoch": 0.09, + "learning_rate": 4.956579606106974e-06, + "loss": 1.1782, + "step": 2909 + }, + { + "epoch": 0.09, + "learning_rate": 4.956534331197998e-06, + "loss": 1.1417, + "step": 2910 + }, + { + "epoch": 0.09, + "learning_rate": 4.956489032903998e-06, + "loss": 1.1989, + "step": 2911 + }, + { + "epoch": 0.09, + "learning_rate": 4.956443711225406e-06, + "loss": 1.2491, + "step": 2912 + }, + { + "epoch": 0.09, + "learning_rate": 4.956398366162652e-06, + "loss": 1.141, + "step": 2913 + }, + { + "epoch": 0.09, + "learning_rate": 4.95635299771617e-06, + "loss": 1.1619, + "step": 2914 + }, + { + "epoch": 0.09, + "learning_rate": 4.95630760588639e-06, + "loss": 1.21, + "step": 2915 + }, + { + "epoch": 0.09, + "learning_rate": 4.956262190673744e-06, + "loss": 1.0958, + "step": 2916 + }, + { + "epoch": 0.09, + "learning_rate": 4.9562167520786655e-06, + "loss": 1.2206, + "step": 2917 + }, + { + "epoch": 0.09, + "learning_rate": 4.956171290101585e-06, + "loss": 1.2473, + "step": 2918 + }, + { + "epoch": 0.09, + "learning_rate": 4.956125804742939e-06, + "loss": 1.0616, + "step": 2919 + }, + { + "epoch": 0.09, + "learning_rate": 4.956080296003157e-06, + "loss": 1.2001, + "step": 2920 + }, + { + "epoch": 0.09, + "learning_rate": 4.956034763882674e-06, + "loss": 1.1131, + "step": 2921 + }, + { + "epoch": 0.09, + "learning_rate": 4.955989208381922e-06, + "loss": 1.1091, + "step": 2922 + }, + { + "epoch": 0.09, + "learning_rate": 4.955943629501336e-06, + "loss": 1.1005, + "step": 2923 + }, + { + "epoch": 0.09, + "learning_rate": 4.95589802724135e-06, + "loss": 1.078, + "step": 2924 + }, + { + "epoch": 0.09, + "learning_rate": 4.955852401602398e-06, + "loss": 1.1754, + "step": 2925 + }, + { + "epoch": 0.09, + "learning_rate": 4.955806752584913e-06, + "loss": 1.2648, + "step": 2926 + }, + { + "epoch": 0.09, + "learning_rate": 4.955761080189331e-06, + "loss": 1.1819, + "step": 2927 + }, + { + "epoch": 0.09, + "learning_rate": 4.955715384416085e-06, + "loss": 1.1382, + "step": 2928 + }, + { + "epoch": 0.09, + "learning_rate": 4.955669665265612e-06, + "loss": 1.2815, + "step": 2929 + }, + { + "epoch": 0.09, + "learning_rate": 4.955623922738347e-06, + "loss": 1.1447, + "step": 2930 + }, + { + "epoch": 0.09, + "learning_rate": 4.955578156834724e-06, + "loss": 1.1628, + "step": 2931 + }, + { + "epoch": 0.09, + "learning_rate": 4.9555323675551806e-06, + "loss": 1.194, + "step": 2932 + }, + { + "epoch": 0.09, + "learning_rate": 4.955486554900152e-06, + "loss": 1.149, + "step": 2933 + }, + { + "epoch": 0.09, + "learning_rate": 4.955440718870073e-06, + "loss": 1.1058, + "step": 2934 + }, + { + "epoch": 0.09, + "learning_rate": 4.95539485946538e-06, + "loss": 1.1619, + "step": 2935 + }, + { + "epoch": 0.09, + "learning_rate": 4.955348976686513e-06, + "loss": 1.2661, + "step": 2936 + }, + { + "epoch": 0.09, + "learning_rate": 4.9553030705339045e-06, + "loss": 1.1799, + "step": 2937 + }, + { + "epoch": 0.09, + "learning_rate": 4.955257141007993e-06, + "loss": 1.1459, + "step": 2938 + }, + { + "epoch": 0.09, + "learning_rate": 4.955211188109217e-06, + "loss": 1.088, + "step": 2939 + }, + { + "epoch": 0.09, + "learning_rate": 4.955165211838013e-06, + "loss": 1.1271, + "step": 2940 + }, + { + "epoch": 0.09, + "learning_rate": 4.955119212194818e-06, + "loss": 1.1577, + "step": 2941 + }, + { + "epoch": 0.09, + "learning_rate": 4.955073189180071e-06, + "loss": 1.1111, + "step": 2942 + }, + { + "epoch": 0.09, + "learning_rate": 4.955027142794209e-06, + "loss": 1.249, + "step": 2943 + }, + { + "epoch": 0.09, + "learning_rate": 4.954981073037672e-06, + "loss": 1.0096, + "step": 2944 + }, + { + "epoch": 0.09, + "learning_rate": 4.954934979910897e-06, + "loss": 1.2083, + "step": 2945 + }, + { + "epoch": 0.09, + "learning_rate": 4.954888863414323e-06, + "loss": 1.1092, + "step": 2946 + }, + { + "epoch": 0.09, + "learning_rate": 4.95484272354839e-06, + "loss": 1.1303, + "step": 2947 + }, + { + "epoch": 0.09, + "learning_rate": 4.954796560313536e-06, + "loss": 1.1561, + "step": 2948 + }, + { + "epoch": 0.09, + "learning_rate": 4.9547503737102005e-06, + "loss": 1.2074, + "step": 2949 + }, + { + "epoch": 0.09, + "learning_rate": 4.954704163738825e-06, + "loss": 1.2646, + "step": 2950 + }, + { + "epoch": 0.09, + "learning_rate": 4.954657930399848e-06, + "loss": 1.2678, + "step": 2951 + }, + { + "epoch": 0.09, + "learning_rate": 4.954611673693709e-06, + "loss": 1.1319, + "step": 2952 + }, + { + "epoch": 0.09, + "learning_rate": 4.954565393620849e-06, + "loss": 1.0924, + "step": 2953 + }, + { + "epoch": 0.09, + "learning_rate": 4.954519090181709e-06, + "loss": 1.1284, + "step": 2954 + }, + { + "epoch": 0.09, + "learning_rate": 4.95447276337673e-06, + "loss": 1.1402, + "step": 2955 + }, + { + "epoch": 0.09, + "learning_rate": 4.954426413206351e-06, + "loss": 1.2806, + "step": 2956 + }, + { + "epoch": 0.09, + "learning_rate": 4.954380039671016e-06, + "loss": 1.0561, + "step": 2957 + }, + { + "epoch": 0.09, + "learning_rate": 4.954333642771164e-06, + "loss": 1.1332, + "step": 2958 + }, + { + "epoch": 0.09, + "learning_rate": 4.954287222507238e-06, + "loss": 1.1481, + "step": 2959 + }, + { + "epoch": 0.09, + "learning_rate": 4.9542407788796796e-06, + "loss": 1.2453, + "step": 2960 + }, + { + "epoch": 0.09, + "learning_rate": 4.954194311888932e-06, + "loss": 1.179, + "step": 2961 + }, + { + "epoch": 0.09, + "learning_rate": 4.954147821535435e-06, + "loss": 1.1689, + "step": 2962 + }, + { + "epoch": 0.09, + "learning_rate": 4.954101307819634e-06, + "loss": 1.1328, + "step": 2963 + }, + { + "epoch": 0.09, + "learning_rate": 4.954054770741969e-06, + "loss": 1.0934, + "step": 2964 + }, + { + "epoch": 0.09, + "learning_rate": 4.9540082103028865e-06, + "loss": 1.1627, + "step": 2965 + }, + { + "epoch": 0.09, + "learning_rate": 4.9539616265028266e-06, + "loss": 1.1274, + "step": 2966 + }, + { + "epoch": 0.09, + "learning_rate": 4.953915019342234e-06, + "loss": 1.1003, + "step": 2967 + }, + { + "epoch": 0.09, + "learning_rate": 4.953868388821552e-06, + "loss": 1.2547, + "step": 2968 + }, + { + "epoch": 0.09, + "learning_rate": 4.953821734941226e-06, + "loss": 1.146, + "step": 2969 + }, + { + "epoch": 0.09, + "learning_rate": 4.953775057701698e-06, + "loss": 1.2314, + "step": 2970 + }, + { + "epoch": 0.09, + "learning_rate": 4.9537283571034125e-06, + "loss": 1.0841, + "step": 2971 + }, + { + "epoch": 0.09, + "learning_rate": 4.953681633146815e-06, + "loss": 1.2333, + "step": 2972 + }, + { + "epoch": 0.09, + "learning_rate": 4.95363488583235e-06, + "loss": 1.1464, + "step": 2973 + }, + { + "epoch": 0.09, + "learning_rate": 4.953588115160463e-06, + "loss": 1.1412, + "step": 2974 + }, + { + "epoch": 0.09, + "learning_rate": 4.9535413211316e-06, + "loss": 1.106, + "step": 2975 + }, + { + "epoch": 0.09, + "learning_rate": 4.953494503746203e-06, + "loss": 1.1857, + "step": 2976 + }, + { + "epoch": 0.09, + "learning_rate": 4.953447663004723e-06, + "loss": 1.1918, + "step": 2977 + }, + { + "epoch": 0.09, + "learning_rate": 4.9534007989076e-06, + "loss": 1.199, + "step": 2978 + }, + { + "epoch": 0.09, + "learning_rate": 4.9533539114552845e-06, + "loss": 1.1473, + "step": 2979 + }, + { + "epoch": 0.09, + "learning_rate": 4.95330700064822e-06, + "loss": 1.174, + "step": 2980 + }, + { + "epoch": 0.09, + "learning_rate": 4.953260066486856e-06, + "loss": 1.2944, + "step": 2981 + }, + { + "epoch": 0.09, + "learning_rate": 4.9532131089716365e-06, + "loss": 1.0835, + "step": 2982 + }, + { + "epoch": 0.09, + "learning_rate": 4.9531661281030104e-06, + "loss": 1.1403, + "step": 2983 + }, + { + "epoch": 0.09, + "learning_rate": 4.953119123881424e-06, + "loss": 1.053, + "step": 2984 + }, + { + "epoch": 0.09, + "learning_rate": 4.953072096307325e-06, + "loss": 1.164, + "step": 2985 + }, + { + "epoch": 0.09, + "learning_rate": 4.953025045381161e-06, + "loss": 1.0737, + "step": 2986 + }, + { + "epoch": 0.09, + "learning_rate": 4.95297797110338e-06, + "loss": 1.2275, + "step": 2987 + }, + { + "epoch": 0.09, + "learning_rate": 4.952930873474431e-06, + "loss": 1.0624, + "step": 2988 + }, + { + "epoch": 0.09, + "learning_rate": 4.95288375249476e-06, + "loss": 1.243, + "step": 2989 + }, + { + "epoch": 0.09, + "learning_rate": 4.952836608164818e-06, + "loss": 1.1124, + "step": 2990 + }, + { + "epoch": 0.09, + "learning_rate": 4.952789440485053e-06, + "loss": 1.1404, + "step": 2991 + }, + { + "epoch": 0.09, + "learning_rate": 4.952742249455913e-06, + "loss": 1.1454, + "step": 2992 + }, + { + "epoch": 0.09, + "learning_rate": 4.952695035077848e-06, + "loss": 1.2654, + "step": 2993 + }, + { + "epoch": 0.09, + "learning_rate": 4.952647797351308e-06, + "loss": 1.1131, + "step": 2994 + }, + { + "epoch": 0.09, + "learning_rate": 4.952600536276743e-06, + "loss": 1.2073, + "step": 2995 + }, + { + "epoch": 0.09, + "learning_rate": 4.9525532518546e-06, + "loss": 1.1879, + "step": 2996 + }, + { + "epoch": 0.09, + "learning_rate": 4.952505944085333e-06, + "loss": 1.1146, + "step": 2997 + }, + { + "epoch": 0.09, + "learning_rate": 4.95245861296939e-06, + "loss": 1.1635, + "step": 2998 + }, + { + "epoch": 0.09, + "learning_rate": 4.952411258507223e-06, + "loss": 1.2443, + "step": 2999 + }, + { + "epoch": 0.09, + "learning_rate": 4.95236388069928e-06, + "loss": 1.0307, + "step": 3000 + }, + { + "epoch": 0.09, + "learning_rate": 4.952316479546015e-06, + "loss": 1.1652, + "step": 3001 + }, + { + "epoch": 0.09, + "learning_rate": 4.9522690550478795e-06, + "loss": 1.1127, + "step": 3002 + }, + { + "epoch": 0.09, + "learning_rate": 4.9522216072053216e-06, + "loss": 1.2559, + "step": 3003 + }, + { + "epoch": 0.09, + "learning_rate": 4.952174136018796e-06, + "loss": 1.0496, + "step": 3004 + }, + { + "epoch": 0.09, + "learning_rate": 4.952126641488754e-06, + "loss": 1.2035, + "step": 3005 + }, + { + "epoch": 0.09, + "learning_rate": 4.952079123615647e-06, + "loss": 1.1141, + "step": 3006 + }, + { + "epoch": 0.09, + "learning_rate": 4.952031582399927e-06, + "loss": 1.1975, + "step": 3007 + }, + { + "epoch": 0.09, + "learning_rate": 4.951984017842048e-06, + "loss": 1.1378, + "step": 3008 + }, + { + "epoch": 0.09, + "learning_rate": 4.951936429942462e-06, + "loss": 1.1065, + "step": 3009 + }, + { + "epoch": 0.09, + "learning_rate": 4.951888818701623e-06, + "loss": 1.0911, + "step": 3010 + }, + { + "epoch": 0.09, + "learning_rate": 4.951841184119981e-06, + "loss": 1.174, + "step": 3011 + }, + { + "epoch": 0.09, + "learning_rate": 4.951793526197993e-06, + "loss": 1.055, + "step": 3012 + }, + { + "epoch": 0.09, + "learning_rate": 4.951745844936112e-06, + "loss": 1.2589, + "step": 3013 + }, + { + "epoch": 0.09, + "learning_rate": 4.951698140334791e-06, + "loss": 1.1311, + "step": 3014 + }, + { + "epoch": 0.09, + "learning_rate": 4.951650412394484e-06, + "loss": 1.162, + "step": 3015 + }, + { + "epoch": 0.09, + "learning_rate": 4.951602661115647e-06, + "loss": 1.1169, + "step": 3016 + }, + { + "epoch": 0.09, + "learning_rate": 4.9515548864987315e-06, + "loss": 1.1342, + "step": 3017 + }, + { + "epoch": 0.09, + "learning_rate": 4.951507088544196e-06, + "loss": 1.2395, + "step": 3018 + }, + { + "epoch": 0.09, + "learning_rate": 4.951459267252493e-06, + "loss": 1.0309, + "step": 3019 + }, + { + "epoch": 0.09, + "learning_rate": 4.9514114226240785e-06, + "loss": 1.1552, + "step": 3020 + }, + { + "epoch": 0.09, + "learning_rate": 4.951363554659408e-06, + "loss": 1.116, + "step": 3021 + }, + { + "epoch": 0.09, + "learning_rate": 4.951315663358936e-06, + "loss": 1.1329, + "step": 3022 + }, + { + "epoch": 0.09, + "learning_rate": 4.951267748723121e-06, + "loss": 1.2539, + "step": 3023 + }, + { + "epoch": 0.09, + "learning_rate": 4.951219810752417e-06, + "loss": 1.1234, + "step": 3024 + }, + { + "epoch": 0.09, + "learning_rate": 4.951171849447281e-06, + "loss": 1.2551, + "step": 3025 + }, + { + "epoch": 0.09, + "learning_rate": 4.9511238648081695e-06, + "loss": 1.1614, + "step": 3026 + }, + { + "epoch": 0.09, + "learning_rate": 4.951075856835539e-06, + "loss": 1.1934, + "step": 3027 + }, + { + "epoch": 0.09, + "learning_rate": 4.951027825529847e-06, + "loss": 1.1982, + "step": 3028 + }, + { + "epoch": 0.09, + "learning_rate": 4.950979770891551e-06, + "loss": 1.2494, + "step": 3029 + }, + { + "epoch": 0.09, + "learning_rate": 4.950931692921107e-06, + "loss": 1.1052, + "step": 3030 + }, + { + "epoch": 0.09, + "learning_rate": 4.950883591618974e-06, + "loss": 1.1008, + "step": 3031 + }, + { + "epoch": 0.09, + "learning_rate": 4.950835466985611e-06, + "loss": 1.1154, + "step": 3032 + }, + { + "epoch": 0.09, + "learning_rate": 4.9507873190214735e-06, + "loss": 1.1808, + "step": 3033 + }, + { + "epoch": 0.09, + "learning_rate": 4.950739147727022e-06, + "loss": 1.1859, + "step": 3034 + }, + { + "epoch": 0.09, + "learning_rate": 4.9506909531027125e-06, + "loss": 1.1058, + "step": 3035 + }, + { + "epoch": 0.09, + "learning_rate": 4.950642735149007e-06, + "loss": 1.1637, + "step": 3036 + }, + { + "epoch": 0.09, + "learning_rate": 4.950594493866362e-06, + "loss": 1.1268, + "step": 3037 + }, + { + "epoch": 0.09, + "learning_rate": 4.9505462292552375e-06, + "loss": 1.215, + "step": 3038 + }, + { + "epoch": 0.09, + "learning_rate": 4.9504979413160936e-06, + "loss": 1.1657, + "step": 3039 + }, + { + "epoch": 0.09, + "learning_rate": 4.9504496300493895e-06, + "loss": 1.1212, + "step": 3040 + }, + { + "epoch": 0.09, + "learning_rate": 4.9504012954555845e-06, + "loss": 1.1094, + "step": 3041 + }, + { + "epoch": 0.09, + "learning_rate": 4.95035293753514e-06, + "loss": 1.1282, + "step": 3042 + }, + { + "epoch": 0.09, + "learning_rate": 4.950304556288515e-06, + "loss": 1.2154, + "step": 3043 + }, + { + "epoch": 0.09, + "learning_rate": 4.950256151716172e-06, + "loss": 1.2187, + "step": 3044 + }, + { + "epoch": 0.09, + "learning_rate": 4.95020772381857e-06, + "loss": 1.1254, + "step": 3045 + }, + { + "epoch": 0.09, + "learning_rate": 4.95015927259617e-06, + "loss": 1.0997, + "step": 3046 + }, + { + "epoch": 0.09, + "learning_rate": 4.950110798049434e-06, + "loss": 1.166, + "step": 3047 + }, + { + "epoch": 0.09, + "learning_rate": 4.9500623001788225e-06, + "loss": 1.2461, + "step": 3048 + }, + { + "epoch": 0.09, + "learning_rate": 4.950013778984799e-06, + "loss": 1.1938, + "step": 3049 + }, + { + "epoch": 0.09, + "learning_rate": 4.949965234467824e-06, + "loss": 1.207, + "step": 3050 + }, + { + "epoch": 0.09, + "learning_rate": 4.94991666662836e-06, + "loss": 1.1436, + "step": 3051 + }, + { + "epoch": 0.09, + "learning_rate": 4.9498680754668695e-06, + "loss": 1.1876, + "step": 3052 + }, + { + "epoch": 0.09, + "learning_rate": 4.949819460983814e-06, + "loss": 1.129, + "step": 3053 + }, + { + "epoch": 0.09, + "learning_rate": 4.9497708231796576e-06, + "loss": 1.1506, + "step": 3054 + }, + { + "epoch": 0.09, + "learning_rate": 4.949722162054863e-06, + "loss": 1.1866, + "step": 3055 + }, + { + "epoch": 0.09, + "learning_rate": 4.949673477609893e-06, + "loss": 1.2469, + "step": 3056 + }, + { + "epoch": 0.09, + "learning_rate": 4.949624769845211e-06, + "loss": 1.0456, + "step": 3057 + }, + { + "epoch": 0.09, + "learning_rate": 4.9495760387612816e-06, + "loss": 1.1716, + "step": 3058 + }, + { + "epoch": 0.09, + "learning_rate": 4.949527284358567e-06, + "loss": 1.1522, + "step": 3059 + }, + { + "epoch": 0.09, + "learning_rate": 4.949478506637533e-06, + "loss": 1.1436, + "step": 3060 + }, + { + "epoch": 0.09, + "learning_rate": 4.949429705598644e-06, + "loss": 1.1643, + "step": 3061 + }, + { + "epoch": 0.09, + "learning_rate": 4.949380881242363e-06, + "loss": 1.0874, + "step": 3062 + }, + { + "epoch": 0.09, + "learning_rate": 4.949332033569156e-06, + "loss": 1.0877, + "step": 3063 + }, + { + "epoch": 0.09, + "learning_rate": 4.949283162579488e-06, + "loss": 1.1614, + "step": 3064 + }, + { + "epoch": 0.09, + "learning_rate": 4.949234268273824e-06, + "loss": 1.0795, + "step": 3065 + }, + { + "epoch": 0.09, + "learning_rate": 4.949185350652628e-06, + "loss": 1.1821, + "step": 3066 + }, + { + "epoch": 0.09, + "learning_rate": 4.949136409716369e-06, + "loss": 1.1685, + "step": 3067 + }, + { + "epoch": 0.09, + "learning_rate": 4.949087445465509e-06, + "loss": 1.2958, + "step": 3068 + }, + { + "epoch": 0.09, + "learning_rate": 4.949038457900517e-06, + "loss": 1.1119, + "step": 3069 + }, + { + "epoch": 0.09, + "learning_rate": 4.9489894470218584e-06, + "loss": 1.1686, + "step": 3070 + }, + { + "epoch": 0.09, + "learning_rate": 4.94894041283e-06, + "loss": 1.1072, + "step": 3071 + }, + { + "epoch": 0.09, + "learning_rate": 4.9488913553254074e-06, + "loss": 1.1416, + "step": 3072 + }, + { + "epoch": 0.09, + "learning_rate": 4.94884227450855e-06, + "loss": 1.2028, + "step": 3073 + }, + { + "epoch": 0.09, + "learning_rate": 4.948793170379892e-06, + "loss": 1.1866, + "step": 3074 + }, + { + "epoch": 0.09, + "learning_rate": 4.948744042939903e-06, + "loss": 1.135, + "step": 3075 + }, + { + "epoch": 0.09, + "learning_rate": 4.9486948921890495e-06, + "loss": 1.1364, + "step": 3076 + }, + { + "epoch": 0.09, + "learning_rate": 4.9486457181278016e-06, + "loss": 1.178, + "step": 3077 + }, + { + "epoch": 0.09, + "learning_rate": 4.9485965207566245e-06, + "loss": 1.1921, + "step": 3078 + }, + { + "epoch": 0.09, + "learning_rate": 4.9485473000759875e-06, + "loss": 1.2326, + "step": 3079 + }, + { + "epoch": 0.09, + "learning_rate": 4.948498056086361e-06, + "loss": 1.233, + "step": 3080 + }, + { + "epoch": 0.09, + "learning_rate": 4.94844878878821e-06, + "loss": 1.2241, + "step": 3081 + }, + { + "epoch": 0.09, + "learning_rate": 4.9483994981820075e-06, + "loss": 1.092, + "step": 3082 + }, + { + "epoch": 0.09, + "learning_rate": 4.94835018426822e-06, + "loss": 1.0873, + "step": 3083 + }, + { + "epoch": 0.09, + "learning_rate": 4.9483008470473186e-06, + "loss": 1.1432, + "step": 3084 + }, + { + "epoch": 0.09, + "learning_rate": 4.9482514865197726e-06, + "loss": 1.0893, + "step": 3085 + }, + { + "epoch": 0.09, + "learning_rate": 4.948202102686051e-06, + "loss": 1.2275, + "step": 3086 + }, + { + "epoch": 0.09, + "learning_rate": 4.948152695546624e-06, + "loss": 1.0777, + "step": 3087 + }, + { + "epoch": 0.09, + "learning_rate": 4.948103265101964e-06, + "loss": 1.0773, + "step": 3088 + }, + { + "epoch": 0.09, + "learning_rate": 4.948053811352538e-06, + "loss": 1.0984, + "step": 3089 + }, + { + "epoch": 0.09, + "learning_rate": 4.948004334298819e-06, + "loss": 1.1216, + "step": 3090 + }, + { + "epoch": 0.09, + "learning_rate": 4.947954833941279e-06, + "loss": 1.2062, + "step": 3091 + }, + { + "epoch": 0.09, + "learning_rate": 4.947905310280388e-06, + "loss": 1.2548, + "step": 3092 + }, + { + "epoch": 0.09, + "learning_rate": 4.947855763316616e-06, + "loss": 1.224, + "step": 3093 + }, + { + "epoch": 0.09, + "learning_rate": 4.947806193050436e-06, + "loss": 1.2088, + "step": 3094 + }, + { + "epoch": 0.09, + "learning_rate": 4.947756599482321e-06, + "loss": 1.1069, + "step": 3095 + }, + { + "epoch": 0.09, + "learning_rate": 4.947706982612742e-06, + "loss": 1.1532, + "step": 3096 + }, + { + "epoch": 0.09, + "learning_rate": 4.947657342442171e-06, + "loss": 1.1392, + "step": 3097 + }, + { + "epoch": 0.09, + "learning_rate": 4.947607678971082e-06, + "loss": 1.1431, + "step": 3098 + }, + { + "epoch": 0.09, + "learning_rate": 4.9475579921999455e-06, + "loss": 1.1683, + "step": 3099 + }, + { + "epoch": 0.09, + "learning_rate": 4.947508282129235e-06, + "loss": 1.239, + "step": 3100 + }, + { + "epoch": 0.09, + "learning_rate": 4.9474585487594265e-06, + "loss": 1.1583, + "step": 3101 + }, + { + "epoch": 0.09, + "learning_rate": 4.94740879209099e-06, + "loss": 1.1873, + "step": 3102 + }, + { + "epoch": 0.09, + "learning_rate": 4.947359012124401e-06, + "loss": 1.1223, + "step": 3103 + }, + { + "epoch": 0.09, + "learning_rate": 4.947309208860132e-06, + "loss": 1.1236, + "step": 3104 + }, + { + "epoch": 0.09, + "learning_rate": 4.947259382298659e-06, + "loss": 1.0648, + "step": 3105 + }, + { + "epoch": 0.09, + "learning_rate": 4.947209532440455e-06, + "loss": 1.1274, + "step": 3106 + }, + { + "epoch": 0.09, + "learning_rate": 4.947159659285994e-06, + "loss": 1.2524, + "step": 3107 + }, + { + "epoch": 0.09, + "learning_rate": 4.947109762835753e-06, + "loss": 1.0714, + "step": 3108 + }, + { + "epoch": 0.09, + "learning_rate": 4.947059843090205e-06, + "loss": 1.1623, + "step": 3109 + }, + { + "epoch": 0.09, + "learning_rate": 4.947009900049826e-06, + "loss": 1.046, + "step": 3110 + }, + { + "epoch": 0.09, + "learning_rate": 4.946959933715091e-06, + "loss": 1.1246, + "step": 3111 + }, + { + "epoch": 0.09, + "learning_rate": 4.946909944086477e-06, + "loss": 1.191, + "step": 3112 + }, + { + "epoch": 0.09, + "learning_rate": 4.946859931164457e-06, + "loss": 1.1734, + "step": 3113 + }, + { + "epoch": 0.09, + "learning_rate": 4.94680989494951e-06, + "loss": 1.0986, + "step": 3114 + }, + { + "epoch": 0.09, + "learning_rate": 4.946759835442111e-06, + "loss": 1.2231, + "step": 3115 + }, + { + "epoch": 0.09, + "learning_rate": 4.9467097526427365e-06, + "loss": 1.1915, + "step": 3116 + }, + { + "epoch": 0.09, + "learning_rate": 4.946659646551864e-06, + "loss": 1.1704, + "step": 3117 + }, + { + "epoch": 0.09, + "learning_rate": 4.94660951716997e-06, + "loss": 1.2746, + "step": 3118 + }, + { + "epoch": 0.09, + "learning_rate": 4.946559364497532e-06, + "loss": 1.2865, + "step": 3119 + }, + { + "epoch": 0.09, + "learning_rate": 4.9465091885350265e-06, + "loss": 1.0979, + "step": 3120 + }, + { + "epoch": 0.09, + "learning_rate": 4.946458989282932e-06, + "loss": 1.0971, + "step": 3121 + }, + { + "epoch": 0.09, + "learning_rate": 4.946408766741726e-06, + "loss": 1.1631, + "step": 3122 + }, + { + "epoch": 0.09, + "learning_rate": 4.946358520911887e-06, + "loss": 1.2045, + "step": 3123 + }, + { + "epoch": 0.09, + "learning_rate": 4.9463082517938934e-06, + "loss": 1.0795, + "step": 3124 + }, + { + "epoch": 0.09, + "learning_rate": 4.946257959388223e-06, + "loss": 1.252, + "step": 3125 + }, + { + "epoch": 0.09, + "learning_rate": 4.946207643695355e-06, + "loss": 1.205, + "step": 3126 + }, + { + "epoch": 0.09, + "learning_rate": 4.9461573047157686e-06, + "loss": 1.1415, + "step": 3127 + }, + { + "epoch": 0.09, + "learning_rate": 4.946106942449942e-06, + "loss": 1.1571, + "step": 3128 + }, + { + "epoch": 0.09, + "learning_rate": 4.946056556898357e-06, + "loss": 1.0463, + "step": 3129 + }, + { + "epoch": 0.09, + "learning_rate": 4.94600614806149e-06, + "loss": 1.2162, + "step": 3130 + }, + { + "epoch": 0.09, + "learning_rate": 4.945955715939823e-06, + "loss": 1.137, + "step": 3131 + }, + { + "epoch": 0.09, + "learning_rate": 4.945905260533836e-06, + "loss": 1.1024, + "step": 3132 + }, + { + "epoch": 0.09, + "learning_rate": 4.945854781844009e-06, + "loss": 1.1042, + "step": 3133 + }, + { + "epoch": 0.09, + "learning_rate": 4.945804279870822e-06, + "loss": 1.1397, + "step": 3134 + }, + { + "epoch": 0.09, + "learning_rate": 4.945753754614756e-06, + "loss": 1.1523, + "step": 3135 + }, + { + "epoch": 0.09, + "learning_rate": 4.945703206076293e-06, + "loss": 1.2143, + "step": 3136 + }, + { + "epoch": 0.09, + "learning_rate": 4.945652634255912e-06, + "loss": 1.1299, + "step": 3137 + }, + { + "epoch": 0.09, + "learning_rate": 4.945602039154097e-06, + "loss": 1.328, + "step": 3138 + }, + { + "epoch": 0.09, + "learning_rate": 4.945551420771329e-06, + "loss": 1.0591, + "step": 3139 + }, + { + "epoch": 0.09, + "learning_rate": 4.945500779108088e-06, + "loss": 1.1744, + "step": 3140 + }, + { + "epoch": 0.09, + "learning_rate": 4.945450114164858e-06, + "loss": 1.1287, + "step": 3141 + }, + { + "epoch": 0.09, + "learning_rate": 4.94539942594212e-06, + "loss": 1.1609, + "step": 3142 + }, + { + "epoch": 0.09, + "learning_rate": 4.945348714440357e-06, + "loss": 1.1583, + "step": 3143 + }, + { + "epoch": 0.09, + "learning_rate": 4.945297979660053e-06, + "loss": 1.0555, + "step": 3144 + }, + { + "epoch": 0.09, + "learning_rate": 4.94524722160169e-06, + "loss": 1.1729, + "step": 3145 + }, + { + "epoch": 0.09, + "learning_rate": 4.94519644026575e-06, + "loss": 1.1287, + "step": 3146 + }, + { + "epoch": 0.09, + "learning_rate": 4.9451456356527184e-06, + "loss": 1.0883, + "step": 3147 + }, + { + "epoch": 0.09, + "learning_rate": 4.945094807763078e-06, + "loss": 1.1818, + "step": 3148 + }, + { + "epoch": 0.09, + "learning_rate": 4.945043956597312e-06, + "loss": 1.1029, + "step": 3149 + }, + { + "epoch": 0.09, + "learning_rate": 4.944993082155906e-06, + "loss": 1.1542, + "step": 3150 + }, + { + "epoch": 0.09, + "learning_rate": 4.944942184439343e-06, + "loss": 1.155, + "step": 3151 + }, + { + "epoch": 0.09, + "learning_rate": 4.944891263448108e-06, + "loss": 1.1722, + "step": 3152 + }, + { + "epoch": 0.09, + "learning_rate": 4.944840319182685e-06, + "loss": 1.196, + "step": 3153 + }, + { + "epoch": 0.1, + "learning_rate": 4.94478935164356e-06, + "loss": 1.2339, + "step": 3154 + }, + { + "epoch": 0.1, + "learning_rate": 4.9447383608312185e-06, + "loss": 1.3003, + "step": 3155 + }, + { + "epoch": 0.1, + "learning_rate": 4.9446873467461445e-06, + "loss": 1.3044, + "step": 3156 + }, + { + "epoch": 0.1, + "learning_rate": 4.944636309388824e-06, + "loss": 1.1417, + "step": 3157 + }, + { + "epoch": 0.1, + "learning_rate": 4.944585248759744e-06, + "loss": 1.1194, + "step": 3158 + }, + { + "epoch": 0.1, + "learning_rate": 4.944534164859389e-06, + "loss": 1.2091, + "step": 3159 + }, + { + "epoch": 0.1, + "learning_rate": 4.944483057688248e-06, + "loss": 1.1187, + "step": 3160 + }, + { + "epoch": 0.1, + "learning_rate": 4.944431927246803e-06, + "loss": 1.1237, + "step": 3161 + }, + { + "epoch": 0.1, + "learning_rate": 4.944380773535545e-06, + "loss": 1.3811, + "step": 3162 + }, + { + "epoch": 0.1, + "learning_rate": 4.944329596554959e-06, + "loss": 1.0936, + "step": 3163 + }, + { + "epoch": 0.1, + "learning_rate": 4.944278396305532e-06, + "loss": 1.1062, + "step": 3164 + }, + { + "epoch": 0.1, + "learning_rate": 4.944227172787752e-06, + "loss": 1.0694, + "step": 3165 + }, + { + "epoch": 0.1, + "learning_rate": 4.9441759260021076e-06, + "loss": 1.1559, + "step": 3166 + }, + { + "epoch": 0.1, + "learning_rate": 4.944124655949084e-06, + "loss": 1.2209, + "step": 3167 + }, + { + "epoch": 0.1, + "learning_rate": 4.944073362629171e-06, + "loss": 1.1547, + "step": 3168 + }, + { + "epoch": 0.1, + "learning_rate": 4.9440220460428575e-06, + "loss": 1.1335, + "step": 3169 + }, + { + "epoch": 0.1, + "learning_rate": 4.9439707061906305e-06, + "loss": 1.3018, + "step": 3170 + }, + { + "epoch": 0.1, + "learning_rate": 4.94391934307298e-06, + "loss": 1.1504, + "step": 3171 + }, + { + "epoch": 0.1, + "learning_rate": 4.943867956690394e-06, + "loss": 1.1912, + "step": 3172 + }, + { + "epoch": 0.1, + "learning_rate": 4.943816547043362e-06, + "loss": 1.1115, + "step": 3173 + }, + { + "epoch": 0.1, + "learning_rate": 4.943765114132374e-06, + "loss": 1.3207, + "step": 3174 + }, + { + "epoch": 0.1, + "learning_rate": 4.9437136579579185e-06, + "loss": 1.056, + "step": 3175 + }, + { + "epoch": 0.1, + "learning_rate": 4.943662178520486e-06, + "loss": 1.0392, + "step": 3176 + }, + { + "epoch": 0.1, + "learning_rate": 4.943610675820567e-06, + "loss": 1.1793, + "step": 3177 + }, + { + "epoch": 0.1, + "learning_rate": 4.943559149858651e-06, + "loss": 1.0989, + "step": 3178 + }, + { + "epoch": 0.1, + "learning_rate": 4.943507600635229e-06, + "loss": 1.1898, + "step": 3179 + }, + { + "epoch": 0.1, + "learning_rate": 4.94345602815079e-06, + "loss": 1.1816, + "step": 3180 + }, + { + "epoch": 0.1, + "learning_rate": 4.943404432405828e-06, + "loss": 1.2255, + "step": 3181 + }, + { + "epoch": 0.1, + "learning_rate": 4.943352813400832e-06, + "loss": 1.1296, + "step": 3182 + }, + { + "epoch": 0.1, + "learning_rate": 4.943301171136294e-06, + "loss": 1.1248, + "step": 3183 + }, + { + "epoch": 0.1, + "learning_rate": 4.943249505612705e-06, + "loss": 1.0747, + "step": 3184 + }, + { + "epoch": 0.1, + "learning_rate": 4.943197816830559e-06, + "loss": 1.1115, + "step": 3185 + }, + { + "epoch": 0.1, + "learning_rate": 4.943146104790345e-06, + "loss": 1.132, + "step": 3186 + }, + { + "epoch": 0.1, + "learning_rate": 4.943094369492558e-06, + "loss": 1.1797, + "step": 3187 + }, + { + "epoch": 0.1, + "learning_rate": 4.9430426109376885e-06, + "loss": 1.2031, + "step": 3188 + }, + { + "epoch": 0.1, + "learning_rate": 4.9429908291262295e-06, + "loss": 1.1906, + "step": 3189 + }, + { + "epoch": 0.1, + "learning_rate": 4.942939024058675e-06, + "loss": 1.0386, + "step": 3190 + }, + { + "epoch": 0.1, + "learning_rate": 4.942887195735518e-06, + "loss": 1.1169, + "step": 3191 + }, + { + "epoch": 0.1, + "learning_rate": 4.94283534415725e-06, + "loss": 1.1697, + "step": 3192 + }, + { + "epoch": 0.1, + "learning_rate": 4.9427834693243674e-06, + "loss": 1.1342, + "step": 3193 + }, + { + "epoch": 0.1, + "learning_rate": 4.942731571237361e-06, + "loss": 1.3251, + "step": 3194 + }, + { + "epoch": 0.1, + "learning_rate": 4.942679649896729e-06, + "loss": 1.2008, + "step": 3195 + }, + { + "epoch": 0.1, + "learning_rate": 4.942627705302962e-06, + "loss": 1.2267, + "step": 3196 + }, + { + "epoch": 0.1, + "learning_rate": 4.9425757374565545e-06, + "loss": 1.2269, + "step": 3197 + }, + { + "epoch": 0.1, + "learning_rate": 4.942523746358004e-06, + "loss": 1.2325, + "step": 3198 + }, + { + "epoch": 0.1, + "learning_rate": 4.942471732007802e-06, + "loss": 1.1465, + "step": 3199 + }, + { + "epoch": 0.1, + "learning_rate": 4.942419694406447e-06, + "loss": 1.1619, + "step": 3200 + }, + { + "epoch": 0.1, + "learning_rate": 4.942367633554432e-06, + "loss": 1.1921, + "step": 3201 + }, + { + "epoch": 0.1, + "learning_rate": 4.942315549452254e-06, + "loss": 1.1981, + "step": 3202 + }, + { + "epoch": 0.1, + "learning_rate": 4.9422634421004075e-06, + "loss": 1.1534, + "step": 3203 + }, + { + "epoch": 0.1, + "learning_rate": 4.942211311499391e-06, + "loss": 1.1879, + "step": 3204 + }, + { + "epoch": 0.1, + "learning_rate": 4.942159157649698e-06, + "loss": 1.1458, + "step": 3205 + }, + { + "epoch": 0.1, + "learning_rate": 4.942106980551825e-06, + "loss": 1.0948, + "step": 3206 + }, + { + "epoch": 0.1, + "learning_rate": 4.942054780206271e-06, + "loss": 1.1998, + "step": 3207 + }, + { + "epoch": 0.1, + "learning_rate": 4.942002556613531e-06, + "loss": 1.0822, + "step": 3208 + }, + { + "epoch": 0.1, + "learning_rate": 4.941950309774103e-06, + "loss": 1.1339, + "step": 3209 + }, + { + "epoch": 0.1, + "learning_rate": 4.941898039688484e-06, + "loss": 1.0731, + "step": 3210 + }, + { + "epoch": 0.1, + "learning_rate": 4.941845746357171e-06, + "loss": 1.2609, + "step": 3211 + }, + { + "epoch": 0.1, + "learning_rate": 4.941793429780663e-06, + "loss": 1.1724, + "step": 3212 + }, + { + "epoch": 0.1, + "learning_rate": 4.941741089959459e-06, + "loss": 1.1368, + "step": 3213 + }, + { + "epoch": 0.1, + "learning_rate": 4.941688726894054e-06, + "loss": 1.1832, + "step": 3214 + }, + { + "epoch": 0.1, + "learning_rate": 4.941636340584949e-06, + "loss": 1.1823, + "step": 3215 + }, + { + "epoch": 0.1, + "learning_rate": 4.941583931032642e-06, + "loss": 1.1663, + "step": 3216 + }, + { + "epoch": 0.1, + "learning_rate": 4.9415314982376314e-06, + "loss": 1.1896, + "step": 3217 + }, + { + "epoch": 0.1, + "learning_rate": 4.941479042200417e-06, + "loss": 1.2441, + "step": 3218 + }, + { + "epoch": 0.1, + "learning_rate": 4.941426562921498e-06, + "loss": 1.2274, + "step": 3219 + }, + { + "epoch": 0.1, + "learning_rate": 4.941374060401375e-06, + "loss": 1.0997, + "step": 3220 + }, + { + "epoch": 0.1, + "learning_rate": 4.941321534640546e-06, + "loss": 1.1738, + "step": 3221 + }, + { + "epoch": 0.1, + "learning_rate": 4.941268985639512e-06, + "loss": 1.1628, + "step": 3222 + }, + { + "epoch": 0.1, + "learning_rate": 4.9412164133987725e-06, + "loss": 1.2013, + "step": 3223 + }, + { + "epoch": 0.1, + "learning_rate": 4.941163817918828e-06, + "loss": 1.302, + "step": 3224 + }, + { + "epoch": 0.1, + "learning_rate": 4.941111199200181e-06, + "loss": 1.2356, + "step": 3225 + }, + { + "epoch": 0.1, + "learning_rate": 4.94105855724333e-06, + "loss": 1.1663, + "step": 3226 + }, + { + "epoch": 0.1, + "learning_rate": 4.941005892048778e-06, + "loss": 1.144, + "step": 3227 + }, + { + "epoch": 0.1, + "learning_rate": 4.940953203617025e-06, + "loss": 1.1669, + "step": 3228 + }, + { + "epoch": 0.1, + "learning_rate": 4.9409004919485725e-06, + "loss": 1.1443, + "step": 3229 + }, + { + "epoch": 0.1, + "learning_rate": 4.940847757043924e-06, + "loss": 1.2047, + "step": 3230 + }, + { + "epoch": 0.1, + "learning_rate": 4.94079499890358e-06, + "loss": 1.1426, + "step": 3231 + }, + { + "epoch": 0.1, + "learning_rate": 4.940742217528043e-06, + "loss": 1.1597, + "step": 3232 + }, + { + "epoch": 0.1, + "learning_rate": 4.940689412917815e-06, + "loss": 1.1186, + "step": 3233 + }, + { + "epoch": 0.1, + "learning_rate": 4.9406365850734e-06, + "loss": 1.1689, + "step": 3234 + }, + { + "epoch": 0.1, + "learning_rate": 4.940583733995301e-06, + "loss": 1.1313, + "step": 3235 + }, + { + "epoch": 0.1, + "learning_rate": 4.9405308596840195e-06, + "loss": 1.3175, + "step": 3236 + }, + { + "epoch": 0.1, + "learning_rate": 4.940477962140059e-06, + "loss": 1.1793, + "step": 3237 + }, + { + "epoch": 0.1, + "learning_rate": 4.940425041363924e-06, + "loss": 1.213, + "step": 3238 + }, + { + "epoch": 0.1, + "learning_rate": 4.940372097356119e-06, + "loss": 1.1903, + "step": 3239 + }, + { + "epoch": 0.1, + "learning_rate": 4.940319130117146e-06, + "loss": 1.1159, + "step": 3240 + }, + { + "epoch": 0.1, + "learning_rate": 4.94026613964751e-06, + "loss": 1.0696, + "step": 3241 + }, + { + "epoch": 0.1, + "learning_rate": 4.940213125947716e-06, + "loss": 1.1241, + "step": 3242 + }, + { + "epoch": 0.1, + "learning_rate": 4.940160089018268e-06, + "loss": 1.1562, + "step": 3243 + }, + { + "epoch": 0.1, + "learning_rate": 4.940107028859672e-06, + "loss": 1.1665, + "step": 3244 + }, + { + "epoch": 0.1, + "learning_rate": 4.940053945472431e-06, + "loss": 1.2174, + "step": 3245 + }, + { + "epoch": 0.1, + "learning_rate": 4.940000838857053e-06, + "loss": 1.1779, + "step": 3246 + }, + { + "epoch": 0.1, + "learning_rate": 4.939947709014041e-06, + "loss": 1.1841, + "step": 3247 + }, + { + "epoch": 0.1, + "learning_rate": 4.939894555943903e-06, + "loss": 1.1656, + "step": 3248 + }, + { + "epoch": 0.1, + "learning_rate": 4.9398413796471425e-06, + "loss": 1.1201, + "step": 3249 + }, + { + "epoch": 0.1, + "learning_rate": 4.939788180124269e-06, + "loss": 1.2313, + "step": 3250 + }, + { + "epoch": 0.1, + "learning_rate": 4.939734957375785e-06, + "loss": 1.0853, + "step": 3251 + }, + { + "epoch": 0.1, + "learning_rate": 4.939681711402201e-06, + "loss": 1.2091, + "step": 3252 + }, + { + "epoch": 0.1, + "learning_rate": 4.939628442204021e-06, + "loss": 1.1669, + "step": 3253 + }, + { + "epoch": 0.1, + "learning_rate": 4.9395751497817535e-06, + "loss": 1.1957, + "step": 3254 + }, + { + "epoch": 0.1, + "learning_rate": 4.939521834135905e-06, + "loss": 1.2679, + "step": 3255 + }, + { + "epoch": 0.1, + "learning_rate": 4.939468495266984e-06, + "loss": 1.2571, + "step": 3256 + }, + { + "epoch": 0.1, + "learning_rate": 4.939415133175498e-06, + "loss": 1.2072, + "step": 3257 + }, + { + "epoch": 0.1, + "learning_rate": 4.939361747861955e-06, + "loss": 1.1359, + "step": 3258 + }, + { + "epoch": 0.1, + "learning_rate": 4.9393083393268625e-06, + "loss": 1.2828, + "step": 3259 + }, + { + "epoch": 0.1, + "learning_rate": 4.939254907570729e-06, + "loss": 1.1078, + "step": 3260 + }, + { + "epoch": 0.1, + "learning_rate": 4.939201452594065e-06, + "loss": 1.2144, + "step": 3261 + }, + { + "epoch": 0.1, + "learning_rate": 4.939147974397377e-06, + "loss": 1.083, + "step": 3262 + }, + { + "epoch": 0.1, + "learning_rate": 4.939094472981175e-06, + "loss": 1.1946, + "step": 3263 + }, + { + "epoch": 0.1, + "learning_rate": 4.939040948345969e-06, + "loss": 1.2006, + "step": 3264 + }, + { + "epoch": 0.1, + "learning_rate": 4.938987400492266e-06, + "loss": 1.0947, + "step": 3265 + }, + { + "epoch": 0.1, + "learning_rate": 4.93893382942058e-06, + "loss": 1.196, + "step": 3266 + }, + { + "epoch": 0.1, + "learning_rate": 4.938880235131417e-06, + "loss": 1.2109, + "step": 3267 + }, + { + "epoch": 0.1, + "learning_rate": 4.938826617625289e-06, + "loss": 1.1995, + "step": 3268 + }, + { + "epoch": 0.1, + "learning_rate": 4.938772976902707e-06, + "loss": 1.1738, + "step": 3269 + }, + { + "epoch": 0.1, + "learning_rate": 4.9387193129641806e-06, + "loss": 1.2452, + "step": 3270 + }, + { + "epoch": 0.1, + "learning_rate": 4.93866562581022e-06, + "loss": 1.1177, + "step": 3271 + }, + { + "epoch": 0.1, + "learning_rate": 4.938611915441338e-06, + "loss": 1.0631, + "step": 3272 + }, + { + "epoch": 0.1, + "learning_rate": 4.938558181858044e-06, + "loss": 1.2183, + "step": 3273 + }, + { + "epoch": 0.1, + "learning_rate": 4.938504425060851e-06, + "loss": 1.1512, + "step": 3274 + }, + { + "epoch": 0.1, + "learning_rate": 4.938450645050271e-06, + "loss": 1.1235, + "step": 3275 + }, + { + "epoch": 0.1, + "learning_rate": 4.938396841826815e-06, + "loss": 1.1399, + "step": 3276 + }, + { + "epoch": 0.1, + "learning_rate": 4.938343015390995e-06, + "loss": 1.1996, + "step": 3277 + }, + { + "epoch": 0.1, + "learning_rate": 4.938289165743324e-06, + "loss": 1.2607, + "step": 3278 + }, + { + "epoch": 0.1, + "learning_rate": 4.938235292884314e-06, + "loss": 1.16, + "step": 3279 + }, + { + "epoch": 0.1, + "learning_rate": 4.93818139681448e-06, + "loss": 1.1288, + "step": 3280 + }, + { + "epoch": 0.1, + "learning_rate": 4.938127477534332e-06, + "loss": 1.1241, + "step": 3281 + }, + { + "epoch": 0.1, + "learning_rate": 4.938073535044385e-06, + "loss": 1.1732, + "step": 3282 + }, + { + "epoch": 0.1, + "learning_rate": 4.938019569345152e-06, + "loss": 1.1703, + "step": 3283 + }, + { + "epoch": 0.1, + "learning_rate": 4.937965580437147e-06, + "loss": 1.0999, + "step": 3284 + }, + { + "epoch": 0.1, + "learning_rate": 4.937911568320883e-06, + "loss": 1.079, + "step": 3285 + }, + { + "epoch": 0.1, + "learning_rate": 4.937857532996877e-06, + "loss": 1.2935, + "step": 3286 + }, + { + "epoch": 0.1, + "learning_rate": 4.9378034744656395e-06, + "loss": 1.1606, + "step": 3287 + }, + { + "epoch": 0.1, + "learning_rate": 4.9377493927276875e-06, + "loss": 1.1111, + "step": 3288 + }, + { + "epoch": 0.1, + "learning_rate": 4.937695287783536e-06, + "loss": 1.1775, + "step": 3289 + }, + { + "epoch": 0.1, + "learning_rate": 4.937641159633699e-06, + "loss": 1.0975, + "step": 3290 + }, + { + "epoch": 0.1, + "learning_rate": 4.937587008278691e-06, + "loss": 1.1409, + "step": 3291 + }, + { + "epoch": 0.1, + "learning_rate": 4.937532833719031e-06, + "loss": 1.0377, + "step": 3292 + }, + { + "epoch": 0.1, + "learning_rate": 4.937478635955231e-06, + "loss": 1.3254, + "step": 3293 + }, + { + "epoch": 0.1, + "learning_rate": 4.937424414987808e-06, + "loss": 1.103, + "step": 3294 + }, + { + "epoch": 0.1, + "learning_rate": 4.937370170817279e-06, + "loss": 1.1545, + "step": 3295 + }, + { + "epoch": 0.1, + "learning_rate": 4.9373159034441594e-06, + "loss": 1.0788, + "step": 3296 + }, + { + "epoch": 0.1, + "learning_rate": 4.937261612868966e-06, + "loss": 1.1106, + "step": 3297 + }, + { + "epoch": 0.1, + "learning_rate": 4.937207299092217e-06, + "loss": 1.1582, + "step": 3298 + }, + { + "epoch": 0.1, + "learning_rate": 4.937152962114428e-06, + "loss": 1.2495, + "step": 3299 + }, + { + "epoch": 0.1, + "learning_rate": 4.937098601936116e-06, + "loss": 1.0928, + "step": 3300 + }, + { + "epoch": 0.1, + "learning_rate": 4.9370442185578e-06, + "loss": 1.193, + "step": 3301 + }, + { + "epoch": 0.1, + "learning_rate": 4.936989811979997e-06, + "loss": 1.1707, + "step": 3302 + }, + { + "epoch": 0.1, + "learning_rate": 4.936935382203223e-06, + "loss": 1.1005, + "step": 3303 + }, + { + "epoch": 0.1, + "learning_rate": 4.936880929227998e-06, + "loss": 1.1647, + "step": 3304 + }, + { + "epoch": 0.1, + "learning_rate": 4.936826453054841e-06, + "loss": 1.2374, + "step": 3305 + }, + { + "epoch": 0.1, + "learning_rate": 4.936771953684271e-06, + "loss": 1.1423, + "step": 3306 + }, + { + "epoch": 0.1, + "learning_rate": 4.936717431116804e-06, + "loss": 1.1233, + "step": 3307 + }, + { + "epoch": 0.1, + "learning_rate": 4.936662885352961e-06, + "loss": 1.1556, + "step": 3308 + }, + { + "epoch": 0.1, + "learning_rate": 4.936608316393261e-06, + "loss": 1.0271, + "step": 3309 + }, + { + "epoch": 0.1, + "learning_rate": 4.936553724238222e-06, + "loss": 1.189, + "step": 3310 + }, + { + "epoch": 0.1, + "learning_rate": 4.936499108888366e-06, + "loss": 1.1667, + "step": 3311 + }, + { + "epoch": 0.1, + "learning_rate": 4.936444470344213e-06, + "loss": 1.2149, + "step": 3312 + }, + { + "epoch": 0.1, + "learning_rate": 4.936389808606281e-06, + "loss": 1.1875, + "step": 3313 + }, + { + "epoch": 0.1, + "learning_rate": 4.936335123675091e-06, + "loss": 1.1714, + "step": 3314 + }, + { + "epoch": 0.1, + "learning_rate": 4.9362804155511655e-06, + "loss": 1.1285, + "step": 3315 + }, + { + "epoch": 0.1, + "learning_rate": 4.936225684235022e-06, + "loss": 1.2261, + "step": 3316 + }, + { + "epoch": 0.1, + "learning_rate": 4.936170929727184e-06, + "loss": 1.2345, + "step": 3317 + }, + { + "epoch": 0.1, + "learning_rate": 4.936116152028173e-06, + "loss": 1.1685, + "step": 3318 + }, + { + "epoch": 0.1, + "learning_rate": 4.936061351138509e-06, + "loss": 1.168, + "step": 3319 + }, + { + "epoch": 0.1, + "learning_rate": 4.936006527058713e-06, + "loss": 1.0818, + "step": 3320 + }, + { + "epoch": 0.1, + "learning_rate": 4.935951679789309e-06, + "loss": 1.1556, + "step": 3321 + }, + { + "epoch": 0.1, + "learning_rate": 4.935896809330819e-06, + "loss": 1.0913, + "step": 3322 + }, + { + "epoch": 0.1, + "learning_rate": 4.935841915683763e-06, + "loss": 1.106, + "step": 3323 + }, + { + "epoch": 0.1, + "learning_rate": 4.935786998848666e-06, + "loss": 1.2561, + "step": 3324 + }, + { + "epoch": 0.1, + "learning_rate": 4.93573205882605e-06, + "loss": 1.1467, + "step": 3325 + }, + { + "epoch": 0.1, + "learning_rate": 4.935677095616438e-06, + "loss": 1.1143, + "step": 3326 + }, + { + "epoch": 0.1, + "learning_rate": 4.9356221092203525e-06, + "loss": 1.2142, + "step": 3327 + }, + { + "epoch": 0.1, + "learning_rate": 4.935567099638317e-06, + "loss": 1.2629, + "step": 3328 + }, + { + "epoch": 0.1, + "learning_rate": 4.935512066870857e-06, + "loss": 1.1329, + "step": 3329 + }, + { + "epoch": 0.1, + "learning_rate": 4.9354570109184956e-06, + "loss": 1.0713, + "step": 3330 + }, + { + "epoch": 0.1, + "learning_rate": 4.935401931781754e-06, + "loss": 1.1721, + "step": 3331 + }, + { + "epoch": 0.1, + "learning_rate": 4.9353468294611615e-06, + "loss": 1.2061, + "step": 3332 + }, + { + "epoch": 0.1, + "learning_rate": 4.935291703957239e-06, + "loss": 1.1255, + "step": 3333 + }, + { + "epoch": 0.1, + "learning_rate": 4.935236555270511e-06, + "loss": 1.1553, + "step": 3334 + }, + { + "epoch": 0.1, + "learning_rate": 4.935181383401506e-06, + "loss": 1.2321, + "step": 3335 + }, + { + "epoch": 0.1, + "learning_rate": 4.935126188350746e-06, + "loss": 1.2395, + "step": 3336 + }, + { + "epoch": 0.1, + "learning_rate": 4.935070970118758e-06, + "loss": 1.1923, + "step": 3337 + }, + { + "epoch": 0.1, + "learning_rate": 4.935015728706067e-06, + "loss": 1.2054, + "step": 3338 + }, + { + "epoch": 0.1, + "learning_rate": 4.934960464113199e-06, + "loss": 1.1159, + "step": 3339 + }, + { + "epoch": 0.1, + "learning_rate": 4.934905176340679e-06, + "loss": 1.13, + "step": 3340 + }, + { + "epoch": 0.1, + "learning_rate": 4.934849865389037e-06, + "loss": 1.1716, + "step": 3341 + }, + { + "epoch": 0.1, + "learning_rate": 4.934794531258794e-06, + "loss": 1.1248, + "step": 3342 + }, + { + "epoch": 0.1, + "learning_rate": 4.934739173950481e-06, + "loss": 1.157, + "step": 3343 + }, + { + "epoch": 0.1, + "learning_rate": 4.934683793464624e-06, + "loss": 1.0784, + "step": 3344 + }, + { + "epoch": 0.1, + "learning_rate": 4.93462838980175e-06, + "loss": 1.2245, + "step": 3345 + }, + { + "epoch": 0.1, + "learning_rate": 4.934572962962385e-06, + "loss": 1.1561, + "step": 3346 + }, + { + "epoch": 0.1, + "learning_rate": 4.934517512947059e-06, + "loss": 1.1293, + "step": 3347 + }, + { + "epoch": 0.1, + "learning_rate": 4.934462039756299e-06, + "loss": 1.1183, + "step": 3348 + }, + { + "epoch": 0.1, + "learning_rate": 4.9344065433906315e-06, + "loss": 1.1609, + "step": 3349 + }, + { + "epoch": 0.1, + "learning_rate": 4.9343510238505876e-06, + "loss": 1.1381, + "step": 3350 + }, + { + "epoch": 0.1, + "learning_rate": 4.934295481136694e-06, + "loss": 1.1951, + "step": 3351 + }, + { + "epoch": 0.1, + "learning_rate": 4.934239915249479e-06, + "loss": 1.124, + "step": 3352 + }, + { + "epoch": 0.1, + "learning_rate": 4.934184326189474e-06, + "loss": 1.1193, + "step": 3353 + }, + { + "epoch": 0.1, + "learning_rate": 4.934128713957205e-06, + "loss": 1.0648, + "step": 3354 + }, + { + "epoch": 0.1, + "learning_rate": 4.934073078553204e-06, + "loss": 1.282, + "step": 3355 + }, + { + "epoch": 0.1, + "learning_rate": 4.934017419977999e-06, + "loss": 1.1743, + "step": 3356 + }, + { + "epoch": 0.1, + "learning_rate": 4.9339617382321205e-06, + "loss": 1.2332, + "step": 3357 + }, + { + "epoch": 0.1, + "learning_rate": 4.933906033316098e-06, + "loss": 1.2386, + "step": 3358 + }, + { + "epoch": 0.1, + "learning_rate": 4.933850305230463e-06, + "loss": 1.0814, + "step": 3359 + }, + { + "epoch": 0.1, + "learning_rate": 4.933794553975746e-06, + "loss": 1.2441, + "step": 3360 + }, + { + "epoch": 0.1, + "learning_rate": 4.933738779552476e-06, + "loss": 1.3041, + "step": 3361 + }, + { + "epoch": 0.1, + "learning_rate": 4.933682981961184e-06, + "loss": 1.1505, + "step": 3362 + }, + { + "epoch": 0.1, + "learning_rate": 4.933627161202403e-06, + "loss": 1.1757, + "step": 3363 + }, + { + "epoch": 0.1, + "learning_rate": 4.933571317276664e-06, + "loss": 1.1968, + "step": 3364 + }, + { + "epoch": 0.1, + "learning_rate": 4.933515450184498e-06, + "loss": 1.155, + "step": 3365 + }, + { + "epoch": 0.1, + "learning_rate": 4.933459559926437e-06, + "loss": 1.1531, + "step": 3366 + }, + { + "epoch": 0.1, + "learning_rate": 4.933403646503012e-06, + "loss": 1.2979, + "step": 3367 + }, + { + "epoch": 0.1, + "learning_rate": 4.9333477099147575e-06, + "loss": 1.2175, + "step": 3368 + }, + { + "epoch": 0.1, + "learning_rate": 4.933291750162204e-06, + "loss": 1.1884, + "step": 3369 + }, + { + "epoch": 0.1, + "learning_rate": 4.9332357672458855e-06, + "loss": 1.2201, + "step": 3370 + }, + { + "epoch": 0.1, + "learning_rate": 4.933179761166334e-06, + "loss": 1.111, + "step": 3371 + }, + { + "epoch": 0.1, + "learning_rate": 4.9331237319240825e-06, + "loss": 1.0825, + "step": 3372 + }, + { + "epoch": 0.1, + "learning_rate": 4.933067679519665e-06, + "loss": 1.1298, + "step": 3373 + }, + { + "epoch": 0.1, + "learning_rate": 4.933011603953616e-06, + "loss": 1.276, + "step": 3374 + }, + { + "epoch": 0.1, + "learning_rate": 4.932955505226468e-06, + "loss": 1.2413, + "step": 3375 + }, + { + "epoch": 0.1, + "learning_rate": 4.932899383338755e-06, + "loss": 1.1909, + "step": 3376 + }, + { + "epoch": 0.1, + "learning_rate": 4.932843238291012e-06, + "loss": 1.1685, + "step": 3377 + }, + { + "epoch": 0.1, + "learning_rate": 4.932787070083772e-06, + "loss": 1.0543, + "step": 3378 + }, + { + "epoch": 0.1, + "learning_rate": 4.932730878717572e-06, + "loss": 1.1591, + "step": 3379 + }, + { + "epoch": 0.1, + "learning_rate": 4.9326746641929454e-06, + "loss": 1.0785, + "step": 3380 + }, + { + "epoch": 0.1, + "learning_rate": 4.932618426510427e-06, + "loss": 1.2025, + "step": 3381 + }, + { + "epoch": 0.1, + "learning_rate": 4.9325621656705535e-06, + "loss": 1.2467, + "step": 3382 + }, + { + "epoch": 0.1, + "learning_rate": 4.932505881673859e-06, + "loss": 1.1617, + "step": 3383 + }, + { + "epoch": 0.1, + "learning_rate": 4.93244957452088e-06, + "loss": 1.1282, + "step": 3384 + }, + { + "epoch": 0.1, + "learning_rate": 4.932393244212154e-06, + "loss": 1.1138, + "step": 3385 + }, + { + "epoch": 0.1, + "learning_rate": 4.932336890748215e-06, + "loss": 1.1248, + "step": 3386 + }, + { + "epoch": 0.1, + "learning_rate": 4.932280514129599e-06, + "loss": 1.1731, + "step": 3387 + }, + { + "epoch": 0.1, + "learning_rate": 4.932224114356846e-06, + "loss": 1.2731, + "step": 3388 + }, + { + "epoch": 0.1, + "learning_rate": 4.93216769143049e-06, + "loss": 1.2245, + "step": 3389 + }, + { + "epoch": 0.1, + "learning_rate": 4.932111245351069e-06, + "loss": 1.1549, + "step": 3390 + }, + { + "epoch": 0.1, + "learning_rate": 4.932054776119119e-06, + "loss": 1.1214, + "step": 3391 + }, + { + "epoch": 0.1, + "learning_rate": 4.93199828373518e-06, + "loss": 1.1395, + "step": 3392 + }, + { + "epoch": 0.1, + "learning_rate": 4.931941768199789e-06, + "loss": 1.1882, + "step": 3393 + }, + { + "epoch": 0.1, + "learning_rate": 4.931885229513483e-06, + "loss": 1.2229, + "step": 3394 + }, + { + "epoch": 0.1, + "learning_rate": 4.931828667676801e-06, + "loss": 1.2153, + "step": 3395 + }, + { + "epoch": 0.1, + "learning_rate": 4.931772082690281e-06, + "loss": 1.1734, + "step": 3396 + }, + { + "epoch": 0.1, + "learning_rate": 4.9317154745544624e-06, + "loss": 1.1954, + "step": 3397 + }, + { + "epoch": 0.1, + "learning_rate": 4.931658843269884e-06, + "loss": 1.1566, + "step": 3398 + }, + { + "epoch": 0.1, + "learning_rate": 4.931602188837084e-06, + "loss": 1.2188, + "step": 3399 + }, + { + "epoch": 0.1, + "learning_rate": 4.9315455112566024e-06, + "loss": 1.1617, + "step": 3400 + }, + { + "epoch": 0.1, + "learning_rate": 4.931488810528978e-06, + "loss": 1.2358, + "step": 3401 + }, + { + "epoch": 0.1, + "learning_rate": 4.931432086654752e-06, + "loss": 1.1324, + "step": 3402 + }, + { + "epoch": 0.1, + "learning_rate": 4.931375339634464e-06, + "loss": 1.1686, + "step": 3403 + }, + { + "epoch": 0.1, + "learning_rate": 4.931318569468652e-06, + "loss": 1.0759, + "step": 3404 + }, + { + "epoch": 0.1, + "learning_rate": 4.93126177615786e-06, + "loss": 1.1357, + "step": 3405 + }, + { + "epoch": 0.1, + "learning_rate": 4.931204959702626e-06, + "loss": 1.0846, + "step": 3406 + }, + { + "epoch": 0.1, + "learning_rate": 4.9311481201034915e-06, + "loss": 1.1639, + "step": 3407 + }, + { + "epoch": 0.1, + "learning_rate": 4.931091257360998e-06, + "loss": 1.2931, + "step": 3408 + }, + { + "epoch": 0.1, + "learning_rate": 4.931034371475686e-06, + "loss": 1.1605, + "step": 3409 + }, + { + "epoch": 0.1, + "learning_rate": 4.930977462448098e-06, + "loss": 1.2118, + "step": 3410 + }, + { + "epoch": 0.1, + "learning_rate": 4.930920530278776e-06, + "loss": 1.1773, + "step": 3411 + }, + { + "epoch": 0.1, + "learning_rate": 4.930863574968261e-06, + "loss": 1.1764, + "step": 3412 + }, + { + "epoch": 0.1, + "learning_rate": 4.930806596517095e-06, + "loss": 1.1806, + "step": 3413 + }, + { + "epoch": 0.1, + "learning_rate": 4.930749594925821e-06, + "loss": 1.0569, + "step": 3414 + }, + { + "epoch": 0.1, + "learning_rate": 4.930692570194983e-06, + "loss": 1.0665, + "step": 3415 + }, + { + "epoch": 0.1, + "learning_rate": 4.93063552232512e-06, + "loss": 1.1355, + "step": 3416 + }, + { + "epoch": 0.1, + "learning_rate": 4.930578451316779e-06, + "loss": 1.1921, + "step": 3417 + }, + { + "epoch": 0.1, + "learning_rate": 4.930521357170501e-06, + "loss": 1.0889, + "step": 3418 + }, + { + "epoch": 0.1, + "learning_rate": 4.930464239886832e-06, + "loss": 1.1192, + "step": 3419 + }, + { + "epoch": 0.1, + "learning_rate": 4.930407099466312e-06, + "loss": 1.0779, + "step": 3420 + }, + { + "epoch": 0.1, + "learning_rate": 4.930349935909488e-06, + "loss": 1.1828, + "step": 3421 + }, + { + "epoch": 0.1, + "learning_rate": 4.930292749216902e-06, + "loss": 1.1103, + "step": 3422 + }, + { + "epoch": 0.1, + "learning_rate": 4.930235539389101e-06, + "loss": 1.1831, + "step": 3423 + }, + { + "epoch": 0.1, + "learning_rate": 4.9301783064266265e-06, + "loss": 1.2289, + "step": 3424 + }, + { + "epoch": 0.1, + "learning_rate": 4.9301210503300264e-06, + "loss": 1.0843, + "step": 3425 + }, + { + "epoch": 0.1, + "learning_rate": 4.930063771099844e-06, + "loss": 1.1751, + "step": 3426 + }, + { + "epoch": 0.1, + "learning_rate": 4.930006468736624e-06, + "loss": 1.161, + "step": 3427 + }, + { + "epoch": 0.1, + "learning_rate": 4.929949143240913e-06, + "loss": 1.0482, + "step": 3428 + }, + { + "epoch": 0.1, + "learning_rate": 4.929891794613257e-06, + "loss": 1.276, + "step": 3429 + }, + { + "epoch": 0.1, + "learning_rate": 4.929834422854201e-06, + "loss": 1.1403, + "step": 3430 + }, + { + "epoch": 0.1, + "learning_rate": 4.929777027964292e-06, + "loss": 1.1631, + "step": 3431 + }, + { + "epoch": 0.1, + "learning_rate": 4.929719609944076e-06, + "loss": 1.2028, + "step": 3432 + }, + { + "epoch": 0.1, + "learning_rate": 4.929662168794098e-06, + "loss": 1.108, + "step": 3433 + }, + { + "epoch": 0.1, + "learning_rate": 4.929604704514907e-06, + "loss": 1.0583, + "step": 3434 + }, + { + "epoch": 0.1, + "learning_rate": 4.92954721710705e-06, + "loss": 1.196, + "step": 3435 + }, + { + "epoch": 0.1, + "learning_rate": 4.9294897065710735e-06, + "loss": 1.2368, + "step": 3436 + }, + { + "epoch": 0.1, + "learning_rate": 4.929432172907525e-06, + "loss": 1.2068, + "step": 3437 + }, + { + "epoch": 0.1, + "learning_rate": 4.929374616116952e-06, + "loss": 1.1431, + "step": 3438 + }, + { + "epoch": 0.1, + "learning_rate": 4.929317036199903e-06, + "loss": 1.1902, + "step": 3439 + }, + { + "epoch": 0.1, + "learning_rate": 4.929259433156926e-06, + "loss": 1.1426, + "step": 3440 + }, + { + "epoch": 0.1, + "learning_rate": 4.929201806988569e-06, + "loss": 1.1915, + "step": 3441 + }, + { + "epoch": 0.1, + "learning_rate": 4.92914415769538e-06, + "loss": 1.2585, + "step": 3442 + }, + { + "epoch": 0.1, + "learning_rate": 4.92908648527791e-06, + "loss": 1.2078, + "step": 3443 + }, + { + "epoch": 0.1, + "learning_rate": 4.929028789736705e-06, + "loss": 1.3217, + "step": 3444 + }, + { + "epoch": 0.1, + "learning_rate": 4.9289710710723175e-06, + "loss": 1.1298, + "step": 3445 + }, + { + "epoch": 0.1, + "learning_rate": 4.928913329285293e-06, + "loss": 1.183, + "step": 3446 + }, + { + "epoch": 0.1, + "learning_rate": 4.928855564376185e-06, + "loss": 1.0795, + "step": 3447 + }, + { + "epoch": 0.1, + "learning_rate": 4.928797776345542e-06, + "loss": 1.0203, + "step": 3448 + }, + { + "epoch": 0.1, + "learning_rate": 4.928739965193913e-06, + "loss": 1.1268, + "step": 3449 + }, + { + "epoch": 0.1, + "learning_rate": 4.928682130921849e-06, + "loss": 1.1587, + "step": 3450 + }, + { + "epoch": 0.1, + "learning_rate": 4.928624273529902e-06, + "loss": 1.1679, + "step": 3451 + }, + { + "epoch": 0.1, + "learning_rate": 4.92856639301862e-06, + "loss": 1.0667, + "step": 3452 + }, + { + "epoch": 0.1, + "learning_rate": 4.928508489388557e-06, + "loss": 1.1591, + "step": 3453 + }, + { + "epoch": 0.1, + "learning_rate": 4.928450562640262e-06, + "loss": 1.0694, + "step": 3454 + }, + { + "epoch": 0.1, + "learning_rate": 4.928392612774288e-06, + "loss": 1.101, + "step": 3455 + }, + { + "epoch": 0.1, + "learning_rate": 4.928334639791185e-06, + "loss": 1.2019, + "step": 3456 + }, + { + "epoch": 0.1, + "learning_rate": 4.928276643691507e-06, + "loss": 1.1002, + "step": 3457 + }, + { + "epoch": 0.1, + "learning_rate": 4.928218624475803e-06, + "loss": 1.0591, + "step": 3458 + }, + { + "epoch": 0.1, + "learning_rate": 4.928160582144628e-06, + "loss": 1.0807, + "step": 3459 + }, + { + "epoch": 0.1, + "learning_rate": 4.928102516698535e-06, + "loss": 1.2179, + "step": 3460 + }, + { + "epoch": 0.1, + "learning_rate": 4.928044428138075e-06, + "loss": 1.1128, + "step": 3461 + }, + { + "epoch": 0.1, + "learning_rate": 4.9279863164638e-06, + "loss": 1.137, + "step": 3462 + }, + { + "epoch": 0.1, + "learning_rate": 4.9279281816762655e-06, + "loss": 1.3337, + "step": 3463 + }, + { + "epoch": 0.1, + "learning_rate": 4.927870023776024e-06, + "loss": 1.1205, + "step": 3464 + }, + { + "epoch": 0.1, + "learning_rate": 4.927811842763629e-06, + "loss": 1.0752, + "step": 3465 + }, + { + "epoch": 0.1, + "learning_rate": 4.9277536386396355e-06, + "loss": 1.1647, + "step": 3466 + }, + { + "epoch": 0.1, + "learning_rate": 4.927695411404595e-06, + "loss": 1.2195, + "step": 3467 + }, + { + "epoch": 0.1, + "learning_rate": 4.927637161059065e-06, + "loss": 1.2367, + "step": 3468 + }, + { + "epoch": 0.1, + "learning_rate": 4.927578887603597e-06, + "loss": 1.2635, + "step": 3469 + }, + { + "epoch": 0.1, + "learning_rate": 4.927520591038748e-06, + "loss": 1.1798, + "step": 3470 + }, + { + "epoch": 0.1, + "learning_rate": 4.927462271365072e-06, + "loss": 1.2372, + "step": 3471 + }, + { + "epoch": 0.1, + "learning_rate": 4.927403928583124e-06, + "loss": 1.1016, + "step": 3472 + }, + { + "epoch": 0.1, + "learning_rate": 4.927345562693459e-06, + "loss": 1.1756, + "step": 3473 + }, + { + "epoch": 0.1, + "learning_rate": 4.927287173696634e-06, + "loss": 1.2414, + "step": 3474 + }, + { + "epoch": 0.1, + "learning_rate": 4.927228761593205e-06, + "loss": 1.1159, + "step": 3475 + }, + { + "epoch": 0.1, + "learning_rate": 4.927170326383726e-06, + "loss": 1.2666, + "step": 3476 + }, + { + "epoch": 0.1, + "learning_rate": 4.9271118680687554e-06, + "loss": 1.1105, + "step": 3477 + }, + { + "epoch": 0.1, + "learning_rate": 4.927053386648848e-06, + "loss": 1.0909, + "step": 3478 + }, + { + "epoch": 0.1, + "learning_rate": 4.9269948821245616e-06, + "loss": 1.1592, + "step": 3479 + }, + { + "epoch": 0.1, + "learning_rate": 4.9269363544964525e-06, + "loss": 1.1574, + "step": 3480 + }, + { + "epoch": 0.1, + "learning_rate": 4.9268778037650785e-06, + "loss": 1.1025, + "step": 3481 + }, + { + "epoch": 0.1, + "learning_rate": 4.926819229930997e-06, + "loss": 1.0784, + "step": 3482 + }, + { + "epoch": 0.1, + "learning_rate": 4.926760632994764e-06, + "loss": 1.0974, + "step": 3483 + }, + { + "epoch": 0.1, + "learning_rate": 4.92670201295694e-06, + "loss": 1.2345, + "step": 3484 + }, + { + "epoch": 0.1, + "learning_rate": 4.92664336981808e-06, + "loss": 1.0013, + "step": 3485 + }, + { + "epoch": 0.11, + "learning_rate": 4.926584703578745e-06, + "loss": 1.1995, + "step": 3486 + }, + { + "epoch": 0.11, + "learning_rate": 4.9265260142394925e-06, + "loss": 1.2115, + "step": 3487 + }, + { + "epoch": 0.11, + "learning_rate": 4.92646730180088e-06, + "loss": 1.1637, + "step": 3488 + }, + { + "epoch": 0.11, + "learning_rate": 4.926408566263468e-06, + "loss": 1.2194, + "step": 3489 + }, + { + "epoch": 0.11, + "learning_rate": 4.9263498076278146e-06, + "loss": 1.157, + "step": 3490 + }, + { + "epoch": 0.11, + "learning_rate": 4.92629102589448e-06, + "loss": 1.0804, + "step": 3491 + }, + { + "epoch": 0.11, + "learning_rate": 4.926232221064023e-06, + "loss": 1.1135, + "step": 3492 + }, + { + "epoch": 0.11, + "learning_rate": 4.926173393137005e-06, + "loss": 1.2081, + "step": 3493 + }, + { + "epoch": 0.11, + "learning_rate": 4.926114542113983e-06, + "loss": 1.0988, + "step": 3494 + }, + { + "epoch": 0.11, + "learning_rate": 4.926055667995521e-06, + "loss": 1.2161, + "step": 3495 + }, + { + "epoch": 0.11, + "learning_rate": 4.9259967707821755e-06, + "loss": 1.1963, + "step": 3496 + }, + { + "epoch": 0.11, + "learning_rate": 4.92593785047451e-06, + "loss": 1.2029, + "step": 3497 + }, + { + "epoch": 0.11, + "learning_rate": 4.925878907073085e-06, + "loss": 1.1039, + "step": 3498 + }, + { + "epoch": 0.11, + "learning_rate": 4.92581994057846e-06, + "loss": 1.1082, + "step": 3499 + }, + { + "epoch": 0.11, + "learning_rate": 4.925760950991198e-06, + "loss": 1.2742, + "step": 3500 + }, + { + "epoch": 0.11, + "learning_rate": 4.925701938311861e-06, + "loss": 1.1989, + "step": 3501 + }, + { + "epoch": 0.11, + "learning_rate": 4.925642902541009e-06, + "loss": 1.1265, + "step": 3502 + }, + { + "epoch": 0.11, + "learning_rate": 4.925583843679205e-06, + "loss": 1.0261, + "step": 3503 + }, + { + "epoch": 0.11, + "learning_rate": 4.925524761727011e-06, + "loss": 1.1196, + "step": 3504 + }, + { + "epoch": 0.11, + "learning_rate": 4.925465656684989e-06, + "loss": 1.1654, + "step": 3505 + }, + { + "epoch": 0.11, + "learning_rate": 4.925406528553702e-06, + "loss": 1.1317, + "step": 3506 + }, + { + "epoch": 0.11, + "learning_rate": 4.9253473773337135e-06, + "loss": 1.2106, + "step": 3507 + }, + { + "epoch": 0.11, + "learning_rate": 4.925288203025585e-06, + "loss": 1.1327, + "step": 3508 + }, + { + "epoch": 0.11, + "learning_rate": 4.9252290056298824e-06, + "loss": 1.22, + "step": 3509 + }, + { + "epoch": 0.11, + "learning_rate": 4.925169785147167e-06, + "loss": 1.1777, + "step": 3510 + }, + { + "epoch": 0.11, + "learning_rate": 4.925110541578003e-06, + "loss": 1.2552, + "step": 3511 + }, + { + "epoch": 0.11, + "learning_rate": 4.925051274922955e-06, + "loss": 1.2845, + "step": 3512 + }, + { + "epoch": 0.11, + "learning_rate": 4.924991985182587e-06, + "loss": 1.1943, + "step": 3513 + }, + { + "epoch": 0.11, + "learning_rate": 4.924932672357463e-06, + "loss": 1.0872, + "step": 3514 + }, + { + "epoch": 0.11, + "learning_rate": 4.924873336448147e-06, + "loss": 1.1602, + "step": 3515 + }, + { + "epoch": 0.11, + "learning_rate": 4.9248139774552066e-06, + "loss": 1.1207, + "step": 3516 + }, + { + "epoch": 0.11, + "learning_rate": 4.924754595379203e-06, + "loss": 1.2198, + "step": 3517 + }, + { + "epoch": 0.11, + "learning_rate": 4.924695190220704e-06, + "loss": 1.3135, + "step": 3518 + }, + { + "epoch": 0.11, + "learning_rate": 4.924635761980275e-06, + "loss": 1.0959, + "step": 3519 + }, + { + "epoch": 0.11, + "learning_rate": 4.924576310658482e-06, + "loss": 1.1465, + "step": 3520 + }, + { + "epoch": 0.11, + "learning_rate": 4.924516836255888e-06, + "loss": 1.1741, + "step": 3521 + }, + { + "epoch": 0.11, + "learning_rate": 4.924457338773063e-06, + "loss": 1.1625, + "step": 3522 + }, + { + "epoch": 0.11, + "learning_rate": 4.9243978182105725e-06, + "loss": 1.1263, + "step": 3523 + }, + { + "epoch": 0.11, + "learning_rate": 4.924338274568981e-06, + "loss": 1.3348, + "step": 3524 + }, + { + "epoch": 0.11, + "learning_rate": 4.924278707848858e-06, + "loss": 1.037, + "step": 3525 + }, + { + "epoch": 0.11, + "learning_rate": 4.924219118050768e-06, + "loss": 1.0818, + "step": 3526 + }, + { + "epoch": 0.11, + "learning_rate": 4.92415950517528e-06, + "loss": 1.0959, + "step": 3527 + }, + { + "epoch": 0.11, + "learning_rate": 4.9240998692229605e-06, + "loss": 1.1094, + "step": 3528 + }, + { + "epoch": 0.11, + "learning_rate": 4.9240402101943786e-06, + "loss": 1.1663, + "step": 3529 + }, + { + "epoch": 0.11, + "learning_rate": 4.923980528090101e-06, + "loss": 1.207, + "step": 3530 + }, + { + "epoch": 0.11, + "learning_rate": 4.923920822910696e-06, + "loss": 1.1185, + "step": 3531 + }, + { + "epoch": 0.11, + "learning_rate": 4.923861094656732e-06, + "loss": 1.1317, + "step": 3532 + }, + { + "epoch": 0.11, + "learning_rate": 4.923801343328779e-06, + "loss": 1.1742, + "step": 3533 + }, + { + "epoch": 0.11, + "learning_rate": 4.923741568927404e-06, + "loss": 1.2179, + "step": 3534 + }, + { + "epoch": 0.11, + "learning_rate": 4.923681771453176e-06, + "loss": 1.2127, + "step": 3535 + }, + { + "epoch": 0.11, + "learning_rate": 4.923621950906665e-06, + "loss": 1.2599, + "step": 3536 + }, + { + "epoch": 0.11, + "learning_rate": 4.92356210728844e-06, + "loss": 0.977, + "step": 3537 + }, + { + "epoch": 0.11, + "learning_rate": 4.923502240599072e-06, + "loss": 1.1709, + "step": 3538 + }, + { + "epoch": 0.11, + "learning_rate": 4.923442350839129e-06, + "loss": 1.1567, + "step": 3539 + }, + { + "epoch": 0.11, + "learning_rate": 4.923382438009182e-06, + "loss": 1.1774, + "step": 3540 + }, + { + "epoch": 0.11, + "learning_rate": 4.923322502109801e-06, + "loss": 1.1028, + "step": 3541 + }, + { + "epoch": 0.11, + "learning_rate": 4.923262543141558e-06, + "loss": 1.2083, + "step": 3542 + }, + { + "epoch": 0.11, + "learning_rate": 4.923202561105022e-06, + "loss": 1.2598, + "step": 3543 + }, + { + "epoch": 0.11, + "learning_rate": 4.923142556000765e-06, + "loss": 1.0657, + "step": 3544 + }, + { + "epoch": 0.11, + "learning_rate": 4.923082527829357e-06, + "loss": 1.2072, + "step": 3545 + }, + { + "epoch": 0.11, + "learning_rate": 4.923022476591371e-06, + "loss": 1.1859, + "step": 3546 + }, + { + "epoch": 0.11, + "learning_rate": 4.922962402287379e-06, + "loss": 1.22, + "step": 3547 + }, + { + "epoch": 0.11, + "learning_rate": 4.922902304917951e-06, + "loss": 1.2292, + "step": 3548 + }, + { + "epoch": 0.11, + "learning_rate": 4.9228421844836594e-06, + "loss": 1.1436, + "step": 3549 + }, + { + "epoch": 0.11, + "learning_rate": 4.922782040985077e-06, + "loss": 1.1429, + "step": 3550 + }, + { + "epoch": 0.11, + "learning_rate": 4.922721874422777e-06, + "loss": 1.1891, + "step": 3551 + }, + { + "epoch": 0.11, + "learning_rate": 4.922661684797332e-06, + "loss": 1.047, + "step": 3552 + }, + { + "epoch": 0.11, + "learning_rate": 4.922601472109313e-06, + "loss": 1.0425, + "step": 3553 + }, + { + "epoch": 0.11, + "learning_rate": 4.922541236359296e-06, + "loss": 1.1476, + "step": 3554 + }, + { + "epoch": 0.11, + "learning_rate": 4.922480977547853e-06, + "loss": 1.1392, + "step": 3555 + }, + { + "epoch": 0.11, + "learning_rate": 4.922420695675559e-06, + "loss": 1.1694, + "step": 3556 + }, + { + "epoch": 0.11, + "learning_rate": 4.9223603907429845e-06, + "loss": 1.2326, + "step": 3557 + }, + { + "epoch": 0.11, + "learning_rate": 4.9223000627507065e-06, + "loss": 1.1963, + "step": 3558 + }, + { + "epoch": 0.11, + "learning_rate": 4.922239711699299e-06, + "loss": 1.0914, + "step": 3559 + }, + { + "epoch": 0.11, + "learning_rate": 4.922179337589336e-06, + "loss": 1.1835, + "step": 3560 + }, + { + "epoch": 0.11, + "learning_rate": 4.922118940421392e-06, + "loss": 1.1022, + "step": 3561 + }, + { + "epoch": 0.11, + "learning_rate": 4.922058520196042e-06, + "loss": 1.1613, + "step": 3562 + }, + { + "epoch": 0.11, + "learning_rate": 4.921998076913861e-06, + "loss": 1.3109, + "step": 3563 + }, + { + "epoch": 0.11, + "learning_rate": 4.921937610575426e-06, + "loss": 1.3114, + "step": 3564 + }, + { + "epoch": 0.11, + "learning_rate": 4.9218771211813105e-06, + "loss": 1.0707, + "step": 3565 + }, + { + "epoch": 0.11, + "learning_rate": 4.9218166087320916e-06, + "loss": 1.1171, + "step": 3566 + }, + { + "epoch": 0.11, + "learning_rate": 4.921756073228345e-06, + "loss": 1.2383, + "step": 3567 + }, + { + "epoch": 0.11, + "learning_rate": 4.921695514670647e-06, + "loss": 1.1896, + "step": 3568 + }, + { + "epoch": 0.11, + "learning_rate": 4.9216349330595735e-06, + "loss": 1.2147, + "step": 3569 + }, + { + "epoch": 0.11, + "learning_rate": 4.921574328395702e-06, + "loss": 1.187, + "step": 3570 + }, + { + "epoch": 0.11, + "learning_rate": 4.92151370067961e-06, + "loss": 1.0742, + "step": 3571 + }, + { + "epoch": 0.11, + "learning_rate": 4.921453049911872e-06, + "loss": 1.1075, + "step": 3572 + }, + { + "epoch": 0.11, + "learning_rate": 4.921392376093068e-06, + "loss": 1.1472, + "step": 3573 + }, + { + "epoch": 0.11, + "learning_rate": 4.921331679223775e-06, + "loss": 1.1713, + "step": 3574 + }, + { + "epoch": 0.11, + "learning_rate": 4.921270959304571e-06, + "loss": 1.2493, + "step": 3575 + }, + { + "epoch": 0.11, + "learning_rate": 4.9212102163360334e-06, + "loss": 1.1574, + "step": 3576 + }, + { + "epoch": 0.11, + "learning_rate": 4.92114945031874e-06, + "loss": 1.0933, + "step": 3577 + }, + { + "epoch": 0.11, + "learning_rate": 4.92108866125327e-06, + "loss": 1.1713, + "step": 3578 + }, + { + "epoch": 0.11, + "learning_rate": 4.921027849140203e-06, + "loss": 1.1281, + "step": 3579 + }, + { + "epoch": 0.11, + "learning_rate": 4.920967013980116e-06, + "loss": 1.1271, + "step": 3580 + }, + { + "epoch": 0.11, + "learning_rate": 4.9209061557735894e-06, + "loss": 1.1141, + "step": 3581 + }, + { + "epoch": 0.11, + "learning_rate": 4.9208452745212015e-06, + "loss": 1.097, + "step": 3582 + }, + { + "epoch": 0.11, + "learning_rate": 4.920784370223533e-06, + "loss": 1.1538, + "step": 3583 + }, + { + "epoch": 0.11, + "learning_rate": 4.920723442881164e-06, + "loss": 1.1877, + "step": 3584 + }, + { + "epoch": 0.11, + "learning_rate": 4.9206624924946715e-06, + "loss": 1.224, + "step": 3585 + }, + { + "epoch": 0.11, + "learning_rate": 4.92060151906464e-06, + "loss": 1.15, + "step": 3586 + }, + { + "epoch": 0.11, + "learning_rate": 4.9205405225916466e-06, + "loss": 1.1931, + "step": 3587 + }, + { + "epoch": 0.11, + "learning_rate": 4.920479503076273e-06, + "loss": 1.1834, + "step": 3588 + }, + { + "epoch": 0.11, + "learning_rate": 4.920418460519102e-06, + "loss": 1.2601, + "step": 3589 + }, + { + "epoch": 0.11, + "learning_rate": 4.920357394920711e-06, + "loss": 1.0837, + "step": 3590 + }, + { + "epoch": 0.11, + "learning_rate": 4.920296306281684e-06, + "loss": 1.2236, + "step": 3591 + }, + { + "epoch": 0.11, + "learning_rate": 4.9202351946026024e-06, + "loss": 1.241, + "step": 3592 + }, + { + "epoch": 0.11, + "learning_rate": 4.9201740598840465e-06, + "loss": 1.2531, + "step": 3593 + }, + { + "epoch": 0.11, + "learning_rate": 4.920112902126599e-06, + "loss": 1.0288, + "step": 3594 + }, + { + "epoch": 0.11, + "learning_rate": 4.920051721330844e-06, + "loss": 1.1758, + "step": 3595 + }, + { + "epoch": 0.11, + "learning_rate": 4.9199905174973605e-06, + "loss": 1.1531, + "step": 3596 + }, + { + "epoch": 0.11, + "learning_rate": 4.9199292906267335e-06, + "loss": 1.1441, + "step": 3597 + }, + { + "epoch": 0.11, + "learning_rate": 4.9198680407195445e-06, + "loss": 1.16, + "step": 3598 + }, + { + "epoch": 0.11, + "learning_rate": 4.919806767776378e-06, + "loss": 1.1661, + "step": 3599 + }, + { + "epoch": 0.11, + "learning_rate": 4.919745471797815e-06, + "loss": 1.1763, + "step": 3600 + }, + { + "epoch": 0.11, + "learning_rate": 4.919684152784442e-06, + "loss": 1.1813, + "step": 3601 + }, + { + "epoch": 0.11, + "learning_rate": 4.919622810736841e-06, + "loss": 1.1475, + "step": 3602 + }, + { + "epoch": 0.11, + "learning_rate": 4.919561445655596e-06, + "loss": 1.0714, + "step": 3603 + }, + { + "epoch": 0.11, + "learning_rate": 4.919500057541292e-06, + "loss": 1.2421, + "step": 3604 + }, + { + "epoch": 0.11, + "learning_rate": 4.919438646394511e-06, + "loss": 1.1782, + "step": 3605 + }, + { + "epoch": 0.11, + "learning_rate": 4.9193772122158416e-06, + "loss": 1.1196, + "step": 3606 + }, + { + "epoch": 0.11, + "learning_rate": 4.919315755005864e-06, + "loss": 1.1804, + "step": 3607 + }, + { + "epoch": 0.11, + "learning_rate": 4.919254274765168e-06, + "loss": 1.2288, + "step": 3608 + }, + { + "epoch": 0.11, + "learning_rate": 4.919192771494335e-06, + "loss": 1.0918, + "step": 3609 + }, + { + "epoch": 0.11, + "learning_rate": 4.919131245193951e-06, + "loss": 1.2185, + "step": 3610 + }, + { + "epoch": 0.11, + "learning_rate": 4.919069695864604e-06, + "loss": 1.2608, + "step": 3611 + }, + { + "epoch": 0.11, + "learning_rate": 4.919008123506878e-06, + "loss": 1.159, + "step": 3612 + }, + { + "epoch": 0.11, + "learning_rate": 4.91894652812136e-06, + "loss": 1.1128, + "step": 3613 + }, + { + "epoch": 0.11, + "learning_rate": 4.918884909708637e-06, + "loss": 1.1409, + "step": 3614 + }, + { + "epoch": 0.11, + "learning_rate": 4.9188232682692925e-06, + "loss": 1.1243, + "step": 3615 + }, + { + "epoch": 0.11, + "learning_rate": 4.918761603803917e-06, + "loss": 1.1956, + "step": 3616 + }, + { + "epoch": 0.11, + "learning_rate": 4.918699916313096e-06, + "loss": 1.1477, + "step": 3617 + }, + { + "epoch": 0.11, + "learning_rate": 4.918638205797416e-06, + "loss": 1.2828, + "step": 3618 + }, + { + "epoch": 0.11, + "learning_rate": 4.918576472257465e-06, + "loss": 1.1533, + "step": 3619 + }, + { + "epoch": 0.11, + "learning_rate": 4.9185147156938315e-06, + "loss": 1.1677, + "step": 3620 + }, + { + "epoch": 0.11, + "learning_rate": 4.918452936107102e-06, + "loss": 1.1226, + "step": 3621 + }, + { + "epoch": 0.11, + "learning_rate": 4.918391133497867e-06, + "loss": 1.0166, + "step": 3622 + }, + { + "epoch": 0.11, + "learning_rate": 4.918329307866711e-06, + "loss": 1.1672, + "step": 3623 + }, + { + "epoch": 0.11, + "learning_rate": 4.9182674592142254e-06, + "loss": 1.2058, + "step": 3624 + }, + { + "epoch": 0.11, + "learning_rate": 4.918205587540998e-06, + "loss": 1.2291, + "step": 3625 + }, + { + "epoch": 0.11, + "learning_rate": 4.918143692847619e-06, + "loss": 1.2146, + "step": 3626 + }, + { + "epoch": 0.11, + "learning_rate": 4.918081775134676e-06, + "loss": 1.1763, + "step": 3627 + }, + { + "epoch": 0.11, + "learning_rate": 4.91801983440276e-06, + "loss": 1.076, + "step": 3628 + }, + { + "epoch": 0.11, + "learning_rate": 4.9179578706524585e-06, + "loss": 1.0945, + "step": 3629 + }, + { + "epoch": 0.11, + "learning_rate": 4.917895883884363e-06, + "loss": 1.2259, + "step": 3630 + }, + { + "epoch": 0.11, + "learning_rate": 4.917833874099063e-06, + "loss": 1.2255, + "step": 3631 + }, + { + "epoch": 0.11, + "learning_rate": 4.917771841297149e-06, + "loss": 1.163, + "step": 3632 + }, + { + "epoch": 0.11, + "learning_rate": 4.917709785479212e-06, + "loss": 1.2288, + "step": 3633 + }, + { + "epoch": 0.11, + "learning_rate": 4.917647706645842e-06, + "loss": 1.1825, + "step": 3634 + }, + { + "epoch": 0.11, + "learning_rate": 4.91758560479763e-06, + "loss": 1.2191, + "step": 3635 + }, + { + "epoch": 0.11, + "learning_rate": 4.917523479935168e-06, + "loss": 1.1838, + "step": 3636 + }, + { + "epoch": 0.11, + "learning_rate": 4.917461332059046e-06, + "loss": 1.005, + "step": 3637 + }, + { + "epoch": 0.11, + "learning_rate": 4.917399161169857e-06, + "loss": 1.2609, + "step": 3638 + }, + { + "epoch": 0.11, + "learning_rate": 4.917336967268192e-06, + "loss": 1.1004, + "step": 3639 + }, + { + "epoch": 0.11, + "learning_rate": 4.917274750354644e-06, + "loss": 1.1979, + "step": 3640 + }, + { + "epoch": 0.11, + "learning_rate": 4.917212510429803e-06, + "loss": 1.0795, + "step": 3641 + }, + { + "epoch": 0.11, + "learning_rate": 4.917150247494265e-06, + "loss": 1.1809, + "step": 3642 + }, + { + "epoch": 0.11, + "learning_rate": 4.917087961548619e-06, + "loss": 1.2954, + "step": 3643 + }, + { + "epoch": 0.11, + "learning_rate": 4.91702565259346e-06, + "loss": 1.226, + "step": 3644 + }, + { + "epoch": 0.11, + "learning_rate": 4.916963320629382e-06, + "loss": 1.1742, + "step": 3645 + }, + { + "epoch": 0.11, + "learning_rate": 4.916900965656977e-06, + "loss": 1.075, + "step": 3646 + }, + { + "epoch": 0.11, + "learning_rate": 4.916838587676837e-06, + "loss": 1.0941, + "step": 3647 + }, + { + "epoch": 0.11, + "learning_rate": 4.91677618668956e-06, + "loss": 1.1373, + "step": 3648 + }, + { + "epoch": 0.11, + "learning_rate": 4.916713762695736e-06, + "loss": 1.1924, + "step": 3649 + }, + { + "epoch": 0.11, + "learning_rate": 4.916651315695962e-06, + "loss": 1.189, + "step": 3650 + }, + { + "epoch": 0.11, + "learning_rate": 4.916588845690831e-06, + "loss": 1.0974, + "step": 3651 + }, + { + "epoch": 0.11, + "learning_rate": 4.916526352680938e-06, + "loss": 1.1963, + "step": 3652 + }, + { + "epoch": 0.11, + "learning_rate": 4.916463836666878e-06, + "loss": 1.0002, + "step": 3653 + }, + { + "epoch": 0.11, + "learning_rate": 4.916401297649246e-06, + "loss": 1.142, + "step": 3654 + }, + { + "epoch": 0.11, + "learning_rate": 4.916338735628638e-06, + "loss": 1.2803, + "step": 3655 + }, + { + "epoch": 0.11, + "learning_rate": 4.916276150605648e-06, + "loss": 1.0876, + "step": 3656 + }, + { + "epoch": 0.11, + "learning_rate": 4.916213542580873e-06, + "loss": 1.1625, + "step": 3657 + }, + { + "epoch": 0.11, + "learning_rate": 4.916150911554909e-06, + "loss": 1.252, + "step": 3658 + }, + { + "epoch": 0.11, + "learning_rate": 4.916088257528352e-06, + "loss": 1.213, + "step": 3659 + }, + { + "epoch": 0.11, + "learning_rate": 4.9160255805017985e-06, + "loss": 1.2091, + "step": 3660 + }, + { + "epoch": 0.11, + "learning_rate": 4.915962880475845e-06, + "loss": 1.1509, + "step": 3661 + }, + { + "epoch": 0.11, + "learning_rate": 4.915900157451089e-06, + "loss": 1.1786, + "step": 3662 + }, + { + "epoch": 0.11, + "learning_rate": 4.915837411428126e-06, + "loss": 1.08, + "step": 3663 + }, + { + "epoch": 0.11, + "learning_rate": 4.9157746424075555e-06, + "loss": 1.1235, + "step": 3664 + }, + { + "epoch": 0.11, + "learning_rate": 4.915711850389973e-06, + "loss": 1.1707, + "step": 3665 + }, + { + "epoch": 0.11, + "learning_rate": 4.915649035375977e-06, + "loss": 1.0886, + "step": 3666 + }, + { + "epoch": 0.11, + "learning_rate": 4.915586197366166e-06, + "loss": 1.231, + "step": 3667 + }, + { + "epoch": 0.11, + "learning_rate": 4.915523336361137e-06, + "loss": 1.1635, + "step": 3668 + }, + { + "epoch": 0.11, + "learning_rate": 4.915460452361491e-06, + "loss": 1.2129, + "step": 3669 + }, + { + "epoch": 0.11, + "learning_rate": 4.9153975453678235e-06, + "loss": 1.1391, + "step": 3670 + }, + { + "epoch": 0.11, + "learning_rate": 4.915334615380735e-06, + "loss": 1.1783, + "step": 3671 + }, + { + "epoch": 0.11, + "learning_rate": 4.915271662400824e-06, + "loss": 1.2493, + "step": 3672 + }, + { + "epoch": 0.11, + "learning_rate": 4.9152086864286905e-06, + "loss": 1.1921, + "step": 3673 + }, + { + "epoch": 0.11, + "learning_rate": 4.915145687464933e-06, + "loss": 1.0383, + "step": 3674 + }, + { + "epoch": 0.11, + "learning_rate": 4.915082665510152e-06, + "loss": 1.1871, + "step": 3675 + }, + { + "epoch": 0.11, + "learning_rate": 4.915019620564947e-06, + "loss": 1.1065, + "step": 3676 + }, + { + "epoch": 0.11, + "learning_rate": 4.914956552629918e-06, + "loss": 1.1786, + "step": 3677 + }, + { + "epoch": 0.11, + "learning_rate": 4.914893461705667e-06, + "loss": 1.056, + "step": 3678 + }, + { + "epoch": 0.11, + "learning_rate": 4.9148303477927915e-06, + "loss": 1.1888, + "step": 3679 + }, + { + "epoch": 0.11, + "learning_rate": 4.914767210891895e-06, + "loss": 1.1558, + "step": 3680 + }, + { + "epoch": 0.11, + "learning_rate": 4.914704051003578e-06, + "loss": 1.175, + "step": 3681 + }, + { + "epoch": 0.11, + "learning_rate": 4.914640868128441e-06, + "loss": 1.0614, + "step": 3682 + }, + { + "epoch": 0.11, + "learning_rate": 4.914577662267086e-06, + "loss": 1.2244, + "step": 3683 + }, + { + "epoch": 0.11, + "learning_rate": 4.914514433420114e-06, + "loss": 1.1647, + "step": 3684 + }, + { + "epoch": 0.11, + "learning_rate": 4.914451181588128e-06, + "loss": 1.1341, + "step": 3685 + }, + { + "epoch": 0.11, + "learning_rate": 4.914387906771729e-06, + "loss": 1.2634, + "step": 3686 + }, + { + "epoch": 0.11, + "learning_rate": 4.914324608971521e-06, + "loss": 1.1183, + "step": 3687 + }, + { + "epoch": 0.11, + "learning_rate": 4.914261288188105e-06, + "loss": 1.2073, + "step": 3688 + }, + { + "epoch": 0.11, + "learning_rate": 4.914197944422085e-06, + "loss": 1.1934, + "step": 3689 + }, + { + "epoch": 0.11, + "learning_rate": 4.914134577674062e-06, + "loss": 1.1349, + "step": 3690 + }, + { + "epoch": 0.11, + "learning_rate": 4.914071187944641e-06, + "loss": 1.1729, + "step": 3691 + }, + { + "epoch": 0.11, + "learning_rate": 4.914007775234425e-06, + "loss": 1.1388, + "step": 3692 + }, + { + "epoch": 0.11, + "learning_rate": 4.913944339544018e-06, + "loss": 1.2302, + "step": 3693 + }, + { + "epoch": 0.11, + "learning_rate": 4.9138808808740226e-06, + "loss": 1.1105, + "step": 3694 + }, + { + "epoch": 0.11, + "learning_rate": 4.9138173992250435e-06, + "loss": 1.1605, + "step": 3695 + }, + { + "epoch": 0.11, + "learning_rate": 4.913753894597687e-06, + "loss": 1.1894, + "step": 3696 + }, + { + "epoch": 0.11, + "learning_rate": 4.913690366992554e-06, + "loss": 1.1411, + "step": 3697 + }, + { + "epoch": 0.11, + "learning_rate": 4.9136268164102525e-06, + "loss": 1.1094, + "step": 3698 + }, + { + "epoch": 0.11, + "learning_rate": 4.913563242851386e-06, + "loss": 1.3678, + "step": 3699 + }, + { + "epoch": 0.11, + "learning_rate": 4.913499646316559e-06, + "loss": 1.1576, + "step": 3700 + }, + { + "epoch": 0.11, + "learning_rate": 4.913436026806378e-06, + "loss": 1.1562, + "step": 3701 + }, + { + "epoch": 0.11, + "learning_rate": 4.91337238432145e-06, + "loss": 1.1625, + "step": 3702 + }, + { + "epoch": 0.11, + "learning_rate": 4.9133087188623775e-06, + "loss": 1.091, + "step": 3703 + }, + { + "epoch": 0.11, + "learning_rate": 4.913245030429768e-06, + "loss": 1.1547, + "step": 3704 + }, + { + "epoch": 0.11, + "learning_rate": 4.91318131902423e-06, + "loss": 1.0096, + "step": 3705 + }, + { + "epoch": 0.11, + "learning_rate": 4.9131175846463665e-06, + "loss": 1.1373, + "step": 3706 + }, + { + "epoch": 0.11, + "learning_rate": 4.913053827296787e-06, + "loss": 1.0222, + "step": 3707 + }, + { + "epoch": 0.11, + "learning_rate": 4.912990046976096e-06, + "loss": 1.1248, + "step": 3708 + }, + { + "epoch": 0.11, + "learning_rate": 4.912926243684902e-06, + "loss": 1.0232, + "step": 3709 + }, + { + "epoch": 0.11, + "learning_rate": 4.9128624174238125e-06, + "loss": 1.2214, + "step": 3710 + }, + { + "epoch": 0.11, + "learning_rate": 4.912798568193435e-06, + "loss": 1.1442, + "step": 3711 + }, + { + "epoch": 0.11, + "learning_rate": 4.912734695994377e-06, + "loss": 1.0867, + "step": 3712 + }, + { + "epoch": 0.11, + "learning_rate": 4.9126708008272475e-06, + "loss": 1.0908, + "step": 3713 + }, + { + "epoch": 0.11, + "learning_rate": 4.912606882692652e-06, + "loss": 1.2321, + "step": 3714 + }, + { + "epoch": 0.11, + "learning_rate": 4.9125429415912025e-06, + "loss": 1.1205, + "step": 3715 + }, + { + "epoch": 0.11, + "learning_rate": 4.912478977523506e-06, + "loss": 1.1006, + "step": 3716 + }, + { + "epoch": 0.11, + "learning_rate": 4.912414990490171e-06, + "loss": 1.1176, + "step": 3717 + }, + { + "epoch": 0.11, + "learning_rate": 4.912350980491808e-06, + "loss": 1.2316, + "step": 3718 + }, + { + "epoch": 0.11, + "learning_rate": 4.912286947529024e-06, + "loss": 1.2239, + "step": 3719 + }, + { + "epoch": 0.11, + "learning_rate": 4.912222891602431e-06, + "loss": 1.1663, + "step": 3720 + }, + { + "epoch": 0.11, + "learning_rate": 4.912158812712639e-06, + "loss": 1.183, + "step": 3721 + }, + { + "epoch": 0.11, + "learning_rate": 4.912094710860256e-06, + "loss": 1.0963, + "step": 3722 + }, + { + "epoch": 0.11, + "learning_rate": 4.912030586045893e-06, + "loss": 1.1252, + "step": 3723 + }, + { + "epoch": 0.11, + "learning_rate": 4.91196643827016e-06, + "loss": 1.1432, + "step": 3724 + }, + { + "epoch": 0.11, + "learning_rate": 4.911902267533668e-06, + "loss": 1.205, + "step": 3725 + }, + { + "epoch": 0.11, + "learning_rate": 4.911838073837028e-06, + "loss": 1.119, + "step": 3726 + }, + { + "epoch": 0.11, + "learning_rate": 4.911773857180852e-06, + "loss": 1.1483, + "step": 3727 + }, + { + "epoch": 0.11, + "learning_rate": 4.91170961756575e-06, + "loss": 1.0544, + "step": 3728 + }, + { + "epoch": 0.11, + "learning_rate": 4.9116453549923335e-06, + "loss": 1.1783, + "step": 3729 + }, + { + "epoch": 0.11, + "learning_rate": 4.911581069461216e-06, + "loss": 1.1866, + "step": 3730 + }, + { + "epoch": 0.11, + "learning_rate": 4.911516760973007e-06, + "loss": 1.0441, + "step": 3731 + }, + { + "epoch": 0.11, + "learning_rate": 4.91145242952832e-06, + "loss": 1.1967, + "step": 3732 + }, + { + "epoch": 0.11, + "learning_rate": 4.9113880751277674e-06, + "loss": 1.1449, + "step": 3733 + }, + { + "epoch": 0.11, + "learning_rate": 4.911323697771962e-06, + "loss": 1.1879, + "step": 3734 + }, + { + "epoch": 0.11, + "learning_rate": 4.911259297461516e-06, + "loss": 1.117, + "step": 3735 + }, + { + "epoch": 0.11, + "learning_rate": 4.911194874197043e-06, + "loss": 1.21, + "step": 3736 + }, + { + "epoch": 0.11, + "learning_rate": 4.911130427979156e-06, + "loss": 1.0952, + "step": 3737 + }, + { + "epoch": 0.11, + "learning_rate": 4.911065958808468e-06, + "loss": 1.1127, + "step": 3738 + }, + { + "epoch": 0.11, + "learning_rate": 4.9110014666855945e-06, + "loss": 1.1763, + "step": 3739 + }, + { + "epoch": 0.11, + "learning_rate": 4.910936951611147e-06, + "loss": 1.1679, + "step": 3740 + }, + { + "epoch": 0.11, + "learning_rate": 4.9108724135857415e-06, + "loss": 1.182, + "step": 3741 + }, + { + "epoch": 0.11, + "learning_rate": 4.910807852609991e-06, + "loss": 1.195, + "step": 3742 + }, + { + "epoch": 0.11, + "learning_rate": 4.910743268684513e-06, + "loss": 1.2163, + "step": 3743 + }, + { + "epoch": 0.11, + "learning_rate": 4.9106786618099175e-06, + "loss": 1.2831, + "step": 3744 + }, + { + "epoch": 0.11, + "learning_rate": 4.910614031986824e-06, + "loss": 1.142, + "step": 3745 + }, + { + "epoch": 0.11, + "learning_rate": 4.910549379215845e-06, + "loss": 1.0944, + "step": 3746 + }, + { + "epoch": 0.11, + "learning_rate": 4.910484703497597e-06, + "loss": 1.1822, + "step": 3747 + }, + { + "epoch": 0.11, + "learning_rate": 4.910420004832696e-06, + "loss": 1.2083, + "step": 3748 + }, + { + "epoch": 0.11, + "learning_rate": 4.910355283221756e-06, + "loss": 1.1741, + "step": 3749 + }, + { + "epoch": 0.11, + "learning_rate": 4.910290538665396e-06, + "loss": 1.1692, + "step": 3750 + }, + { + "epoch": 0.11, + "learning_rate": 4.910225771164231e-06, + "loss": 1.1307, + "step": 3751 + }, + { + "epoch": 0.11, + "learning_rate": 4.910160980718876e-06, + "loss": 1.1163, + "step": 3752 + }, + { + "epoch": 0.11, + "learning_rate": 4.910096167329951e-06, + "loss": 1.2538, + "step": 3753 + }, + { + "epoch": 0.11, + "learning_rate": 4.9100313309980694e-06, + "loss": 1.2217, + "step": 3754 + }, + { + "epoch": 0.11, + "learning_rate": 4.909966471723852e-06, + "loss": 1.1719, + "step": 3755 + }, + { + "epoch": 0.11, + "learning_rate": 4.909901589507914e-06, + "loss": 1.2068, + "step": 3756 + }, + { + "epoch": 0.11, + "learning_rate": 4.909836684350873e-06, + "loss": 1.167, + "step": 3757 + }, + { + "epoch": 0.11, + "learning_rate": 4.909771756253347e-06, + "loss": 1.0681, + "step": 3758 + }, + { + "epoch": 0.11, + "learning_rate": 4.909706805215956e-06, + "loss": 1.1189, + "step": 3759 + }, + { + "epoch": 0.11, + "learning_rate": 4.909641831239316e-06, + "loss": 1.1713, + "step": 3760 + }, + { + "epoch": 0.11, + "learning_rate": 4.909576834324046e-06, + "loss": 1.2914, + "step": 3761 + }, + { + "epoch": 0.11, + "learning_rate": 4.909511814470765e-06, + "loss": 1.2556, + "step": 3762 + }, + { + "epoch": 0.11, + "learning_rate": 4.909446771680092e-06, + "loss": 1.1819, + "step": 3763 + }, + { + "epoch": 0.11, + "learning_rate": 4.909381705952646e-06, + "loss": 1.2318, + "step": 3764 + }, + { + "epoch": 0.11, + "learning_rate": 4.909316617289047e-06, + "loss": 1.1026, + "step": 3765 + }, + { + "epoch": 0.11, + "learning_rate": 4.909251505689915e-06, + "loss": 1.239, + "step": 3766 + }, + { + "epoch": 0.11, + "learning_rate": 4.909186371155868e-06, + "loss": 1.2426, + "step": 3767 + }, + { + "epoch": 0.11, + "learning_rate": 4.909121213687526e-06, + "loss": 1.1406, + "step": 3768 + }, + { + "epoch": 0.11, + "learning_rate": 4.909056033285512e-06, + "loss": 1.0969, + "step": 3769 + }, + { + "epoch": 0.11, + "learning_rate": 4.908990829950444e-06, + "loss": 1.1278, + "step": 3770 + }, + { + "epoch": 0.11, + "learning_rate": 4.9089256036829435e-06, + "loss": 1.0952, + "step": 3771 + }, + { + "epoch": 0.11, + "learning_rate": 4.908860354483632e-06, + "loss": 1.0869, + "step": 3772 + }, + { + "epoch": 0.11, + "learning_rate": 4.90879508235313e-06, + "loss": 1.27, + "step": 3773 + }, + { + "epoch": 0.11, + "learning_rate": 4.908729787292058e-06, + "loss": 1.2869, + "step": 3774 + }, + { + "epoch": 0.11, + "learning_rate": 4.90866446930104e-06, + "loss": 1.2227, + "step": 3775 + }, + { + "epoch": 0.11, + "learning_rate": 4.908599128380696e-06, + "loss": 1.2103, + "step": 3776 + }, + { + "epoch": 0.11, + "learning_rate": 4.908533764531647e-06, + "loss": 1.1744, + "step": 3777 + }, + { + "epoch": 0.11, + "learning_rate": 4.908468377754517e-06, + "loss": 1.1023, + "step": 3778 + }, + { + "epoch": 0.11, + "learning_rate": 4.908402968049929e-06, + "loss": 1.2651, + "step": 3779 + }, + { + "epoch": 0.11, + "learning_rate": 4.908337535418503e-06, + "loss": 1.2577, + "step": 3780 + }, + { + "epoch": 0.11, + "learning_rate": 4.908272079860865e-06, + "loss": 1.2133, + "step": 3781 + }, + { + "epoch": 0.11, + "learning_rate": 4.9082066013776365e-06, + "loss": 1.1825, + "step": 3782 + }, + { + "epoch": 0.11, + "learning_rate": 4.908141099969441e-06, + "loss": 1.0724, + "step": 3783 + }, + { + "epoch": 0.11, + "learning_rate": 4.9080755756369015e-06, + "loss": 1.1942, + "step": 3784 + }, + { + "epoch": 0.11, + "learning_rate": 4.908010028380643e-06, + "loss": 1.1433, + "step": 3785 + }, + { + "epoch": 0.11, + "learning_rate": 4.907944458201288e-06, + "loss": 1.2177, + "step": 3786 + }, + { + "epoch": 0.11, + "learning_rate": 4.907878865099462e-06, + "loss": 1.2366, + "step": 3787 + }, + { + "epoch": 0.11, + "learning_rate": 4.907813249075788e-06, + "loss": 0.9567, + "step": 3788 + }, + { + "epoch": 0.11, + "learning_rate": 4.907747610130893e-06, + "loss": 1.0644, + "step": 3789 + }, + { + "epoch": 0.11, + "learning_rate": 4.907681948265399e-06, + "loss": 1.1862, + "step": 3790 + }, + { + "epoch": 0.11, + "learning_rate": 4.907616263479933e-06, + "loss": 1.1389, + "step": 3791 + }, + { + "epoch": 0.11, + "learning_rate": 4.90755055577512e-06, + "loss": 1.2206, + "step": 3792 + }, + { + "epoch": 0.11, + "learning_rate": 4.907484825151585e-06, + "loss": 1.3061, + "step": 3793 + }, + { + "epoch": 0.11, + "learning_rate": 4.9074190716099536e-06, + "loss": 1.2146, + "step": 3794 + }, + { + "epoch": 0.11, + "learning_rate": 4.907353295150853e-06, + "loss": 1.0967, + "step": 3795 + }, + { + "epoch": 0.11, + "learning_rate": 4.907287495774907e-06, + "loss": 1.1248, + "step": 3796 + }, + { + "epoch": 0.11, + "learning_rate": 4.907221673482745e-06, + "loss": 1.1443, + "step": 3797 + }, + { + "epoch": 0.11, + "learning_rate": 4.907155828274991e-06, + "loss": 1.1216, + "step": 3798 + }, + { + "epoch": 0.11, + "learning_rate": 4.907089960152273e-06, + "loss": 1.2531, + "step": 3799 + }, + { + "epoch": 0.11, + "learning_rate": 4.907024069115218e-06, + "loss": 1.2109, + "step": 3800 + }, + { + "epoch": 0.11, + "learning_rate": 4.906958155164453e-06, + "loss": 1.1774, + "step": 3801 + }, + { + "epoch": 0.11, + "learning_rate": 4.906892218300606e-06, + "loss": 1.0862, + "step": 3802 + }, + { + "epoch": 0.11, + "learning_rate": 4.906826258524304e-06, + "loss": 1.1412, + "step": 3803 + }, + { + "epoch": 0.11, + "learning_rate": 4.906760275836175e-06, + "loss": 1.0826, + "step": 3804 + }, + { + "epoch": 0.11, + "learning_rate": 4.906694270236848e-06, + "loss": 1.2266, + "step": 3805 + }, + { + "epoch": 0.11, + "learning_rate": 4.906628241726949e-06, + "loss": 1.222, + "step": 3806 + }, + { + "epoch": 0.11, + "learning_rate": 4.90656219030711e-06, + "loss": 1.2038, + "step": 3807 + }, + { + "epoch": 0.11, + "learning_rate": 4.906496115977957e-06, + "loss": 1.1667, + "step": 3808 + }, + { + "epoch": 0.11, + "learning_rate": 4.90643001874012e-06, + "loss": 1.2168, + "step": 3809 + }, + { + "epoch": 0.11, + "learning_rate": 4.9063638985942295e-06, + "loss": 1.1287, + "step": 3810 + }, + { + "epoch": 0.11, + "learning_rate": 4.906297755540912e-06, + "loss": 1.1664, + "step": 3811 + }, + { + "epoch": 0.11, + "learning_rate": 4.9062315895808e-06, + "loss": 1.1401, + "step": 3812 + }, + { + "epoch": 0.11, + "learning_rate": 4.906165400714521e-06, + "loss": 1.1536, + "step": 3813 + }, + { + "epoch": 0.11, + "learning_rate": 4.9060991889427065e-06, + "loss": 1.1313, + "step": 3814 + }, + { + "epoch": 0.11, + "learning_rate": 4.906032954265987e-06, + "loss": 1.0797, + "step": 3815 + }, + { + "epoch": 0.11, + "learning_rate": 4.905966696684993e-06, + "loss": 1.1058, + "step": 3816 + }, + { + "epoch": 0.11, + "learning_rate": 4.905900416200354e-06, + "loss": 1.1215, + "step": 3817 + }, + { + "epoch": 0.12, + "learning_rate": 4.905834112812702e-06, + "loss": 1.2072, + "step": 3818 + }, + { + "epoch": 0.12, + "learning_rate": 4.905767786522668e-06, + "loss": 1.1108, + "step": 3819 + }, + { + "epoch": 0.12, + "learning_rate": 4.905701437330883e-06, + "loss": 1.1523, + "step": 3820 + }, + { + "epoch": 0.12, + "learning_rate": 4.9056350652379795e-06, + "loss": 1.2406, + "step": 3821 + }, + { + "epoch": 0.12, + "learning_rate": 4.9055686702445885e-06, + "loss": 1.1937, + "step": 3822 + }, + { + "epoch": 0.12, + "learning_rate": 4.905502252351342e-06, + "loss": 1.1006, + "step": 3823 + }, + { + "epoch": 0.12, + "learning_rate": 4.905435811558873e-06, + "loss": 1.2583, + "step": 3824 + }, + { + "epoch": 0.12, + "learning_rate": 4.905369347867814e-06, + "loss": 1.1266, + "step": 3825 + }, + { + "epoch": 0.12, + "learning_rate": 4.905302861278795e-06, + "loss": 1.1691, + "step": 3826 + }, + { + "epoch": 0.12, + "learning_rate": 4.905236351792454e-06, + "loss": 1.1618, + "step": 3827 + }, + { + "epoch": 0.12, + "learning_rate": 4.90516981940942e-06, + "loss": 1.0877, + "step": 3828 + }, + { + "epoch": 0.12, + "learning_rate": 4.905103264130328e-06, + "loss": 1.1547, + "step": 3829 + }, + { + "epoch": 0.12, + "learning_rate": 4.905036685955811e-06, + "loss": 1.1295, + "step": 3830 + }, + { + "epoch": 0.12, + "learning_rate": 4.904970084886504e-06, + "loss": 1.123, + "step": 3831 + }, + { + "epoch": 0.12, + "learning_rate": 4.904903460923039e-06, + "loss": 1.1128, + "step": 3832 + }, + { + "epoch": 0.12, + "learning_rate": 4.904836814066052e-06, + "loss": 1.0942, + "step": 3833 + }, + { + "epoch": 0.12, + "learning_rate": 4.9047701443161755e-06, + "loss": 1.0676, + "step": 3834 + }, + { + "epoch": 0.12, + "learning_rate": 4.9047034516740465e-06, + "loss": 1.1337, + "step": 3835 + }, + { + "epoch": 0.12, + "learning_rate": 4.904636736140298e-06, + "loss": 1.2157, + "step": 3836 + }, + { + "epoch": 0.12, + "learning_rate": 4.904569997715567e-06, + "loss": 1.1801, + "step": 3837 + }, + { + "epoch": 0.12, + "learning_rate": 4.904503236400487e-06, + "loss": 1.1072, + "step": 3838 + }, + { + "epoch": 0.12, + "learning_rate": 4.904436452195695e-06, + "loss": 1.2249, + "step": 3839 + }, + { + "epoch": 0.12, + "learning_rate": 4.904369645101824e-06, + "loss": 1.0626, + "step": 3840 + }, + { + "epoch": 0.12, + "learning_rate": 4.904302815119514e-06, + "loss": 1.2014, + "step": 3841 + }, + { + "epoch": 0.12, + "learning_rate": 4.904235962249398e-06, + "loss": 1.1893, + "step": 3842 + }, + { + "epoch": 0.12, + "learning_rate": 4.9041690864921146e-06, + "loss": 1.1059, + "step": 3843 + }, + { + "epoch": 0.12, + "learning_rate": 4.904102187848299e-06, + "loss": 1.2748, + "step": 3844 + }, + { + "epoch": 0.12, + "learning_rate": 4.9040352663185875e-06, + "loss": 1.0477, + "step": 3845 + }, + { + "epoch": 0.12, + "learning_rate": 4.9039683219036196e-06, + "loss": 1.1299, + "step": 3846 + }, + { + "epoch": 0.12, + "learning_rate": 4.90390135460403e-06, + "loss": 1.1935, + "step": 3847 + }, + { + "epoch": 0.12, + "learning_rate": 4.903834364420457e-06, + "loss": 1.1942, + "step": 3848 + }, + { + "epoch": 0.12, + "learning_rate": 4.903767351353539e-06, + "loss": 1.1207, + "step": 3849 + }, + { + "epoch": 0.12, + "learning_rate": 4.903700315403914e-06, + "loss": 1.129, + "step": 3850 + }, + { + "epoch": 0.12, + "learning_rate": 4.903633256572219e-06, + "loss": 1.1104, + "step": 3851 + }, + { + "epoch": 0.12, + "learning_rate": 4.903566174859093e-06, + "loss": 1.1812, + "step": 3852 + }, + { + "epoch": 0.12, + "learning_rate": 4.9034990702651755e-06, + "loss": 1.0261, + "step": 3853 + }, + { + "epoch": 0.12, + "learning_rate": 4.903431942791104e-06, + "loss": 1.1824, + "step": 3854 + }, + { + "epoch": 0.12, + "learning_rate": 4.903364792437518e-06, + "loss": 1.2101, + "step": 3855 + }, + { + "epoch": 0.12, + "learning_rate": 4.903297619205057e-06, + "loss": 1.0961, + "step": 3856 + }, + { + "epoch": 0.12, + "learning_rate": 4.9032304230943585e-06, + "loss": 1.0741, + "step": 3857 + }, + { + "epoch": 0.12, + "learning_rate": 4.903163204106065e-06, + "loss": 1.1062, + "step": 3858 + }, + { + "epoch": 0.12, + "learning_rate": 4.903095962240815e-06, + "loss": 1.1115, + "step": 3859 + }, + { + "epoch": 0.12, + "learning_rate": 4.903028697499249e-06, + "loss": 1.311, + "step": 3860 + }, + { + "epoch": 0.12, + "learning_rate": 4.902961409882007e-06, + "loss": 1.145, + "step": 3861 + }, + { + "epoch": 0.12, + "learning_rate": 4.90289409938973e-06, + "loss": 1.2061, + "step": 3862 + }, + { + "epoch": 0.12, + "learning_rate": 4.902826766023058e-06, + "loss": 1.2921, + "step": 3863 + }, + { + "epoch": 0.12, + "learning_rate": 4.9027594097826325e-06, + "loss": 1.1395, + "step": 3864 + }, + { + "epoch": 0.12, + "learning_rate": 4.902692030669095e-06, + "loss": 1.0542, + "step": 3865 + }, + { + "epoch": 0.12, + "learning_rate": 4.902624628683086e-06, + "loss": 1.1779, + "step": 3866 + }, + { + "epoch": 0.12, + "learning_rate": 4.902557203825247e-06, + "loss": 1.2233, + "step": 3867 + }, + { + "epoch": 0.12, + "learning_rate": 4.902489756096223e-06, + "loss": 1.2007, + "step": 3868 + }, + { + "epoch": 0.12, + "learning_rate": 4.902422285496652e-06, + "loss": 1.0929, + "step": 3869 + }, + { + "epoch": 0.12, + "learning_rate": 4.902354792027177e-06, + "loss": 1.1567, + "step": 3870 + }, + { + "epoch": 0.12, + "learning_rate": 4.902287275688443e-06, + "loss": 1.1915, + "step": 3871 + }, + { + "epoch": 0.12, + "learning_rate": 4.902219736481091e-06, + "loss": 1.1322, + "step": 3872 + }, + { + "epoch": 0.12, + "learning_rate": 4.902152174405763e-06, + "loss": 1.1276, + "step": 3873 + }, + { + "epoch": 0.12, + "learning_rate": 4.902084589463104e-06, + "loss": 1.0775, + "step": 3874 + }, + { + "epoch": 0.12, + "learning_rate": 4.9020169816537565e-06, + "loss": 1.1167, + "step": 3875 + }, + { + "epoch": 0.12, + "learning_rate": 4.901949350978363e-06, + "loss": 1.1594, + "step": 3876 + }, + { + "epoch": 0.12, + "learning_rate": 4.901881697437571e-06, + "loss": 1.1308, + "step": 3877 + }, + { + "epoch": 0.12, + "learning_rate": 4.90181402103202e-06, + "loss": 1.212, + "step": 3878 + }, + { + "epoch": 0.12, + "learning_rate": 4.9017463217623566e-06, + "loss": 1.2384, + "step": 3879 + }, + { + "epoch": 0.12, + "learning_rate": 4.901678599629225e-06, + "loss": 1.1331, + "step": 3880 + }, + { + "epoch": 0.12, + "learning_rate": 4.90161085463327e-06, + "loss": 1.1794, + "step": 3881 + }, + { + "epoch": 0.12, + "learning_rate": 4.901543086775137e-06, + "loss": 1.167, + "step": 3882 + }, + { + "epoch": 0.12, + "learning_rate": 4.901475296055469e-06, + "loss": 1.139, + "step": 3883 + }, + { + "epoch": 0.12, + "learning_rate": 4.901407482474914e-06, + "loss": 1.1216, + "step": 3884 + }, + { + "epoch": 0.12, + "learning_rate": 4.901339646034116e-06, + "loss": 1.0746, + "step": 3885 + }, + { + "epoch": 0.12, + "learning_rate": 4.901271786733721e-06, + "loss": 1.1595, + "step": 3886 + }, + { + "epoch": 0.12, + "learning_rate": 4.901203904574374e-06, + "loss": 1.2838, + "step": 3887 + }, + { + "epoch": 0.12, + "learning_rate": 4.9011359995567245e-06, + "loss": 1.1126, + "step": 3888 + }, + { + "epoch": 0.12, + "learning_rate": 4.9010680716814154e-06, + "loss": 1.2271, + "step": 3889 + }, + { + "epoch": 0.12, + "learning_rate": 4.901000120949094e-06, + "loss": 1.1295, + "step": 3890 + }, + { + "epoch": 0.12, + "learning_rate": 4.900932147360409e-06, + "loss": 1.0453, + "step": 3891 + }, + { + "epoch": 0.12, + "learning_rate": 4.900864150916006e-06, + "loss": 1.1868, + "step": 3892 + }, + { + "epoch": 0.12, + "learning_rate": 4.900796131616532e-06, + "loss": 1.1673, + "step": 3893 + }, + { + "epoch": 0.12, + "learning_rate": 4.900728089462636e-06, + "loss": 1.1267, + "step": 3894 + }, + { + "epoch": 0.12, + "learning_rate": 4.900660024454964e-06, + "loss": 1.1162, + "step": 3895 + }, + { + "epoch": 0.12, + "learning_rate": 4.900591936594165e-06, + "loss": 1.178, + "step": 3896 + }, + { + "epoch": 0.12, + "learning_rate": 4.9005238258808874e-06, + "loss": 1.1284, + "step": 3897 + }, + { + "epoch": 0.12, + "learning_rate": 4.900455692315779e-06, + "loss": 1.1567, + "step": 3898 + }, + { + "epoch": 0.12, + "learning_rate": 4.900387535899488e-06, + "loss": 1.1257, + "step": 3899 + }, + { + "epoch": 0.12, + "learning_rate": 4.900319356632663e-06, + "loss": 1.2068, + "step": 3900 + }, + { + "epoch": 0.12, + "learning_rate": 4.900251154515956e-06, + "loss": 1.1018, + "step": 3901 + }, + { + "epoch": 0.12, + "learning_rate": 4.900182929550013e-06, + "loss": 1.1716, + "step": 3902 + }, + { + "epoch": 0.12, + "learning_rate": 4.900114681735484e-06, + "loss": 1.1536, + "step": 3903 + }, + { + "epoch": 0.12, + "learning_rate": 4.900046411073019e-06, + "loss": 1.2698, + "step": 3904 + }, + { + "epoch": 0.12, + "learning_rate": 4.899978117563268e-06, + "loss": 1.0598, + "step": 3905 + }, + { + "epoch": 0.12, + "learning_rate": 4.8999098012068825e-06, + "loss": 1.095, + "step": 3906 + }, + { + "epoch": 0.12, + "learning_rate": 4.8998414620045095e-06, + "loss": 1.1445, + "step": 3907 + }, + { + "epoch": 0.12, + "learning_rate": 4.899773099956804e-06, + "loss": 1.1417, + "step": 3908 + }, + { + "epoch": 0.12, + "learning_rate": 4.899704715064413e-06, + "loss": 1.2033, + "step": 3909 + }, + { + "epoch": 0.12, + "learning_rate": 4.899636307327988e-06, + "loss": 1.1727, + "step": 3910 + }, + { + "epoch": 0.12, + "learning_rate": 4.899567876748182e-06, + "loss": 1.1395, + "step": 3911 + }, + { + "epoch": 0.12, + "learning_rate": 4.8994994233256465e-06, + "loss": 1.1589, + "step": 3912 + }, + { + "epoch": 0.12, + "learning_rate": 4.899430947061031e-06, + "loss": 1.1224, + "step": 3913 + }, + { + "epoch": 0.12, + "learning_rate": 4.899362447954988e-06, + "loss": 1.181, + "step": 3914 + }, + { + "epoch": 0.12, + "learning_rate": 4.899293926008171e-06, + "loss": 1.1449, + "step": 3915 + }, + { + "epoch": 0.12, + "learning_rate": 4.899225381221231e-06, + "loss": 1.1795, + "step": 3916 + }, + { + "epoch": 0.12, + "learning_rate": 4.899156813594821e-06, + "loss": 1.2145, + "step": 3917 + }, + { + "epoch": 0.12, + "learning_rate": 4.899088223129593e-06, + "loss": 1.2585, + "step": 3918 + }, + { + "epoch": 0.12, + "learning_rate": 4.899019609826202e-06, + "loss": 1.1042, + "step": 3919 + }, + { + "epoch": 0.12, + "learning_rate": 4.898950973685299e-06, + "loss": 1.1929, + "step": 3920 + }, + { + "epoch": 0.12, + "learning_rate": 4.8988823147075374e-06, + "loss": 1.0876, + "step": 3921 + }, + { + "epoch": 0.12, + "learning_rate": 4.898813632893572e-06, + "loss": 1.1376, + "step": 3922 + }, + { + "epoch": 0.12, + "learning_rate": 4.898744928244056e-06, + "loss": 1.2063, + "step": 3923 + }, + { + "epoch": 0.12, + "learning_rate": 4.898676200759645e-06, + "loss": 1.1913, + "step": 3924 + }, + { + "epoch": 0.12, + "learning_rate": 4.89860745044099e-06, + "loss": 1.197, + "step": 3925 + }, + { + "epoch": 0.12, + "learning_rate": 4.898538677288748e-06, + "loss": 1.2088, + "step": 3926 + }, + { + "epoch": 0.12, + "learning_rate": 4.8984698813035725e-06, + "loss": 1.1063, + "step": 3927 + }, + { + "epoch": 0.12, + "learning_rate": 4.898401062486119e-06, + "loss": 1.1101, + "step": 3928 + }, + { + "epoch": 0.12, + "learning_rate": 4.898332220837043e-06, + "loss": 1.1447, + "step": 3929 + }, + { + "epoch": 0.12, + "learning_rate": 4.898263356356999e-06, + "loss": 1.2487, + "step": 3930 + }, + { + "epoch": 0.12, + "learning_rate": 4.898194469046643e-06, + "loss": 1.2354, + "step": 3931 + }, + { + "epoch": 0.12, + "learning_rate": 4.8981255589066305e-06, + "loss": 1.1313, + "step": 3932 + }, + { + "epoch": 0.12, + "learning_rate": 4.8980566259376175e-06, + "loss": 1.2632, + "step": 3933 + }, + { + "epoch": 0.12, + "learning_rate": 4.897987670140261e-06, + "loss": 1.1255, + "step": 3934 + }, + { + "epoch": 0.12, + "learning_rate": 4.897918691515216e-06, + "loss": 1.1288, + "step": 3935 + }, + { + "epoch": 0.12, + "learning_rate": 4.89784969006314e-06, + "loss": 1.1811, + "step": 3936 + }, + { + "epoch": 0.12, + "learning_rate": 4.897780665784691e-06, + "loss": 1.1877, + "step": 3937 + }, + { + "epoch": 0.12, + "learning_rate": 4.8977116186805225e-06, + "loss": 1.0468, + "step": 3938 + }, + { + "epoch": 0.12, + "learning_rate": 4.8976425487512955e-06, + "loss": 1.0877, + "step": 3939 + }, + { + "epoch": 0.12, + "learning_rate": 4.897573455997667e-06, + "loss": 1.1125, + "step": 3940 + }, + { + "epoch": 0.12, + "learning_rate": 4.897504340420293e-06, + "loss": 1.1697, + "step": 3941 + }, + { + "epoch": 0.12, + "learning_rate": 4.897435202019833e-06, + "loss": 1.1812, + "step": 3942 + }, + { + "epoch": 0.12, + "learning_rate": 4.897366040796944e-06, + "loss": 1.2584, + "step": 3943 + }, + { + "epoch": 0.12, + "learning_rate": 4.897296856752285e-06, + "loss": 1.1428, + "step": 3944 + }, + { + "epoch": 0.12, + "learning_rate": 4.897227649886515e-06, + "loss": 1.197, + "step": 3945 + }, + { + "epoch": 0.12, + "learning_rate": 4.897158420200291e-06, + "loss": 1.2014, + "step": 3946 + }, + { + "epoch": 0.12, + "learning_rate": 4.897089167694274e-06, + "loss": 1.0443, + "step": 3947 + }, + { + "epoch": 0.12, + "learning_rate": 4.897019892369123e-06, + "loss": 1.0811, + "step": 3948 + }, + { + "epoch": 0.12, + "learning_rate": 4.896950594225497e-06, + "loss": 1.0956, + "step": 3949 + }, + { + "epoch": 0.12, + "learning_rate": 4.8968812732640555e-06, + "loss": 1.2426, + "step": 3950 + }, + { + "epoch": 0.12, + "learning_rate": 4.896811929485459e-06, + "loss": 1.1926, + "step": 3951 + }, + { + "epoch": 0.12, + "learning_rate": 4.896742562890366e-06, + "loss": 1.1155, + "step": 3952 + }, + { + "epoch": 0.12, + "learning_rate": 4.89667317347944e-06, + "loss": 1.123, + "step": 3953 + }, + { + "epoch": 0.12, + "learning_rate": 4.896603761253339e-06, + "loss": 1.2751, + "step": 3954 + }, + { + "epoch": 0.12, + "learning_rate": 4.896534326212724e-06, + "loss": 1.0615, + "step": 3955 + }, + { + "epoch": 0.12, + "learning_rate": 4.8964648683582565e-06, + "loss": 1.1392, + "step": 3956 + }, + { + "epoch": 0.12, + "learning_rate": 4.8963953876905975e-06, + "loss": 1.1644, + "step": 3957 + }, + { + "epoch": 0.12, + "learning_rate": 4.896325884210409e-06, + "loss": 1.2327, + "step": 3958 + }, + { + "epoch": 0.12, + "learning_rate": 4.896256357918352e-06, + "loss": 1.0842, + "step": 3959 + }, + { + "epoch": 0.12, + "learning_rate": 4.896186808815089e-06, + "loss": 1.168, + "step": 3960 + }, + { + "epoch": 0.12, + "learning_rate": 4.896117236901281e-06, + "loss": 1.2195, + "step": 3961 + }, + { + "epoch": 0.12, + "learning_rate": 4.8960476421775915e-06, + "loss": 1.1719, + "step": 3962 + }, + { + "epoch": 0.12, + "learning_rate": 4.895978024644682e-06, + "loss": 1.1777, + "step": 3963 + }, + { + "epoch": 0.12, + "learning_rate": 4.895908384303215e-06, + "loss": 1.1725, + "step": 3964 + }, + { + "epoch": 0.12, + "learning_rate": 4.895838721153855e-06, + "loss": 1.2045, + "step": 3965 + }, + { + "epoch": 0.12, + "learning_rate": 4.895769035197264e-06, + "loss": 1.1152, + "step": 3966 + }, + { + "epoch": 0.12, + "learning_rate": 4.895699326434106e-06, + "loss": 1.157, + "step": 3967 + }, + { + "epoch": 0.12, + "learning_rate": 4.895629594865044e-06, + "loss": 1.1582, + "step": 3968 + }, + { + "epoch": 0.12, + "learning_rate": 4.8955598404907414e-06, + "loss": 1.0352, + "step": 3969 + }, + { + "epoch": 0.12, + "learning_rate": 4.895490063311864e-06, + "loss": 1.228, + "step": 3970 + }, + { + "epoch": 0.12, + "learning_rate": 4.895420263329074e-06, + "loss": 1.1202, + "step": 3971 + }, + { + "epoch": 0.12, + "learning_rate": 4.895350440543037e-06, + "loss": 1.129, + "step": 3972 + }, + { + "epoch": 0.12, + "learning_rate": 4.895280594954417e-06, + "loss": 1.2013, + "step": 3973 + }, + { + "epoch": 0.12, + "learning_rate": 4.89521072656388e-06, + "loss": 1.0619, + "step": 3974 + }, + { + "epoch": 0.12, + "learning_rate": 4.8951408353720905e-06, + "loss": 1.1498, + "step": 3975 + }, + { + "epoch": 0.12, + "learning_rate": 4.895070921379714e-06, + "loss": 1.0991, + "step": 3976 + }, + { + "epoch": 0.12, + "learning_rate": 4.8950009845874156e-06, + "loss": 1.0732, + "step": 3977 + }, + { + "epoch": 0.12, + "learning_rate": 4.89493102499586e-06, + "loss": 1.0986, + "step": 3978 + }, + { + "epoch": 0.12, + "learning_rate": 4.894861042605716e-06, + "loss": 1.167, + "step": 3979 + }, + { + "epoch": 0.12, + "learning_rate": 4.894791037417648e-06, + "loss": 1.1758, + "step": 3980 + }, + { + "epoch": 0.12, + "learning_rate": 4.8947210094323224e-06, + "loss": 1.172, + "step": 3981 + }, + { + "epoch": 0.12, + "learning_rate": 4.894650958650406e-06, + "loss": 1.0941, + "step": 3982 + }, + { + "epoch": 0.12, + "learning_rate": 4.894580885072566e-06, + "loss": 1.0895, + "step": 3983 + }, + { + "epoch": 0.12, + "learning_rate": 4.8945107886994706e-06, + "loss": 1.1082, + "step": 3984 + }, + { + "epoch": 0.12, + "learning_rate": 4.8944406695317835e-06, + "loss": 1.2477, + "step": 3985 + }, + { + "epoch": 0.12, + "learning_rate": 4.894370527570176e-06, + "loss": 1.0917, + "step": 3986 + }, + { + "epoch": 0.12, + "learning_rate": 4.8943003628153125e-06, + "loss": 1.247, + "step": 3987 + }, + { + "epoch": 0.12, + "learning_rate": 4.894230175267864e-06, + "loss": 1.1047, + "step": 3988 + }, + { + "epoch": 0.12, + "learning_rate": 4.894159964928498e-06, + "loss": 1.1296, + "step": 3989 + }, + { + "epoch": 0.12, + "learning_rate": 4.894089731797881e-06, + "loss": 1.1556, + "step": 3990 + }, + { + "epoch": 0.12, + "learning_rate": 4.894019475876684e-06, + "loss": 1.1533, + "step": 3991 + }, + { + "epoch": 0.12, + "learning_rate": 4.893949197165572e-06, + "loss": 1.1746, + "step": 3992 + }, + { + "epoch": 0.12, + "learning_rate": 4.893878895665219e-06, + "loss": 1.0939, + "step": 3993 + }, + { + "epoch": 0.12, + "learning_rate": 4.893808571376291e-06, + "loss": 1.1954, + "step": 3994 + }, + { + "epoch": 0.12, + "learning_rate": 4.893738224299459e-06, + "loss": 1.1938, + "step": 3995 + }, + { + "epoch": 0.12, + "learning_rate": 4.893667854435391e-06, + "loss": 1.1179, + "step": 3996 + }, + { + "epoch": 0.12, + "learning_rate": 4.893597461784758e-06, + "loss": 1.1261, + "step": 3997 + }, + { + "epoch": 0.12, + "learning_rate": 4.893527046348231e-06, + "loss": 1.1122, + "step": 3998 + }, + { + "epoch": 0.12, + "learning_rate": 4.893456608126478e-06, + "loss": 1.1415, + "step": 3999 + }, + { + "epoch": 0.12, + "learning_rate": 4.893386147120171e-06, + "loss": 1.1734, + "step": 4000 + }, + { + "epoch": 0.12, + "learning_rate": 4.893315663329982e-06, + "loss": 1.1876, + "step": 4001 + }, + { + "epoch": 0.12, + "learning_rate": 4.893245156756578e-06, + "loss": 1.0404, + "step": 4002 + }, + { + "epoch": 0.12, + "learning_rate": 4.893174627400635e-06, + "loss": 1.1534, + "step": 4003 + }, + { + "epoch": 0.12, + "learning_rate": 4.893104075262821e-06, + "loss": 1.2225, + "step": 4004 + }, + { + "epoch": 0.12, + "learning_rate": 4.893033500343809e-06, + "loss": 1.1874, + "step": 4005 + }, + { + "epoch": 0.12, + "learning_rate": 4.892962902644272e-06, + "loss": 1.1133, + "step": 4006 + }, + { + "epoch": 0.12, + "learning_rate": 4.892892282164878e-06, + "loss": 1.218, + "step": 4007 + }, + { + "epoch": 0.12, + "learning_rate": 4.892821638906304e-06, + "loss": 1.0092, + "step": 4008 + }, + { + "epoch": 0.12, + "learning_rate": 4.89275097286922e-06, + "loss": 1.1348, + "step": 4009 + }, + { + "epoch": 0.12, + "learning_rate": 4.892680284054299e-06, + "loss": 1.2776, + "step": 4010 + }, + { + "epoch": 0.12, + "learning_rate": 4.892609572462214e-06, + "loss": 1.2147, + "step": 4011 + }, + { + "epoch": 0.12, + "learning_rate": 4.892538838093638e-06, + "loss": 1.1154, + "step": 4012 + }, + { + "epoch": 0.12, + "learning_rate": 4.892468080949244e-06, + "loss": 1.1903, + "step": 4013 + }, + { + "epoch": 0.12, + "learning_rate": 4.8923973010297065e-06, + "loss": 1.1724, + "step": 4014 + }, + { + "epoch": 0.12, + "learning_rate": 4.892326498335699e-06, + "loss": 1.1935, + "step": 4015 + }, + { + "epoch": 0.12, + "learning_rate": 4.892255672867896e-06, + "loss": 1.1837, + "step": 4016 + }, + { + "epoch": 0.12, + "learning_rate": 4.892184824626971e-06, + "loss": 1.2003, + "step": 4017 + }, + { + "epoch": 0.12, + "learning_rate": 4.892113953613598e-06, + "loss": 1.0804, + "step": 4018 + }, + { + "epoch": 0.12, + "learning_rate": 4.892043059828453e-06, + "loss": 1.2259, + "step": 4019 + }, + { + "epoch": 0.12, + "learning_rate": 4.891972143272209e-06, + "loss": 1.2004, + "step": 4020 + }, + { + "epoch": 0.12, + "learning_rate": 4.891901203945543e-06, + "loss": 1.1108, + "step": 4021 + }, + { + "epoch": 0.12, + "learning_rate": 4.89183024184913e-06, + "loss": 1.1335, + "step": 4022 + }, + { + "epoch": 0.12, + "learning_rate": 4.891759256983644e-06, + "loss": 1.1189, + "step": 4023 + }, + { + "epoch": 0.12, + "learning_rate": 4.891688249349762e-06, + "loss": 1.1531, + "step": 4024 + }, + { + "epoch": 0.12, + "learning_rate": 4.8916172189481605e-06, + "loss": 1.1503, + "step": 4025 + }, + { + "epoch": 0.12, + "learning_rate": 4.8915461657795136e-06, + "loss": 1.2292, + "step": 4026 + }, + { + "epoch": 0.12, + "learning_rate": 4.8914750898445e-06, + "loss": 1.1169, + "step": 4027 + }, + { + "epoch": 0.12, + "learning_rate": 4.891403991143795e-06, + "loss": 1.0782, + "step": 4028 + }, + { + "epoch": 0.12, + "learning_rate": 4.891332869678076e-06, + "loss": 1.1432, + "step": 4029 + }, + { + "epoch": 0.12, + "learning_rate": 4.89126172544802e-06, + "loss": 1.0563, + "step": 4030 + }, + { + "epoch": 0.12, + "learning_rate": 4.891190558454303e-06, + "loss": 1.1417, + "step": 4031 + }, + { + "epoch": 0.12, + "learning_rate": 4.891119368697604e-06, + "loss": 1.2013, + "step": 4032 + }, + { + "epoch": 0.12, + "learning_rate": 4.891048156178601e-06, + "loss": 1.12, + "step": 4033 + }, + { + "epoch": 0.12, + "learning_rate": 4.8909769208979705e-06, + "loss": 1.1514, + "step": 4034 + }, + { + "epoch": 0.12, + "learning_rate": 4.8909056628563914e-06, + "loss": 1.228, + "step": 4035 + }, + { + "epoch": 0.12, + "learning_rate": 4.8908343820545415e-06, + "loss": 1.2348, + "step": 4036 + }, + { + "epoch": 0.12, + "learning_rate": 4.8907630784931e-06, + "loss": 1.2096, + "step": 4037 + }, + { + "epoch": 0.12, + "learning_rate": 4.890691752172746e-06, + "loss": 1.1274, + "step": 4038 + }, + { + "epoch": 0.12, + "learning_rate": 4.890620403094158e-06, + "loss": 1.0328, + "step": 4039 + }, + { + "epoch": 0.12, + "learning_rate": 4.8905490312580135e-06, + "loss": 1.1226, + "step": 4040 + }, + { + "epoch": 0.12, + "learning_rate": 4.890477636664994e-06, + "loss": 1.0697, + "step": 4041 + }, + { + "epoch": 0.12, + "learning_rate": 4.890406219315779e-06, + "loss": 1.122, + "step": 4042 + }, + { + "epoch": 0.12, + "learning_rate": 4.890334779211049e-06, + "loss": 1.2617, + "step": 4043 + }, + { + "epoch": 0.12, + "learning_rate": 4.890263316351482e-06, + "loss": 1.1417, + "step": 4044 + }, + { + "epoch": 0.12, + "learning_rate": 4.89019183073776e-06, + "loss": 1.2765, + "step": 4045 + }, + { + "epoch": 0.12, + "learning_rate": 4.890120322370563e-06, + "loss": 1.1327, + "step": 4046 + }, + { + "epoch": 0.12, + "learning_rate": 4.890048791250571e-06, + "loss": 1.1147, + "step": 4047 + }, + { + "epoch": 0.12, + "learning_rate": 4.889977237378466e-06, + "loss": 1.2142, + "step": 4048 + }, + { + "epoch": 0.12, + "learning_rate": 4.889905660754929e-06, + "loss": 1.177, + "step": 4049 + }, + { + "epoch": 0.12, + "learning_rate": 4.889834061380641e-06, + "loss": 1.0931, + "step": 4050 + }, + { + "epoch": 0.12, + "learning_rate": 4.889762439256283e-06, + "loss": 1.1876, + "step": 4051 + }, + { + "epoch": 0.12, + "learning_rate": 4.889690794382539e-06, + "loss": 1.1779, + "step": 4052 + }, + { + "epoch": 0.12, + "learning_rate": 4.889619126760088e-06, + "loss": 1.0864, + "step": 4053 + }, + { + "epoch": 0.12, + "learning_rate": 4.889547436389615e-06, + "loss": 1.1389, + "step": 4054 + }, + { + "epoch": 0.12, + "learning_rate": 4.889475723271801e-06, + "loss": 1.2325, + "step": 4055 + }, + { + "epoch": 0.12, + "learning_rate": 4.889403987407328e-06, + "loss": 1.1602, + "step": 4056 + }, + { + "epoch": 0.12, + "learning_rate": 4.8893322287968805e-06, + "loss": 1.0844, + "step": 4057 + }, + { + "epoch": 0.12, + "learning_rate": 4.889260447441141e-06, + "loss": 1.1474, + "step": 4058 + }, + { + "epoch": 0.12, + "learning_rate": 4.889188643340793e-06, + "loss": 1.0902, + "step": 4059 + }, + { + "epoch": 0.12, + "learning_rate": 4.889116816496519e-06, + "loss": 1.2163, + "step": 4060 + }, + { + "epoch": 0.12, + "learning_rate": 4.889044966909004e-06, + "loss": 1.2125, + "step": 4061 + }, + { + "epoch": 0.12, + "learning_rate": 4.888973094578932e-06, + "loss": 1.1246, + "step": 4062 + }, + { + "epoch": 0.12, + "learning_rate": 4.888901199506985e-06, + "loss": 1.1583, + "step": 4063 + }, + { + "epoch": 0.12, + "learning_rate": 4.888829281693851e-06, + "loss": 1.1205, + "step": 4064 + }, + { + "epoch": 0.12, + "learning_rate": 4.888757341140213e-06, + "loss": 1.0894, + "step": 4065 + }, + { + "epoch": 0.12, + "learning_rate": 4.8886853778467535e-06, + "loss": 1.1497, + "step": 4066 + }, + { + "epoch": 0.12, + "learning_rate": 4.888613391814161e-06, + "loss": 1.1808, + "step": 4067 + }, + { + "epoch": 0.12, + "learning_rate": 4.88854138304312e-06, + "loss": 1.1362, + "step": 4068 + }, + { + "epoch": 0.12, + "learning_rate": 4.888469351534314e-06, + "loss": 1.1041, + "step": 4069 + }, + { + "epoch": 0.12, + "learning_rate": 4.888397297288431e-06, + "loss": 1.2537, + "step": 4070 + }, + { + "epoch": 0.12, + "learning_rate": 4.888325220306155e-06, + "loss": 1.1071, + "step": 4071 + }, + { + "epoch": 0.12, + "learning_rate": 4.888253120588174e-06, + "loss": 1.2291, + "step": 4072 + }, + { + "epoch": 0.12, + "learning_rate": 4.888180998135174e-06, + "loss": 1.1534, + "step": 4073 + }, + { + "epoch": 0.12, + "learning_rate": 4.88810885294784e-06, + "loss": 1.2229, + "step": 4074 + }, + { + "epoch": 0.12, + "learning_rate": 4.88803668502686e-06, + "loss": 1.1582, + "step": 4075 + }, + { + "epoch": 0.12, + "learning_rate": 4.887964494372921e-06, + "loss": 1.1866, + "step": 4076 + }, + { + "epoch": 0.12, + "learning_rate": 4.8878922809867106e-06, + "loss": 1.2329, + "step": 4077 + }, + { + "epoch": 0.12, + "learning_rate": 4.887820044868915e-06, + "loss": 1.0984, + "step": 4078 + }, + { + "epoch": 0.12, + "learning_rate": 4.887747786020224e-06, + "loss": 1.153, + "step": 4079 + }, + { + "epoch": 0.12, + "learning_rate": 4.887675504441323e-06, + "loss": 1.1055, + "step": 4080 + }, + { + "epoch": 0.12, + "learning_rate": 4.887603200132901e-06, + "loss": 1.0225, + "step": 4081 + }, + { + "epoch": 0.12, + "learning_rate": 4.887530873095646e-06, + "loss": 1.0971, + "step": 4082 + }, + { + "epoch": 0.12, + "learning_rate": 4.887458523330248e-06, + "loss": 1.1726, + "step": 4083 + }, + { + "epoch": 0.12, + "learning_rate": 4.8873861508373945e-06, + "loss": 1.1087, + "step": 4084 + }, + { + "epoch": 0.12, + "learning_rate": 4.887313755617774e-06, + "loss": 1.1464, + "step": 4085 + }, + { + "epoch": 0.12, + "learning_rate": 4.887241337672077e-06, + "loss": 1.1987, + "step": 4086 + }, + { + "epoch": 0.12, + "learning_rate": 4.8871688970009924e-06, + "loss": 1.1808, + "step": 4087 + }, + { + "epoch": 0.12, + "learning_rate": 4.887096433605209e-06, + "loss": 1.0967, + "step": 4088 + }, + { + "epoch": 0.12, + "learning_rate": 4.887023947485417e-06, + "loss": 1.2094, + "step": 4089 + }, + { + "epoch": 0.12, + "learning_rate": 4.886951438642307e-06, + "loss": 1.1417, + "step": 4090 + }, + { + "epoch": 0.12, + "learning_rate": 4.886878907076569e-06, + "loss": 1.063, + "step": 4091 + }, + { + "epoch": 0.12, + "learning_rate": 4.886806352788893e-06, + "loss": 1.1398, + "step": 4092 + }, + { + "epoch": 0.12, + "learning_rate": 4.88673377577997e-06, + "loss": 1.0142, + "step": 4093 + }, + { + "epoch": 0.12, + "learning_rate": 4.886661176050492e-06, + "loss": 1.1533, + "step": 4094 + }, + { + "epoch": 0.12, + "learning_rate": 4.886588553601148e-06, + "loss": 1.157, + "step": 4095 + }, + { + "epoch": 0.12, + "learning_rate": 4.886515908432631e-06, + "loss": 1.1589, + "step": 4096 + }, + { + "epoch": 0.12, + "learning_rate": 4.886443240545632e-06, + "loss": 1.1262, + "step": 4097 + }, + { + "epoch": 0.12, + "learning_rate": 4.886370549940842e-06, + "loss": 1.1053, + "step": 4098 + }, + { + "epoch": 0.12, + "learning_rate": 4.8862978366189536e-06, + "loss": 1.1027, + "step": 4099 + }, + { + "epoch": 0.12, + "learning_rate": 4.8862251005806605e-06, + "loss": 1.1138, + "step": 4100 + }, + { + "epoch": 0.12, + "learning_rate": 4.886152341826652e-06, + "loss": 1.0983, + "step": 4101 + }, + { + "epoch": 0.12, + "learning_rate": 4.886079560357624e-06, + "loss": 1.166, + "step": 4102 + }, + { + "epoch": 0.12, + "learning_rate": 4.886006756174267e-06, + "loss": 1.1745, + "step": 4103 + }, + { + "epoch": 0.12, + "learning_rate": 4.885933929277274e-06, + "loss": 1.1185, + "step": 4104 + }, + { + "epoch": 0.12, + "learning_rate": 4.88586107966734e-06, + "loss": 1.2009, + "step": 4105 + }, + { + "epoch": 0.12, + "learning_rate": 4.8857882073451574e-06, + "loss": 1.3395, + "step": 4106 + }, + { + "epoch": 0.12, + "learning_rate": 4.8857153123114194e-06, + "loss": 1.1311, + "step": 4107 + }, + { + "epoch": 0.12, + "learning_rate": 4.885642394566822e-06, + "loss": 1.1235, + "step": 4108 + }, + { + "epoch": 0.12, + "learning_rate": 4.885569454112057e-06, + "loss": 1.1445, + "step": 4109 + }, + { + "epoch": 0.12, + "learning_rate": 4.88549649094782e-06, + "loss": 1.1967, + "step": 4110 + }, + { + "epoch": 0.12, + "learning_rate": 4.885423505074806e-06, + "loss": 1.2544, + "step": 4111 + }, + { + "epoch": 0.12, + "learning_rate": 4.885350496493708e-06, + "loss": 1.2159, + "step": 4112 + }, + { + "epoch": 0.12, + "learning_rate": 4.885277465205223e-06, + "loss": 1.0955, + "step": 4113 + }, + { + "epoch": 0.12, + "learning_rate": 4.885204411210045e-06, + "loss": 1.1412, + "step": 4114 + }, + { + "epoch": 0.12, + "learning_rate": 4.885131334508869e-06, + "loss": 1.1579, + "step": 4115 + }, + { + "epoch": 0.12, + "learning_rate": 4.885058235102392e-06, + "loss": 1.037, + "step": 4116 + }, + { + "epoch": 0.12, + "learning_rate": 4.88498511299131e-06, + "loss": 1.1524, + "step": 4117 + }, + { + "epoch": 0.12, + "learning_rate": 4.8849119681763165e-06, + "loss": 1.1651, + "step": 4118 + }, + { + "epoch": 0.12, + "learning_rate": 4.884838800658112e-06, + "loss": 1.101, + "step": 4119 + }, + { + "epoch": 0.12, + "learning_rate": 4.884765610437389e-06, + "loss": 1.0972, + "step": 4120 + }, + { + "epoch": 0.12, + "learning_rate": 4.884692397514846e-06, + "loss": 1.2468, + "step": 4121 + }, + { + "epoch": 0.12, + "learning_rate": 4.884619161891181e-06, + "loss": 0.9786, + "step": 4122 + }, + { + "epoch": 0.12, + "learning_rate": 4.884545903567089e-06, + "loss": 1.1702, + "step": 4123 + }, + { + "epoch": 0.12, + "learning_rate": 4.8844726225432696e-06, + "loss": 1.2054, + "step": 4124 + }, + { + "epoch": 0.12, + "learning_rate": 4.884399318820418e-06, + "loss": 1.1476, + "step": 4125 + }, + { + "epoch": 0.12, + "learning_rate": 4.884325992399234e-06, + "loss": 1.055, + "step": 4126 + }, + { + "epoch": 0.12, + "learning_rate": 4.884252643280415e-06, + "loss": 1.0978, + "step": 4127 + }, + { + "epoch": 0.12, + "learning_rate": 4.884179271464658e-06, + "loss": 1.139, + "step": 4128 + }, + { + "epoch": 0.12, + "learning_rate": 4.884105876952664e-06, + "loss": 1.2654, + "step": 4129 + }, + { + "epoch": 0.12, + "learning_rate": 4.884032459745129e-06, + "loss": 1.0324, + "step": 4130 + }, + { + "epoch": 0.12, + "learning_rate": 4.883959019842754e-06, + "loss": 1.1758, + "step": 4131 + }, + { + "epoch": 0.12, + "learning_rate": 4.8838855572462375e-06, + "loss": 1.1523, + "step": 4132 + }, + { + "epoch": 0.12, + "learning_rate": 4.883812071956277e-06, + "loss": 1.2599, + "step": 4133 + }, + { + "epoch": 0.12, + "learning_rate": 4.883738563973576e-06, + "loss": 1.1021, + "step": 4134 + }, + { + "epoch": 0.12, + "learning_rate": 4.88366503329883e-06, + "loss": 1.0729, + "step": 4135 + }, + { + "epoch": 0.12, + "learning_rate": 4.883591479932742e-06, + "loss": 1.1916, + "step": 4136 + }, + { + "epoch": 0.12, + "learning_rate": 4.883517903876011e-06, + "loss": 1.336, + "step": 4137 + }, + { + "epoch": 0.12, + "learning_rate": 4.883444305129337e-06, + "loss": 1.1718, + "step": 4138 + }, + { + "epoch": 0.12, + "learning_rate": 4.883370683693421e-06, + "loss": 1.2034, + "step": 4139 + }, + { + "epoch": 0.12, + "learning_rate": 4.883297039568965e-06, + "loss": 1.1785, + "step": 4140 + }, + { + "epoch": 0.12, + "learning_rate": 4.883223372756668e-06, + "loss": 1.0688, + "step": 4141 + }, + { + "epoch": 0.12, + "learning_rate": 4.883149683257233e-06, + "loss": 1.2617, + "step": 4142 + }, + { + "epoch": 0.12, + "learning_rate": 4.88307597107136e-06, + "loss": 1.1309, + "step": 4143 + }, + { + "epoch": 0.12, + "learning_rate": 4.883002236199752e-06, + "loss": 1.2133, + "step": 4144 + }, + { + "epoch": 0.12, + "learning_rate": 4.88292847864311e-06, + "loss": 1.1431, + "step": 4145 + }, + { + "epoch": 0.12, + "learning_rate": 4.8828546984021374e-06, + "loss": 1.0678, + "step": 4146 + }, + { + "epoch": 0.12, + "learning_rate": 4.882780895477535e-06, + "loss": 0.9812, + "step": 4147 + }, + { + "epoch": 0.12, + "learning_rate": 4.882707069870006e-06, + "loss": 1.137, + "step": 4148 + }, + { + "epoch": 0.12, + "learning_rate": 4.882633221580254e-06, + "loss": 1.0907, + "step": 4149 + }, + { + "epoch": 0.13, + "learning_rate": 4.88255935060898e-06, + "loss": 1.3064, + "step": 4150 + }, + { + "epoch": 0.13, + "learning_rate": 4.882485456956889e-06, + "loss": 1.098, + "step": 4151 + }, + { + "epoch": 0.13, + "learning_rate": 4.882411540624684e-06, + "loss": 1.1996, + "step": 4152 + }, + { + "epoch": 0.13, + "learning_rate": 4.882337601613069e-06, + "loss": 1.2042, + "step": 4153 + }, + { + "epoch": 0.13, + "learning_rate": 4.882263639922747e-06, + "loss": 1.0997, + "step": 4154 + }, + { + "epoch": 0.13, + "learning_rate": 4.882189655554423e-06, + "loss": 1.2757, + "step": 4155 + }, + { + "epoch": 0.13, + "learning_rate": 4.882115648508799e-06, + "loss": 1.1718, + "step": 4156 + }, + { + "epoch": 0.13, + "learning_rate": 4.882041618786584e-06, + "loss": 1.1926, + "step": 4157 + }, + { + "epoch": 0.13, + "learning_rate": 4.881967566388478e-06, + "loss": 1.226, + "step": 4158 + }, + { + "epoch": 0.13, + "learning_rate": 4.881893491315189e-06, + "loss": 1.1592, + "step": 4159 + }, + { + "epoch": 0.13, + "learning_rate": 4.8818193935674205e-06, + "loss": 1.1634, + "step": 4160 + }, + { + "epoch": 0.13, + "learning_rate": 4.881745273145878e-06, + "loss": 1.2126, + "step": 4161 + }, + { + "epoch": 0.13, + "learning_rate": 4.881671130051269e-06, + "loss": 1.2307, + "step": 4162 + }, + { + "epoch": 0.13, + "learning_rate": 4.881596964284296e-06, + "loss": 1.1863, + "step": 4163 + }, + { + "epoch": 0.13, + "learning_rate": 4.881522775845668e-06, + "loss": 1.213, + "step": 4164 + }, + { + "epoch": 0.13, + "learning_rate": 4.881448564736091e-06, + "loss": 1.1617, + "step": 4165 + }, + { + "epoch": 0.13, + "learning_rate": 4.88137433095627e-06, + "loss": 1.1786, + "step": 4166 + }, + { + "epoch": 0.13, + "learning_rate": 4.881300074506911e-06, + "loss": 1.2489, + "step": 4167 + }, + { + "epoch": 0.13, + "learning_rate": 4.881225795388724e-06, + "loss": 1.3007, + "step": 4168 + }, + { + "epoch": 0.13, + "learning_rate": 4.881151493602414e-06, + "loss": 1.1987, + "step": 4169 + }, + { + "epoch": 0.13, + "learning_rate": 4.881077169148688e-06, + "loss": 1.1752, + "step": 4170 + }, + { + "epoch": 0.13, + "learning_rate": 4.881002822028254e-06, + "loss": 1.0709, + "step": 4171 + }, + { + "epoch": 0.13, + "learning_rate": 4.88092845224182e-06, + "loss": 1.1283, + "step": 4172 + }, + { + "epoch": 0.13, + "learning_rate": 4.880854059790094e-06, + "loss": 1.224, + "step": 4173 + }, + { + "epoch": 0.13, + "learning_rate": 4.880779644673784e-06, + "loss": 1.1805, + "step": 4174 + }, + { + "epoch": 0.13, + "learning_rate": 4.880705206893599e-06, + "loss": 1.1976, + "step": 4175 + }, + { + "epoch": 0.13, + "learning_rate": 4.880630746450245e-06, + "loss": 1.1667, + "step": 4176 + }, + { + "epoch": 0.13, + "learning_rate": 4.880556263344435e-06, + "loss": 1.1454, + "step": 4177 + }, + { + "epoch": 0.13, + "learning_rate": 4.880481757576875e-06, + "loss": 1.1029, + "step": 4178 + }, + { + "epoch": 0.13, + "learning_rate": 4.880407229148275e-06, + "loss": 1.1609, + "step": 4179 + }, + { + "epoch": 0.13, + "learning_rate": 4.8803326780593455e-06, + "loss": 1.1821, + "step": 4180 + }, + { + "epoch": 0.13, + "learning_rate": 4.880258104310794e-06, + "loss": 0.9508, + "step": 4181 + }, + { + "epoch": 0.13, + "learning_rate": 4.8801835079033326e-06, + "loss": 1.1859, + "step": 4182 + }, + { + "epoch": 0.13, + "learning_rate": 4.88010888883767e-06, + "loss": 1.2905, + "step": 4183 + }, + { + "epoch": 0.13, + "learning_rate": 4.880034247114518e-06, + "loss": 1.1789, + "step": 4184 + }, + { + "epoch": 0.13, + "learning_rate": 4.879959582734586e-06, + "loss": 1.1615, + "step": 4185 + }, + { + "epoch": 0.13, + "learning_rate": 4.879884895698584e-06, + "loss": 1.2493, + "step": 4186 + }, + { + "epoch": 0.13, + "learning_rate": 4.879810186007224e-06, + "loss": 1.2539, + "step": 4187 + }, + { + "epoch": 0.13, + "learning_rate": 4.879735453661218e-06, + "loss": 1.1249, + "step": 4188 + }, + { + "epoch": 0.13, + "learning_rate": 4.879660698661277e-06, + "loss": 1.1834, + "step": 4189 + }, + { + "epoch": 0.13, + "learning_rate": 4.879585921008112e-06, + "loss": 1.167, + "step": 4190 + }, + { + "epoch": 0.13, + "learning_rate": 4.879511120702434e-06, + "loss": 1.0361, + "step": 4191 + }, + { + "epoch": 0.13, + "learning_rate": 4.879436297744957e-06, + "loss": 1.1508, + "step": 4192 + }, + { + "epoch": 0.13, + "learning_rate": 4.879361452136393e-06, + "loss": 1.18, + "step": 4193 + }, + { + "epoch": 0.13, + "learning_rate": 4.879286583877453e-06, + "loss": 1.2233, + "step": 4194 + }, + { + "epoch": 0.13, + "learning_rate": 4.87921169296885e-06, + "loss": 1.147, + "step": 4195 + }, + { + "epoch": 0.13, + "learning_rate": 4.879136779411299e-06, + "loss": 1.0934, + "step": 4196 + }, + { + "epoch": 0.13, + "learning_rate": 4.8790618432055116e-06, + "loss": 1.1295, + "step": 4197 + }, + { + "epoch": 0.13, + "learning_rate": 4.8789868843522e-06, + "loss": 1.2505, + "step": 4198 + }, + { + "epoch": 0.13, + "learning_rate": 4.87891190285208e-06, + "loss": 1.1937, + "step": 4199 + }, + { + "epoch": 0.13, + "learning_rate": 4.878836898705864e-06, + "loss": 1.1852, + "step": 4200 + }, + { + "epoch": 0.13, + "learning_rate": 4.878761871914266e-06, + "loss": 1.2021, + "step": 4201 + }, + { + "epoch": 0.13, + "learning_rate": 4.878686822478001e-06, + "loss": 1.2222, + "step": 4202 + }, + { + "epoch": 0.13, + "learning_rate": 4.8786117503977834e-06, + "loss": 1.1656, + "step": 4203 + }, + { + "epoch": 0.13, + "learning_rate": 4.878536655674328e-06, + "loss": 1.0982, + "step": 4204 + }, + { + "epoch": 0.13, + "learning_rate": 4.878461538308349e-06, + "loss": 1.0957, + "step": 4205 + }, + { + "epoch": 0.13, + "learning_rate": 4.878386398300561e-06, + "loss": 1.2013, + "step": 4206 + }, + { + "epoch": 0.13, + "learning_rate": 4.878311235651681e-06, + "loss": 1.1295, + "step": 4207 + }, + { + "epoch": 0.13, + "learning_rate": 4.878236050362422e-06, + "loss": 1.2281, + "step": 4208 + }, + { + "epoch": 0.13, + "learning_rate": 4.8781608424335015e-06, + "loss": 1.1954, + "step": 4209 + }, + { + "epoch": 0.13, + "learning_rate": 4.878085611865636e-06, + "loss": 1.1828, + "step": 4210 + }, + { + "epoch": 0.13, + "learning_rate": 4.87801035865954e-06, + "loss": 1.2416, + "step": 4211 + }, + { + "epoch": 0.13, + "learning_rate": 4.877935082815931e-06, + "loss": 1.2924, + "step": 4212 + }, + { + "epoch": 0.13, + "learning_rate": 4.877859784335524e-06, + "loss": 1.1809, + "step": 4213 + }, + { + "epoch": 0.13, + "learning_rate": 4.8777844632190395e-06, + "loss": 1.2399, + "step": 4214 + }, + { + "epoch": 0.13, + "learning_rate": 4.877709119467191e-06, + "loss": 1.1171, + "step": 4215 + }, + { + "epoch": 0.13, + "learning_rate": 4.8776337530806964e-06, + "loss": 1.1984, + "step": 4216 + }, + { + "epoch": 0.13, + "learning_rate": 4.877558364060274e-06, + "loss": 1.2059, + "step": 4217 + }, + { + "epoch": 0.13, + "learning_rate": 4.8774829524066405e-06, + "loss": 1.0714, + "step": 4218 + }, + { + "epoch": 0.13, + "learning_rate": 4.877407518120515e-06, + "loss": 1.1762, + "step": 4219 + }, + { + "epoch": 0.13, + "learning_rate": 4.8773320612026145e-06, + "loss": 1.1685, + "step": 4220 + }, + { + "epoch": 0.13, + "learning_rate": 4.8772565816536585e-06, + "loss": 1.1329, + "step": 4221 + }, + { + "epoch": 0.13, + "learning_rate": 4.877181079474363e-06, + "loss": 1.0903, + "step": 4222 + }, + { + "epoch": 0.13, + "learning_rate": 4.87710555466545e-06, + "loss": 1.1302, + "step": 4223 + }, + { + "epoch": 0.13, + "learning_rate": 4.877030007227637e-06, + "loss": 1.2058, + "step": 4224 + }, + { + "epoch": 0.13, + "learning_rate": 4.8769544371616425e-06, + "loss": 1.312, + "step": 4225 + }, + { + "epoch": 0.13, + "learning_rate": 4.876878844468188e-06, + "loss": 1.1406, + "step": 4226 + }, + { + "epoch": 0.13, + "learning_rate": 4.87680322914799e-06, + "loss": 1.1631, + "step": 4227 + }, + { + "epoch": 0.13, + "learning_rate": 4.87672759120177e-06, + "loss": 1.2515, + "step": 4228 + }, + { + "epoch": 0.13, + "learning_rate": 4.8766519306302486e-06, + "loss": 1.1413, + "step": 4229 + }, + { + "epoch": 0.13, + "learning_rate": 4.876576247434146e-06, + "loss": 1.0261, + "step": 4230 + }, + { + "epoch": 0.13, + "learning_rate": 4.876500541614181e-06, + "loss": 1.2444, + "step": 4231 + }, + { + "epoch": 0.13, + "learning_rate": 4.876424813171076e-06, + "loss": 1.2223, + "step": 4232 + }, + { + "epoch": 0.13, + "learning_rate": 4.876349062105551e-06, + "loss": 1.2276, + "step": 4233 + }, + { + "epoch": 0.13, + "learning_rate": 4.8762732884183274e-06, + "loss": 1.0512, + "step": 4234 + }, + { + "epoch": 0.13, + "learning_rate": 4.876197492110128e-06, + "loss": 1.2161, + "step": 4235 + }, + { + "epoch": 0.13, + "learning_rate": 4.876121673181671e-06, + "loss": 1.2219, + "step": 4236 + }, + { + "epoch": 0.13, + "learning_rate": 4.87604583163368e-06, + "loss": 1.224, + "step": 4237 + }, + { + "epoch": 0.13, + "learning_rate": 4.875969967466878e-06, + "loss": 1.1592, + "step": 4238 + }, + { + "epoch": 0.13, + "learning_rate": 4.875894080681986e-06, + "loss": 1.1486, + "step": 4239 + }, + { + "epoch": 0.13, + "learning_rate": 4.875818171279727e-06, + "loss": 1.0609, + "step": 4240 + }, + { + "epoch": 0.13, + "learning_rate": 4.875742239260822e-06, + "loss": 1.0656, + "step": 4241 + }, + { + "epoch": 0.13, + "learning_rate": 4.875666284625996e-06, + "loss": 1.1224, + "step": 4242 + }, + { + "epoch": 0.13, + "learning_rate": 4.875590307375972e-06, + "loss": 1.2579, + "step": 4243 + }, + { + "epoch": 0.13, + "learning_rate": 4.875514307511471e-06, + "loss": 1.1915, + "step": 4244 + }, + { + "epoch": 0.13, + "learning_rate": 4.875438285033218e-06, + "loss": 1.1146, + "step": 4245 + }, + { + "epoch": 0.13, + "learning_rate": 4.875362239941936e-06, + "loss": 1.1901, + "step": 4246 + }, + { + "epoch": 0.13, + "learning_rate": 4.875286172238351e-06, + "loss": 1.1749, + "step": 4247 + }, + { + "epoch": 0.13, + "learning_rate": 4.875210081923185e-06, + "loss": 1.0933, + "step": 4248 + }, + { + "epoch": 0.13, + "learning_rate": 4.8751339689971624e-06, + "loss": 1.0839, + "step": 4249 + }, + { + "epoch": 0.13, + "learning_rate": 4.875057833461009e-06, + "loss": 1.1107, + "step": 4250 + }, + { + "epoch": 0.13, + "learning_rate": 4.874981675315449e-06, + "loss": 1.1796, + "step": 4251 + }, + { + "epoch": 0.13, + "learning_rate": 4.874905494561207e-06, + "loss": 1.1693, + "step": 4252 + }, + { + "epoch": 0.13, + "learning_rate": 4.874829291199008e-06, + "loss": 1.1711, + "step": 4253 + }, + { + "epoch": 0.13, + "learning_rate": 4.874753065229579e-06, + "loss": 1.1132, + "step": 4254 + }, + { + "epoch": 0.13, + "learning_rate": 4.874676816653644e-06, + "loss": 1.1769, + "step": 4255 + }, + { + "epoch": 0.13, + "learning_rate": 4.874600545471929e-06, + "loss": 1.0264, + "step": 4256 + }, + { + "epoch": 0.13, + "learning_rate": 4.874524251685161e-06, + "loss": 1.2208, + "step": 4257 + }, + { + "epoch": 0.13, + "learning_rate": 4.8744479352940655e-06, + "loss": 1.1143, + "step": 4258 + }, + { + "epoch": 0.13, + "learning_rate": 4.8743715962993696e-06, + "loss": 1.1293, + "step": 4259 + }, + { + "epoch": 0.13, + "learning_rate": 4.874295234701799e-06, + "loss": 1.1907, + "step": 4260 + }, + { + "epoch": 0.13, + "learning_rate": 4.8742188505020816e-06, + "loss": 1.2192, + "step": 4261 + }, + { + "epoch": 0.13, + "learning_rate": 4.874142443700944e-06, + "loss": 1.1507, + "step": 4262 + }, + { + "epoch": 0.13, + "learning_rate": 4.874066014299114e-06, + "loss": 1.1519, + "step": 4263 + }, + { + "epoch": 0.13, + "learning_rate": 4.873989562297319e-06, + "loss": 1.2247, + "step": 4264 + }, + { + "epoch": 0.13, + "learning_rate": 4.873913087696286e-06, + "loss": 1.1776, + "step": 4265 + }, + { + "epoch": 0.13, + "learning_rate": 4.873836590496745e-06, + "loss": 1.1535, + "step": 4266 + }, + { + "epoch": 0.13, + "learning_rate": 4.873760070699421e-06, + "loss": 1.0657, + "step": 4267 + }, + { + "epoch": 0.13, + "learning_rate": 4.873683528305046e-06, + "loss": 1.1834, + "step": 4268 + }, + { + "epoch": 0.13, + "learning_rate": 4.873606963314347e-06, + "loss": 1.188, + "step": 4269 + }, + { + "epoch": 0.13, + "learning_rate": 4.8735303757280525e-06, + "loss": 1.1547, + "step": 4270 + }, + { + "epoch": 0.13, + "learning_rate": 4.873453765546892e-06, + "loss": 1.1858, + "step": 4271 + }, + { + "epoch": 0.13, + "learning_rate": 4.873377132771595e-06, + "loss": 1.1565, + "step": 4272 + }, + { + "epoch": 0.13, + "learning_rate": 4.87330047740289e-06, + "loss": 1.222, + "step": 4273 + }, + { + "epoch": 0.13, + "learning_rate": 4.873223799441508e-06, + "loss": 1.0419, + "step": 4274 + }, + { + "epoch": 0.13, + "learning_rate": 4.873147098888178e-06, + "loss": 1.198, + "step": 4275 + }, + { + "epoch": 0.13, + "learning_rate": 4.873070375743631e-06, + "loss": 1.1814, + "step": 4276 + }, + { + "epoch": 0.13, + "learning_rate": 4.872993630008597e-06, + "loss": 1.1258, + "step": 4277 + }, + { + "epoch": 0.13, + "learning_rate": 4.872916861683806e-06, + "loss": 1.1057, + "step": 4278 + }, + { + "epoch": 0.13, + "learning_rate": 4.872840070769989e-06, + "loss": 1.2677, + "step": 4279 + }, + { + "epoch": 0.13, + "learning_rate": 4.8727632572678794e-06, + "loss": 1.2234, + "step": 4280 + }, + { + "epoch": 0.13, + "learning_rate": 4.8726864211782044e-06, + "loss": 1.3337, + "step": 4281 + }, + { + "epoch": 0.13, + "learning_rate": 4.872609562501698e-06, + "loss": 1.1034, + "step": 4282 + }, + { + "epoch": 0.13, + "learning_rate": 4.872532681239092e-06, + "loss": 1.2102, + "step": 4283 + }, + { + "epoch": 0.13, + "learning_rate": 4.872455777391116e-06, + "loss": 1.2267, + "step": 4284 + }, + { + "epoch": 0.13, + "learning_rate": 4.8723788509585045e-06, + "loss": 1.1737, + "step": 4285 + }, + { + "epoch": 0.13, + "learning_rate": 4.872301901941988e-06, + "loss": 1.3625, + "step": 4286 + }, + { + "epoch": 0.13, + "learning_rate": 4.8722249303423006e-06, + "loss": 1.241, + "step": 4287 + }, + { + "epoch": 0.13, + "learning_rate": 4.872147936160175e-06, + "loss": 1.1666, + "step": 4288 + }, + { + "epoch": 0.13, + "learning_rate": 4.872070919396343e-06, + "loss": 1.1943, + "step": 4289 + }, + { + "epoch": 0.13, + "learning_rate": 4.8719938800515385e-06, + "loss": 1.0807, + "step": 4290 + }, + { + "epoch": 0.13, + "learning_rate": 4.871916818126494e-06, + "loss": 1.2158, + "step": 4291 + }, + { + "epoch": 0.13, + "learning_rate": 4.871839733621944e-06, + "loss": 1.1457, + "step": 4292 + }, + { + "epoch": 0.13, + "learning_rate": 4.871762626538623e-06, + "loss": 1.1304, + "step": 4293 + }, + { + "epoch": 0.13, + "learning_rate": 4.871685496877263e-06, + "loss": 1.1853, + "step": 4294 + }, + { + "epoch": 0.13, + "learning_rate": 4.871608344638599e-06, + "loss": 1.1467, + "step": 4295 + }, + { + "epoch": 0.13, + "learning_rate": 4.871531169823367e-06, + "loss": 1.1384, + "step": 4296 + }, + { + "epoch": 0.13, + "learning_rate": 4.8714539724322995e-06, + "loss": 1.2599, + "step": 4297 + }, + { + "epoch": 0.13, + "learning_rate": 4.871376752466132e-06, + "loss": 1.2427, + "step": 4298 + }, + { + "epoch": 0.13, + "learning_rate": 4.871299509925601e-06, + "loss": 1.088, + "step": 4299 + }, + { + "epoch": 0.13, + "learning_rate": 4.87122224481144e-06, + "loss": 1.2693, + "step": 4300 + }, + { + "epoch": 0.13, + "learning_rate": 4.871144957124385e-06, + "loss": 1.1602, + "step": 4301 + }, + { + "epoch": 0.13, + "learning_rate": 4.8710676468651726e-06, + "loss": 1.1693, + "step": 4302 + }, + { + "epoch": 0.13, + "learning_rate": 4.8709903140345385e-06, + "loss": 1.1224, + "step": 4303 + }, + { + "epoch": 0.13, + "learning_rate": 4.870912958633218e-06, + "loss": 1.0977, + "step": 4304 + }, + { + "epoch": 0.13, + "learning_rate": 4.870835580661948e-06, + "loss": 1.2683, + "step": 4305 + }, + { + "epoch": 0.13, + "learning_rate": 4.870758180121466e-06, + "loss": 1.2826, + "step": 4306 + }, + { + "epoch": 0.13, + "learning_rate": 4.870680757012506e-06, + "loss": 1.1099, + "step": 4307 + }, + { + "epoch": 0.13, + "learning_rate": 4.870603311335808e-06, + "loss": 1.1731, + "step": 4308 + }, + { + "epoch": 0.13, + "learning_rate": 4.870525843092109e-06, + "loss": 1.1624, + "step": 4309 + }, + { + "epoch": 0.13, + "learning_rate": 4.870448352282144e-06, + "loss": 1.2244, + "step": 4310 + }, + { + "epoch": 0.13, + "learning_rate": 4.870370838906653e-06, + "loss": 1.1549, + "step": 4311 + }, + { + "epoch": 0.13, + "learning_rate": 4.870293302966373e-06, + "loss": 1.2011, + "step": 4312 + }, + { + "epoch": 0.13, + "learning_rate": 4.870215744462044e-06, + "loss": 1.0621, + "step": 4313 + }, + { + "epoch": 0.13, + "learning_rate": 4.870138163394401e-06, + "loss": 1.1668, + "step": 4314 + }, + { + "epoch": 0.13, + "learning_rate": 4.870060559764185e-06, + "loss": 1.1932, + "step": 4315 + }, + { + "epoch": 0.13, + "learning_rate": 4.869982933572132e-06, + "loss": 1.2689, + "step": 4316 + }, + { + "epoch": 0.13, + "learning_rate": 4.869905284818985e-06, + "loss": 1.1056, + "step": 4317 + }, + { + "epoch": 0.13, + "learning_rate": 4.869827613505481e-06, + "loss": 1.0836, + "step": 4318 + }, + { + "epoch": 0.13, + "learning_rate": 4.869749919632359e-06, + "loss": 1.1628, + "step": 4319 + }, + { + "epoch": 0.13, + "learning_rate": 4.869672203200358e-06, + "loss": 1.1539, + "step": 4320 + }, + { + "epoch": 0.13, + "learning_rate": 4.869594464210221e-06, + "loss": 1.1041, + "step": 4321 + }, + { + "epoch": 0.13, + "learning_rate": 4.869516702662684e-06, + "loss": 1.0934, + "step": 4322 + }, + { + "epoch": 0.13, + "learning_rate": 4.869438918558491e-06, + "loss": 1.1257, + "step": 4323 + }, + { + "epoch": 0.13, + "learning_rate": 4.86936111189838e-06, + "loss": 1.1075, + "step": 4324 + }, + { + "epoch": 0.13, + "learning_rate": 4.869283282683092e-06, + "loss": 1.1183, + "step": 4325 + }, + { + "epoch": 0.13, + "learning_rate": 4.869205430913368e-06, + "loss": 1.1434, + "step": 4326 + }, + { + "epoch": 0.13, + "learning_rate": 4.869127556589949e-06, + "loss": 1.0271, + "step": 4327 + }, + { + "epoch": 0.13, + "learning_rate": 4.869049659713577e-06, + "loss": 1.1265, + "step": 4328 + }, + { + "epoch": 0.13, + "learning_rate": 4.868971740284994e-06, + "loss": 1.0618, + "step": 4329 + }, + { + "epoch": 0.13, + "learning_rate": 4.86889379830494e-06, + "loss": 1.061, + "step": 4330 + }, + { + "epoch": 0.13, + "learning_rate": 4.8688158337741585e-06, + "loss": 1.2793, + "step": 4331 + }, + { + "epoch": 0.13, + "learning_rate": 4.868737846693391e-06, + "loss": 1.2338, + "step": 4332 + }, + { + "epoch": 0.13, + "learning_rate": 4.8686598370633805e-06, + "loss": 1.2059, + "step": 4333 + }, + { + "epoch": 0.13, + "learning_rate": 4.868581804884869e-06, + "loss": 1.0229, + "step": 4334 + }, + { + "epoch": 0.13, + "learning_rate": 4.868503750158599e-06, + "loss": 1.1354, + "step": 4335 + }, + { + "epoch": 0.13, + "learning_rate": 4.868425672885314e-06, + "loss": 1.1547, + "step": 4336 + }, + { + "epoch": 0.13, + "learning_rate": 4.868347573065758e-06, + "loss": 1.1093, + "step": 4337 + }, + { + "epoch": 0.13, + "learning_rate": 4.868269450700673e-06, + "loss": 1.1501, + "step": 4338 + }, + { + "epoch": 0.13, + "learning_rate": 4.868191305790803e-06, + "loss": 1.1541, + "step": 4339 + }, + { + "epoch": 0.13, + "learning_rate": 4.868113138336893e-06, + "loss": 1.1568, + "step": 4340 + }, + { + "epoch": 0.13, + "learning_rate": 4.868034948339686e-06, + "loss": 1.1688, + "step": 4341 + }, + { + "epoch": 0.13, + "learning_rate": 4.867956735799928e-06, + "loss": 1.169, + "step": 4342 + }, + { + "epoch": 0.13, + "learning_rate": 4.867878500718362e-06, + "loss": 1.1708, + "step": 4343 + }, + { + "epoch": 0.13, + "learning_rate": 4.867800243095732e-06, + "loss": 1.2352, + "step": 4344 + }, + { + "epoch": 0.13, + "learning_rate": 4.867721962932785e-06, + "loss": 1.2202, + "step": 4345 + }, + { + "epoch": 0.13, + "learning_rate": 4.867643660230264e-06, + "loss": 1.0713, + "step": 4346 + }, + { + "epoch": 0.13, + "learning_rate": 4.8675653349889165e-06, + "loss": 1.1041, + "step": 4347 + }, + { + "epoch": 0.13, + "learning_rate": 4.867486987209487e-06, + "loss": 1.2094, + "step": 4348 + }, + { + "epoch": 0.13, + "learning_rate": 4.867408616892723e-06, + "loss": 1.1517, + "step": 4349 + }, + { + "epoch": 0.13, + "learning_rate": 4.867330224039367e-06, + "loss": 1.2734, + "step": 4350 + }, + { + "epoch": 0.13, + "learning_rate": 4.867251808650169e-06, + "loss": 1.171, + "step": 4351 + }, + { + "epoch": 0.13, + "learning_rate": 4.867173370725873e-06, + "loss": 1.1459, + "step": 4352 + }, + { + "epoch": 0.13, + "learning_rate": 4.867094910267227e-06, + "loss": 1.0267, + "step": 4353 + }, + { + "epoch": 0.13, + "learning_rate": 4.867016427274978e-06, + "loss": 1.1841, + "step": 4354 + }, + { + "epoch": 0.13, + "learning_rate": 4.866937921749871e-06, + "loss": 1.2458, + "step": 4355 + }, + { + "epoch": 0.13, + "learning_rate": 4.8668593936926564e-06, + "loss": 1.2236, + "step": 4356 + }, + { + "epoch": 0.13, + "learning_rate": 4.86678084310408e-06, + "loss": 1.1877, + "step": 4357 + }, + { + "epoch": 0.13, + "learning_rate": 4.86670226998489e-06, + "loss": 1.1205, + "step": 4358 + }, + { + "epoch": 0.13, + "learning_rate": 4.8666236743358336e-06, + "loss": 1.1273, + "step": 4359 + }, + { + "epoch": 0.13, + "learning_rate": 4.86654505615766e-06, + "loss": 1.188, + "step": 4360 + }, + { + "epoch": 0.13, + "learning_rate": 4.866466415451117e-06, + "loss": 1.1445, + "step": 4361 + }, + { + "epoch": 0.13, + "learning_rate": 4.866387752216953e-06, + "loss": 1.0806, + "step": 4362 + }, + { + "epoch": 0.13, + "learning_rate": 4.866309066455919e-06, + "loss": 1.1771, + "step": 4363 + }, + { + "epoch": 0.13, + "learning_rate": 4.866230358168761e-06, + "loss": 1.2717, + "step": 4364 + }, + { + "epoch": 0.13, + "learning_rate": 4.86615162735623e-06, + "loss": 1.0381, + "step": 4365 + }, + { + "epoch": 0.13, + "learning_rate": 4.866072874019075e-06, + "loss": 1.2195, + "step": 4366 + }, + { + "epoch": 0.13, + "learning_rate": 4.865994098158045e-06, + "loss": 1.3088, + "step": 4367 + }, + { + "epoch": 0.13, + "learning_rate": 4.8659152997738925e-06, + "loss": 1.2476, + "step": 4368 + }, + { + "epoch": 0.13, + "learning_rate": 4.865836478867364e-06, + "loss": 1.0562, + "step": 4369 + }, + { + "epoch": 0.13, + "learning_rate": 4.865757635439212e-06, + "loss": 1.1572, + "step": 4370 + }, + { + "epoch": 0.13, + "learning_rate": 4.8656787694901875e-06, + "loss": 1.1261, + "step": 4371 + }, + { + "epoch": 0.13, + "learning_rate": 4.865599881021041e-06, + "loss": 1.1317, + "step": 4372 + }, + { + "epoch": 0.13, + "learning_rate": 4.865520970032521e-06, + "loss": 1.2618, + "step": 4373 + }, + { + "epoch": 0.13, + "learning_rate": 4.865442036525382e-06, + "loss": 1.1238, + "step": 4374 + }, + { + "epoch": 0.13, + "learning_rate": 4.865363080500374e-06, + "loss": 1.2998, + "step": 4375 + }, + { + "epoch": 0.13, + "learning_rate": 4.865284101958247e-06, + "loss": 1.1365, + "step": 4376 + }, + { + "epoch": 0.13, + "learning_rate": 4.865205100899757e-06, + "loss": 1.2214, + "step": 4377 + }, + { + "epoch": 0.13, + "learning_rate": 4.865126077325653e-06, + "loss": 1.1031, + "step": 4378 + }, + { + "epoch": 0.13, + "learning_rate": 4.8650470312366865e-06, + "loss": 1.1521, + "step": 4379 + }, + { + "epoch": 0.13, + "learning_rate": 4.8649679626336125e-06, + "loss": 1.2234, + "step": 4380 + }, + { + "epoch": 0.13, + "learning_rate": 4.864888871517182e-06, + "loss": 1.1211, + "step": 4381 + }, + { + "epoch": 0.13, + "learning_rate": 4.864809757888148e-06, + "loss": 1.2388, + "step": 4382 + }, + { + "epoch": 0.13, + "learning_rate": 4.8647306217472645e-06, + "loss": 1.2335, + "step": 4383 + }, + { + "epoch": 0.13, + "learning_rate": 4.8646514630952844e-06, + "loss": 1.1469, + "step": 4384 + }, + { + "epoch": 0.13, + "learning_rate": 4.864572281932961e-06, + "loss": 1.1099, + "step": 4385 + }, + { + "epoch": 0.13, + "learning_rate": 4.864493078261049e-06, + "loss": 1.1835, + "step": 4386 + }, + { + "epoch": 0.13, + "learning_rate": 4.864413852080301e-06, + "loss": 1.2098, + "step": 4387 + }, + { + "epoch": 0.13, + "learning_rate": 4.864334603391472e-06, + "loss": 1.1459, + "step": 4388 + }, + { + "epoch": 0.13, + "learning_rate": 4.864255332195316e-06, + "loss": 1.1667, + "step": 4389 + }, + { + "epoch": 0.13, + "learning_rate": 4.864176038492588e-06, + "loss": 1.1063, + "step": 4390 + }, + { + "epoch": 0.13, + "learning_rate": 4.8640967222840435e-06, + "loss": 1.0739, + "step": 4391 + }, + { + "epoch": 0.13, + "learning_rate": 4.8640173835704364e-06, + "loss": 1.1476, + "step": 4392 + }, + { + "epoch": 0.13, + "learning_rate": 4.863938022352523e-06, + "loss": 1.0921, + "step": 4393 + }, + { + "epoch": 0.13, + "learning_rate": 4.863858638631057e-06, + "loss": 1.1912, + "step": 4394 + }, + { + "epoch": 0.13, + "learning_rate": 4.863779232406795e-06, + "loss": 1.0609, + "step": 4395 + }, + { + "epoch": 0.13, + "learning_rate": 4.8636998036804935e-06, + "loss": 1.1083, + "step": 4396 + }, + { + "epoch": 0.13, + "learning_rate": 4.863620352452909e-06, + "loss": 1.0875, + "step": 4397 + }, + { + "epoch": 0.13, + "learning_rate": 4.863540878724796e-06, + "loss": 1.1307, + "step": 4398 + }, + { + "epoch": 0.13, + "learning_rate": 4.8634613824969136e-06, + "loss": 1.1304, + "step": 4399 + }, + { + "epoch": 0.13, + "learning_rate": 4.8633818637700155e-06, + "loss": 1.3147, + "step": 4400 + }, + { + "epoch": 0.13, + "learning_rate": 4.863302322544862e-06, + "loss": 1.158, + "step": 4401 + }, + { + "epoch": 0.13, + "learning_rate": 4.863222758822207e-06, + "loss": 1.1403, + "step": 4402 + }, + { + "epoch": 0.13, + "learning_rate": 4.86314317260281e-06, + "loss": 1.1918, + "step": 4403 + }, + { + "epoch": 0.13, + "learning_rate": 4.863063563887428e-06, + "loss": 1.1551, + "step": 4404 + }, + { + "epoch": 0.13, + "learning_rate": 4.8629839326768196e-06, + "loss": 1.2122, + "step": 4405 + }, + { + "epoch": 0.13, + "learning_rate": 4.862904278971742e-06, + "loss": 1.1533, + "step": 4406 + }, + { + "epoch": 0.13, + "learning_rate": 4.8628246027729535e-06, + "loss": 1.1146, + "step": 4407 + }, + { + "epoch": 0.13, + "learning_rate": 4.862744904081213e-06, + "loss": 1.1183, + "step": 4408 + }, + { + "epoch": 0.13, + "learning_rate": 4.862665182897279e-06, + "loss": 1.0953, + "step": 4409 + }, + { + "epoch": 0.13, + "learning_rate": 4.86258543922191e-06, + "loss": 1.0938, + "step": 4410 + }, + { + "epoch": 0.13, + "learning_rate": 4.862505673055865e-06, + "loss": 1.0783, + "step": 4411 + }, + { + "epoch": 0.13, + "learning_rate": 4.862425884399905e-06, + "loss": 1.1389, + "step": 4412 + }, + { + "epoch": 0.13, + "learning_rate": 4.862346073254788e-06, + "loss": 1.0842, + "step": 4413 + }, + { + "epoch": 0.13, + "learning_rate": 4.862266239621274e-06, + "loss": 1.1564, + "step": 4414 + }, + { + "epoch": 0.13, + "learning_rate": 4.862186383500123e-06, + "loss": 1.1534, + "step": 4415 + }, + { + "epoch": 0.13, + "learning_rate": 4.8621065048920946e-06, + "loss": 1.0572, + "step": 4416 + }, + { + "epoch": 0.13, + "learning_rate": 4.862026603797951e-06, + "loss": 1.1417, + "step": 4417 + }, + { + "epoch": 0.13, + "learning_rate": 4.861946680218451e-06, + "loss": 1.2007, + "step": 4418 + }, + { + "epoch": 0.13, + "learning_rate": 4.861866734154357e-06, + "loss": 1.0721, + "step": 4419 + }, + { + "epoch": 0.13, + "learning_rate": 4.861786765606428e-06, + "loss": 1.1708, + "step": 4420 + }, + { + "epoch": 0.13, + "learning_rate": 4.861706774575427e-06, + "loss": 1.2415, + "step": 4421 + }, + { + "epoch": 0.13, + "learning_rate": 4.861626761062116e-06, + "loss": 1.2106, + "step": 4422 + }, + { + "epoch": 0.13, + "learning_rate": 4.861546725067254e-06, + "loss": 1.1274, + "step": 4423 + }, + { + "epoch": 0.13, + "learning_rate": 4.861466666591606e-06, + "loss": 1.2128, + "step": 4424 + }, + { + "epoch": 0.13, + "learning_rate": 4.861386585635932e-06, + "loss": 1.0771, + "step": 4425 + }, + { + "epoch": 0.13, + "learning_rate": 4.861306482200995e-06, + "loss": 1.2227, + "step": 4426 + }, + { + "epoch": 0.13, + "learning_rate": 4.861226356287557e-06, + "loss": 1.23, + "step": 4427 + }, + { + "epoch": 0.13, + "learning_rate": 4.8611462078963814e-06, + "loss": 1.1675, + "step": 4428 + }, + { + "epoch": 0.13, + "learning_rate": 4.861066037028231e-06, + "loss": 1.1146, + "step": 4429 + }, + { + "epoch": 0.13, + "learning_rate": 4.86098584368387e-06, + "loss": 1.2224, + "step": 4430 + }, + { + "epoch": 0.13, + "learning_rate": 4.8609056278640605e-06, + "loss": 1.1702, + "step": 4431 + }, + { + "epoch": 0.13, + "learning_rate": 4.860825389569566e-06, + "loss": 1.1829, + "step": 4432 + }, + { + "epoch": 0.13, + "learning_rate": 4.860745128801152e-06, + "loss": 1.1731, + "step": 4433 + }, + { + "epoch": 0.13, + "learning_rate": 4.86066484555958e-06, + "loss": 1.1046, + "step": 4434 + }, + { + "epoch": 0.13, + "learning_rate": 4.8605845398456155e-06, + "loss": 1.2226, + "step": 4435 + }, + { + "epoch": 0.13, + "learning_rate": 4.860504211660025e-06, + "loss": 1.1555, + "step": 4436 + }, + { + "epoch": 0.13, + "learning_rate": 4.8604238610035695e-06, + "loss": 1.1956, + "step": 4437 + }, + { + "epoch": 0.13, + "learning_rate": 4.860343487877016e-06, + "loss": 1.1645, + "step": 4438 + }, + { + "epoch": 0.13, + "learning_rate": 4.860263092281129e-06, + "loss": 1.0587, + "step": 4439 + }, + { + "epoch": 0.13, + "learning_rate": 4.8601826742166745e-06, + "loss": 1.0851, + "step": 4440 + }, + { + "epoch": 0.13, + "learning_rate": 4.860102233684417e-06, + "loss": 1.2218, + "step": 4441 + }, + { + "epoch": 0.13, + "learning_rate": 4.8600217706851235e-06, + "loss": 1.215, + "step": 4442 + }, + { + "epoch": 0.13, + "learning_rate": 4.859941285219559e-06, + "loss": 1.1956, + "step": 4443 + }, + { + "epoch": 0.13, + "learning_rate": 4.859860777288491e-06, + "loss": 1.1282, + "step": 4444 + }, + { + "epoch": 0.13, + "learning_rate": 4.859780246892685e-06, + "loss": 1.1178, + "step": 4445 + }, + { + "epoch": 0.13, + "learning_rate": 4.8596996940329066e-06, + "loss": 1.2142, + "step": 4446 + }, + { + "epoch": 0.13, + "learning_rate": 4.859619118709924e-06, + "loss": 1.2581, + "step": 4447 + }, + { + "epoch": 0.13, + "learning_rate": 4.859538520924503e-06, + "loss": 1.1049, + "step": 4448 + }, + { + "epoch": 0.13, + "learning_rate": 4.859457900677413e-06, + "loss": 1.0324, + "step": 4449 + }, + { + "epoch": 0.13, + "learning_rate": 4.8593772579694195e-06, + "loss": 1.1653, + "step": 4450 + }, + { + "epoch": 0.13, + "learning_rate": 4.85929659280129e-06, + "loss": 1.1837, + "step": 4451 + }, + { + "epoch": 0.13, + "learning_rate": 4.859215905173795e-06, + "loss": 1.094, + "step": 4452 + }, + { + "epoch": 0.13, + "learning_rate": 4.8591351950877e-06, + "loss": 1.0591, + "step": 4453 + }, + { + "epoch": 0.13, + "learning_rate": 4.859054462543774e-06, + "loss": 1.1578, + "step": 4454 + }, + { + "epoch": 0.13, + "learning_rate": 4.8589737075427855e-06, + "loss": 1.2335, + "step": 4455 + }, + { + "epoch": 0.13, + "learning_rate": 4.8588929300855035e-06, + "loss": 1.0969, + "step": 4456 + }, + { + "epoch": 0.13, + "learning_rate": 4.858812130172697e-06, + "loss": 1.2515, + "step": 4457 + }, + { + "epoch": 0.13, + "learning_rate": 4.858731307805135e-06, + "loss": 1.1943, + "step": 4458 + }, + { + "epoch": 0.13, + "learning_rate": 4.858650462983587e-06, + "loss": 1.1165, + "step": 4459 + }, + { + "epoch": 0.13, + "learning_rate": 4.858569595708823e-06, + "loss": 1.015, + "step": 4460 + }, + { + "epoch": 0.13, + "learning_rate": 4.858488705981611e-06, + "loss": 1.1122, + "step": 4461 + }, + { + "epoch": 0.13, + "learning_rate": 4.858407793802724e-06, + "loss": 1.3078, + "step": 4462 + }, + { + "epoch": 0.13, + "learning_rate": 4.85832685917293e-06, + "loss": 1.1641, + "step": 4463 + }, + { + "epoch": 0.13, + "learning_rate": 4.858245902093e-06, + "loss": 1.2344, + "step": 4464 + }, + { + "epoch": 0.13, + "learning_rate": 4.8581649225637055e-06, + "loss": 1.1028, + "step": 4465 + }, + { + "epoch": 0.13, + "learning_rate": 4.858083920585816e-06, + "loss": 1.1988, + "step": 4466 + }, + { + "epoch": 0.13, + "learning_rate": 4.858002896160103e-06, + "loss": 1.2279, + "step": 4467 + }, + { + "epoch": 0.13, + "learning_rate": 4.857921849287338e-06, + "loss": 1.2271, + "step": 4468 + }, + { + "epoch": 0.13, + "learning_rate": 4.8578407799682935e-06, + "loss": 1.179, + "step": 4469 + }, + { + "epoch": 0.13, + "learning_rate": 4.85775968820374e-06, + "loss": 1.103, + "step": 4470 + }, + { + "epoch": 0.13, + "learning_rate": 4.85767857399445e-06, + "loss": 1.1883, + "step": 4471 + }, + { + "epoch": 0.13, + "learning_rate": 4.857597437341195e-06, + "loss": 1.0715, + "step": 4472 + }, + { + "epoch": 0.13, + "learning_rate": 4.857516278244748e-06, + "loss": 1.0488, + "step": 4473 + }, + { + "epoch": 0.13, + "learning_rate": 4.857435096705881e-06, + "loss": 1.249, + "step": 4474 + }, + { + "epoch": 0.13, + "learning_rate": 4.857353892725368e-06, + "loss": 1.2477, + "step": 4475 + }, + { + "epoch": 0.13, + "learning_rate": 4.8572726663039804e-06, + "loss": 1.1991, + "step": 4476 + }, + { + "epoch": 0.13, + "learning_rate": 4.857191417442493e-06, + "loss": 1.0495, + "step": 4477 + }, + { + "epoch": 0.13, + "learning_rate": 4.85711014614168e-06, + "loss": 1.1307, + "step": 4478 + }, + { + "epoch": 0.13, + "learning_rate": 4.857028852402311e-06, + "loss": 1.1925, + "step": 4479 + }, + { + "epoch": 0.13, + "learning_rate": 4.856947536225164e-06, + "loss": 1.193, + "step": 4480 + }, + { + "epoch": 0.13, + "learning_rate": 4.856866197611011e-06, + "loss": 1.14, + "step": 4481 + }, + { + "epoch": 0.14, + "learning_rate": 4.856784836560628e-06, + "loss": 1.1475, + "step": 4482 + }, + { + "epoch": 0.14, + "learning_rate": 4.856703453074787e-06, + "loss": 1.2462, + "step": 4483 + }, + { + "epoch": 0.14, + "learning_rate": 4.8566220471542644e-06, + "loss": 1.1172, + "step": 4484 + }, + { + "epoch": 0.14, + "learning_rate": 4.856540618799835e-06, + "loss": 1.1169, + "step": 4485 + }, + { + "epoch": 0.14, + "learning_rate": 4.8564591680122745e-06, + "loss": 1.0383, + "step": 4486 + }, + { + "epoch": 0.14, + "learning_rate": 4.8563776947923565e-06, + "loss": 1.1865, + "step": 4487 + }, + { + "epoch": 0.14, + "learning_rate": 4.856296199140859e-06, + "loss": 1.1556, + "step": 4488 + }, + { + "epoch": 0.14, + "learning_rate": 4.856214681058555e-06, + "loss": 1.0911, + "step": 4489 + }, + { + "epoch": 0.14, + "learning_rate": 4.856133140546224e-06, + "loss": 1.1274, + "step": 4490 + }, + { + "epoch": 0.14, + "learning_rate": 4.856051577604639e-06, + "loss": 1.2029, + "step": 4491 + }, + { + "epoch": 0.14, + "learning_rate": 4.855969992234578e-06, + "loss": 1.1223, + "step": 4492 + }, + { + "epoch": 0.14, + "learning_rate": 4.855888384436817e-06, + "loss": 1.2188, + "step": 4493 + }, + { + "epoch": 0.14, + "learning_rate": 4.855806754212133e-06, + "loss": 1.0975, + "step": 4494 + }, + { + "epoch": 0.14, + "learning_rate": 4.8557251015613044e-06, + "loss": 1.1149, + "step": 4495 + }, + { + "epoch": 0.14, + "learning_rate": 4.855643426485106e-06, + "loss": 1.2118, + "step": 4496 + }, + { + "epoch": 0.14, + "learning_rate": 4.855561728984318e-06, + "loss": 1.1785, + "step": 4497 + }, + { + "epoch": 0.14, + "learning_rate": 4.855480009059717e-06, + "loss": 1.167, + "step": 4498 + }, + { + "epoch": 0.14, + "learning_rate": 4.855398266712079e-06, + "loss": 1.2798, + "step": 4499 + }, + { + "epoch": 0.14, + "learning_rate": 4.855316501942186e-06, + "loss": 1.0911, + "step": 4500 + }, + { + "epoch": 0.14, + "learning_rate": 4.855234714750813e-06, + "loss": 1.2394, + "step": 4501 + }, + { + "epoch": 0.14, + "learning_rate": 4.85515290513874e-06, + "loss": 1.1573, + "step": 4502 + }, + { + "epoch": 0.14, + "learning_rate": 4.8550710731067455e-06, + "loss": 1.1541, + "step": 4503 + }, + { + "epoch": 0.14, + "learning_rate": 4.854989218655608e-06, + "loss": 1.0721, + "step": 4504 + }, + { + "epoch": 0.14, + "learning_rate": 4.8549073417861086e-06, + "loss": 1.0446, + "step": 4505 + }, + { + "epoch": 0.14, + "learning_rate": 4.854825442499025e-06, + "loss": 1.1684, + "step": 4506 + }, + { + "epoch": 0.14, + "learning_rate": 4.8547435207951375e-06, + "loss": 1.0671, + "step": 4507 + }, + { + "epoch": 0.14, + "learning_rate": 4.854661576675226e-06, + "loss": 1.1356, + "step": 4508 + }, + { + "epoch": 0.14, + "learning_rate": 4.854579610140069e-06, + "loss": 1.1547, + "step": 4509 + }, + { + "epoch": 0.14, + "learning_rate": 4.854497621190449e-06, + "loss": 1.2061, + "step": 4510 + }, + { + "epoch": 0.14, + "learning_rate": 4.854415609827145e-06, + "loss": 1.2162, + "step": 4511 + }, + { + "epoch": 0.14, + "learning_rate": 4.854333576050941e-06, + "loss": 1.2155, + "step": 4512 + }, + { + "epoch": 0.14, + "learning_rate": 4.854251519862612e-06, + "loss": 1.1639, + "step": 4513 + }, + { + "epoch": 0.14, + "learning_rate": 4.854169441262944e-06, + "loss": 1.1675, + "step": 4514 + }, + { + "epoch": 0.14, + "learning_rate": 4.854087340252716e-06, + "loss": 1.1663, + "step": 4515 + }, + { + "epoch": 0.14, + "learning_rate": 4.85400521683271e-06, + "loss": 1.17, + "step": 4516 + }, + { + "epoch": 0.14, + "learning_rate": 4.853923071003709e-06, + "loss": 1.1302, + "step": 4517 + }, + { + "epoch": 0.14, + "learning_rate": 4.853840902766493e-06, + "loss": 1.1697, + "step": 4518 + }, + { + "epoch": 0.14, + "learning_rate": 4.853758712121847e-06, + "loss": 1.1408, + "step": 4519 + }, + { + "epoch": 0.14, + "learning_rate": 4.85367649907055e-06, + "loss": 1.1485, + "step": 4520 + }, + { + "epoch": 0.14, + "learning_rate": 4.853594263613387e-06, + "loss": 1.1588, + "step": 4521 + }, + { + "epoch": 0.14, + "learning_rate": 4.85351200575114e-06, + "loss": 1.16, + "step": 4522 + }, + { + "epoch": 0.14, + "learning_rate": 4.853429725484593e-06, + "loss": 1.14, + "step": 4523 + }, + { + "epoch": 0.14, + "learning_rate": 4.853347422814527e-06, + "loss": 1.2196, + "step": 4524 + }, + { + "epoch": 0.14, + "learning_rate": 4.853265097741728e-06, + "loss": 1.269, + "step": 4525 + }, + { + "epoch": 0.14, + "learning_rate": 4.853182750266978e-06, + "loss": 1.2081, + "step": 4526 + }, + { + "epoch": 0.14, + "learning_rate": 4.853100380391062e-06, + "loss": 1.059, + "step": 4527 + }, + { + "epoch": 0.14, + "learning_rate": 4.853017988114763e-06, + "loss": 1.0627, + "step": 4528 + }, + { + "epoch": 0.14, + "learning_rate": 4.852935573438867e-06, + "loss": 1.1443, + "step": 4529 + }, + { + "epoch": 0.14, + "learning_rate": 4.852853136364157e-06, + "loss": 1.1971, + "step": 4530 + }, + { + "epoch": 0.14, + "learning_rate": 4.852770676891419e-06, + "loss": 1.2297, + "step": 4531 + }, + { + "epoch": 0.14, + "learning_rate": 4.8526881950214365e-06, + "loss": 1.1468, + "step": 4532 + }, + { + "epoch": 0.14, + "learning_rate": 4.852605690754996e-06, + "loss": 1.1337, + "step": 4533 + }, + { + "epoch": 0.14, + "learning_rate": 4.852523164092882e-06, + "loss": 1.0554, + "step": 4534 + }, + { + "epoch": 0.14, + "learning_rate": 4.85244061503588e-06, + "loss": 1.1623, + "step": 4535 + }, + { + "epoch": 0.14, + "learning_rate": 4.852358043584777e-06, + "loss": 1.1996, + "step": 4536 + }, + { + "epoch": 0.14, + "learning_rate": 4.852275449740358e-06, + "loss": 1.0795, + "step": 4537 + }, + { + "epoch": 0.14, + "learning_rate": 4.85219283350341e-06, + "loss": 1.0931, + "step": 4538 + }, + { + "epoch": 0.14, + "learning_rate": 4.852110194874718e-06, + "loss": 1.2065, + "step": 4539 + }, + { + "epoch": 0.14, + "learning_rate": 4.852027533855071e-06, + "loss": 1.1219, + "step": 4540 + }, + { + "epoch": 0.14, + "learning_rate": 4.851944850445255e-06, + "loss": 1.0545, + "step": 4541 + }, + { + "epoch": 0.14, + "learning_rate": 4.851862144646056e-06, + "loss": 1.117, + "step": 4542 + }, + { + "epoch": 0.14, + "learning_rate": 4.851779416458262e-06, + "loss": 1.1876, + "step": 4543 + }, + { + "epoch": 0.14, + "learning_rate": 4.8516966658826606e-06, + "loss": 1.1403, + "step": 4544 + }, + { + "epoch": 0.14, + "learning_rate": 4.85161389292004e-06, + "loss": 1.1381, + "step": 4545 + }, + { + "epoch": 0.14, + "learning_rate": 4.851531097571187e-06, + "loss": 1.0685, + "step": 4546 + }, + { + "epoch": 0.14, + "learning_rate": 4.851448279836891e-06, + "loss": 1.0857, + "step": 4547 + }, + { + "epoch": 0.14, + "learning_rate": 4.8513654397179396e-06, + "loss": 1.1257, + "step": 4548 + }, + { + "epoch": 0.14, + "learning_rate": 4.851282577215122e-06, + "loss": 1.1656, + "step": 4549 + }, + { + "epoch": 0.14, + "learning_rate": 4.851199692329227e-06, + "loss": 1.1296, + "step": 4550 + }, + { + "epoch": 0.14, + "learning_rate": 4.8511167850610425e-06, + "loss": 1.1892, + "step": 4551 + }, + { + "epoch": 0.14, + "learning_rate": 4.851033855411359e-06, + "loss": 1.1102, + "step": 4552 + }, + { + "epoch": 0.14, + "learning_rate": 4.850950903380965e-06, + "loss": 1.2155, + "step": 4553 + }, + { + "epoch": 0.14, + "learning_rate": 4.850867928970651e-06, + "loss": 1.1611, + "step": 4554 + }, + { + "epoch": 0.14, + "learning_rate": 4.850784932181207e-06, + "loss": 1.1148, + "step": 4555 + }, + { + "epoch": 0.14, + "learning_rate": 4.850701913013422e-06, + "loss": 1.2123, + "step": 4556 + }, + { + "epoch": 0.14, + "learning_rate": 4.850618871468087e-06, + "loss": 1.1778, + "step": 4557 + }, + { + "epoch": 0.14, + "learning_rate": 4.850535807545993e-06, + "loss": 1.1731, + "step": 4558 + }, + { + "epoch": 0.14, + "learning_rate": 4.850452721247929e-06, + "loss": 1.1116, + "step": 4559 + }, + { + "epoch": 0.14, + "learning_rate": 4.850369612574688e-06, + "loss": 1.1765, + "step": 4560 + }, + { + "epoch": 0.14, + "learning_rate": 4.85028648152706e-06, + "loss": 1.2401, + "step": 4561 + }, + { + "epoch": 0.14, + "learning_rate": 4.850203328105837e-06, + "loss": 1.1722, + "step": 4562 + }, + { + "epoch": 0.14, + "learning_rate": 4.85012015231181e-06, + "loss": 1.1832, + "step": 4563 + }, + { + "epoch": 0.14, + "learning_rate": 4.850036954145771e-06, + "loss": 1.049, + "step": 4564 + }, + { + "epoch": 0.14, + "learning_rate": 4.849953733608513e-06, + "loss": 1.1373, + "step": 4565 + }, + { + "epoch": 0.14, + "learning_rate": 4.849870490700825e-06, + "loss": 1.1456, + "step": 4566 + }, + { + "epoch": 0.14, + "learning_rate": 4.849787225423503e-06, + "loss": 1.1874, + "step": 4567 + }, + { + "epoch": 0.14, + "learning_rate": 4.849703937777338e-06, + "loss": 1.1349, + "step": 4568 + }, + { + "epoch": 0.14, + "learning_rate": 4.849620627763124e-06, + "loss": 1.0482, + "step": 4569 + }, + { + "epoch": 0.14, + "learning_rate": 4.849537295381652e-06, + "loss": 1.1722, + "step": 4570 + }, + { + "epoch": 0.14, + "learning_rate": 4.849453940633717e-06, + "loss": 1.1907, + "step": 4571 + }, + { + "epoch": 0.14, + "learning_rate": 4.849370563520113e-06, + "loss": 1.0673, + "step": 4572 + }, + { + "epoch": 0.14, + "learning_rate": 4.849287164041632e-06, + "loss": 1.0638, + "step": 4573 + }, + { + "epoch": 0.14, + "learning_rate": 4.8492037421990675e-06, + "loss": 1.1, + "step": 4574 + }, + { + "epoch": 0.14, + "learning_rate": 4.8491202979932166e-06, + "loss": 1.1943, + "step": 4575 + }, + { + "epoch": 0.14, + "learning_rate": 4.84903683142487e-06, + "loss": 1.1882, + "step": 4576 + }, + { + "epoch": 0.14, + "learning_rate": 4.848953342494826e-06, + "loss": 1.1903, + "step": 4577 + }, + { + "epoch": 0.14, + "learning_rate": 4.848869831203876e-06, + "loss": 1.1727, + "step": 4578 + }, + { + "epoch": 0.14, + "learning_rate": 4.8487862975528175e-06, + "loss": 1.1646, + "step": 4579 + }, + { + "epoch": 0.14, + "learning_rate": 4.8487027415424445e-06, + "loss": 1.2112, + "step": 4580 + }, + { + "epoch": 0.14, + "learning_rate": 4.848619163173553e-06, + "loss": 1.2888, + "step": 4581 + }, + { + "epoch": 0.14, + "learning_rate": 4.848535562446936e-06, + "loss": 1.0527, + "step": 4582 + }, + { + "epoch": 0.14, + "learning_rate": 4.848451939363394e-06, + "loss": 1.2606, + "step": 4583 + }, + { + "epoch": 0.14, + "learning_rate": 4.848368293923719e-06, + "loss": 1.1068, + "step": 4584 + }, + { + "epoch": 0.14, + "learning_rate": 4.84828462612871e-06, + "loss": 1.0586, + "step": 4585 + }, + { + "epoch": 0.14, + "learning_rate": 4.848200935979162e-06, + "loss": 1.0558, + "step": 4586 + }, + { + "epoch": 0.14, + "learning_rate": 4.848117223475871e-06, + "loss": 1.2033, + "step": 4587 + }, + { + "epoch": 0.14, + "learning_rate": 4.848033488619636e-06, + "loss": 1.1409, + "step": 4588 + }, + { + "epoch": 0.14, + "learning_rate": 4.847949731411253e-06, + "loss": 1.1364, + "step": 4589 + }, + { + "epoch": 0.14, + "learning_rate": 4.847865951851519e-06, + "loss": 1.1799, + "step": 4590 + }, + { + "epoch": 0.14, + "learning_rate": 4.847782149941232e-06, + "loss": 1.0159, + "step": 4591 + }, + { + "epoch": 0.14, + "learning_rate": 4.847698325681191e-06, + "loss": 1.0638, + "step": 4592 + }, + { + "epoch": 0.14, + "learning_rate": 4.847614479072191e-06, + "loss": 1.2903, + "step": 4593 + }, + { + "epoch": 0.14, + "learning_rate": 4.847530610115032e-06, + "loss": 1.2347, + "step": 4594 + }, + { + "epoch": 0.14, + "learning_rate": 4.847446718810512e-06, + "loss": 1.2391, + "step": 4595 + }, + { + "epoch": 0.14, + "learning_rate": 4.84736280515943e-06, + "loss": 1.2117, + "step": 4596 + }, + { + "epoch": 0.14, + "learning_rate": 4.847278869162585e-06, + "loss": 1.109, + "step": 4597 + }, + { + "epoch": 0.14, + "learning_rate": 4.847194910820775e-06, + "loss": 1.1164, + "step": 4598 + }, + { + "epoch": 0.14, + "learning_rate": 4.8471109301348e-06, + "loss": 0.9863, + "step": 4599 + }, + { + "epoch": 0.14, + "learning_rate": 4.84702692710546e-06, + "loss": 1.1232, + "step": 4600 + }, + { + "epoch": 0.14, + "learning_rate": 4.846942901733555e-06, + "loss": 1.1487, + "step": 4601 + }, + { + "epoch": 0.14, + "learning_rate": 4.8468588540198826e-06, + "loss": 1.0565, + "step": 4602 + }, + { + "epoch": 0.14, + "learning_rate": 4.846774783965244e-06, + "loss": 1.0584, + "step": 4603 + }, + { + "epoch": 0.14, + "learning_rate": 4.84669069157044e-06, + "loss": 1.1221, + "step": 4604 + }, + { + "epoch": 0.14, + "learning_rate": 4.84660657683627e-06, + "loss": 1.1705, + "step": 4605 + }, + { + "epoch": 0.14, + "learning_rate": 4.8465224397635365e-06, + "loss": 1.2094, + "step": 4606 + }, + { + "epoch": 0.14, + "learning_rate": 4.84643828035304e-06, + "loss": 1.1038, + "step": 4607 + }, + { + "epoch": 0.14, + "learning_rate": 4.84635409860558e-06, + "loss": 1.1515, + "step": 4608 + }, + { + "epoch": 0.14, + "learning_rate": 4.84626989452196e-06, + "loss": 1.0474, + "step": 4609 + }, + { + "epoch": 0.14, + "learning_rate": 4.846185668102979e-06, + "loss": 1.1813, + "step": 4610 + }, + { + "epoch": 0.14, + "learning_rate": 4.846101419349443e-06, + "loss": 1.078, + "step": 4611 + }, + { + "epoch": 0.14, + "learning_rate": 4.84601714826215e-06, + "loss": 1.3174, + "step": 4612 + }, + { + "epoch": 0.14, + "learning_rate": 4.845932854841903e-06, + "loss": 1.015, + "step": 4613 + }, + { + "epoch": 0.14, + "learning_rate": 4.845848539089505e-06, + "loss": 1.1253, + "step": 4614 + }, + { + "epoch": 0.14, + "learning_rate": 4.845764201005759e-06, + "loss": 1.1002, + "step": 4615 + }, + { + "epoch": 0.14, + "learning_rate": 4.8456798405914685e-06, + "loss": 1.0961, + "step": 4616 + }, + { + "epoch": 0.14, + "learning_rate": 4.845595457847435e-06, + "loss": 1.2049, + "step": 4617 + }, + { + "epoch": 0.14, + "learning_rate": 4.845511052774463e-06, + "loss": 1.131, + "step": 4618 + }, + { + "epoch": 0.14, + "learning_rate": 4.845426625373355e-06, + "loss": 1.2173, + "step": 4619 + }, + { + "epoch": 0.14, + "learning_rate": 4.845342175644914e-06, + "loss": 1.1292, + "step": 4620 + }, + { + "epoch": 0.14, + "learning_rate": 4.845257703589946e-06, + "loss": 1.1774, + "step": 4621 + }, + { + "epoch": 0.14, + "learning_rate": 4.845173209209255e-06, + "loss": 1.1329, + "step": 4622 + }, + { + "epoch": 0.14, + "learning_rate": 4.845088692503644e-06, + "loss": 1.2029, + "step": 4623 + }, + { + "epoch": 0.14, + "learning_rate": 4.845004153473917e-06, + "loss": 1.0533, + "step": 4624 + }, + { + "epoch": 0.14, + "learning_rate": 4.844919592120881e-06, + "loss": 1.2843, + "step": 4625 + }, + { + "epoch": 0.14, + "learning_rate": 4.844835008445339e-06, + "loss": 1.1209, + "step": 4626 + }, + { + "epoch": 0.14, + "learning_rate": 4.844750402448098e-06, + "loss": 1.0912, + "step": 4627 + }, + { + "epoch": 0.14, + "learning_rate": 4.844665774129962e-06, + "loss": 1.1429, + "step": 4628 + }, + { + "epoch": 0.14, + "learning_rate": 4.844581123491737e-06, + "loss": 1.1408, + "step": 4629 + }, + { + "epoch": 0.14, + "learning_rate": 4.844496450534228e-06, + "loss": 1.1573, + "step": 4630 + }, + { + "epoch": 0.14, + "learning_rate": 4.8444117552582435e-06, + "loss": 1.3149, + "step": 4631 + }, + { + "epoch": 0.14, + "learning_rate": 4.844327037664588e-06, + "loss": 1.1528, + "step": 4632 + }, + { + "epoch": 0.14, + "learning_rate": 4.844242297754067e-06, + "loss": 1.2094, + "step": 4633 + }, + { + "epoch": 0.14, + "learning_rate": 4.84415753552749e-06, + "loss": 1.0944, + "step": 4634 + }, + { + "epoch": 0.14, + "learning_rate": 4.8440727509856604e-06, + "loss": 1.1196, + "step": 4635 + }, + { + "epoch": 0.14, + "learning_rate": 4.843987944129388e-06, + "loss": 1.1331, + "step": 4636 + }, + { + "epoch": 0.14, + "learning_rate": 4.8439031149594795e-06, + "loss": 1.2115, + "step": 4637 + }, + { + "epoch": 0.14, + "learning_rate": 4.843818263476742e-06, + "loss": 1.2214, + "step": 4638 + }, + { + "epoch": 0.14, + "learning_rate": 4.843733389681984e-06, + "loss": 1.2211, + "step": 4639 + }, + { + "epoch": 0.14, + "learning_rate": 4.843648493576012e-06, + "loss": 1.174, + "step": 4640 + }, + { + "epoch": 0.14, + "learning_rate": 4.843563575159635e-06, + "loss": 1.1158, + "step": 4641 + }, + { + "epoch": 0.14, + "learning_rate": 4.843478634433663e-06, + "loss": 1.1755, + "step": 4642 + }, + { + "epoch": 0.14, + "learning_rate": 4.843393671398901e-06, + "loss": 1.2777, + "step": 4643 + }, + { + "epoch": 0.14, + "learning_rate": 4.843308686056162e-06, + "loss": 1.0038, + "step": 4644 + }, + { + "epoch": 0.14, + "learning_rate": 4.843223678406252e-06, + "loss": 1.1486, + "step": 4645 + }, + { + "epoch": 0.14, + "learning_rate": 4.84313864844998e-06, + "loss": 1.0833, + "step": 4646 + }, + { + "epoch": 0.14, + "learning_rate": 4.8430535961881574e-06, + "loss": 1.1624, + "step": 4647 + }, + { + "epoch": 0.14, + "learning_rate": 4.842968521621593e-06, + "loss": 1.1196, + "step": 4648 + }, + { + "epoch": 0.14, + "learning_rate": 4.842883424751097e-06, + "loss": 1.194, + "step": 4649 + }, + { + "epoch": 0.14, + "learning_rate": 4.842798305577479e-06, + "loss": 1.2164, + "step": 4650 + }, + { + "epoch": 0.14, + "learning_rate": 4.842713164101549e-06, + "loss": 1.1694, + "step": 4651 + }, + { + "epoch": 0.14, + "learning_rate": 4.842628000324119e-06, + "loss": 1.1804, + "step": 4652 + }, + { + "epoch": 0.14, + "learning_rate": 4.842542814245997e-06, + "loss": 1.229, + "step": 4653 + }, + { + "epoch": 0.14, + "learning_rate": 4.842457605867997e-06, + "loss": 1.0774, + "step": 4654 + }, + { + "epoch": 0.14, + "learning_rate": 4.842372375190929e-06, + "loss": 1.2008, + "step": 4655 + }, + { + "epoch": 0.14, + "learning_rate": 4.842287122215603e-06, + "loss": 1.2784, + "step": 4656 + }, + { + "epoch": 0.14, + "learning_rate": 4.8422018469428325e-06, + "loss": 1.2966, + "step": 4657 + }, + { + "epoch": 0.14, + "learning_rate": 4.842116549373428e-06, + "loss": 1.1238, + "step": 4658 + }, + { + "epoch": 0.14, + "learning_rate": 4.842031229508202e-06, + "loss": 1.1004, + "step": 4659 + }, + { + "epoch": 0.14, + "learning_rate": 4.841945887347967e-06, + "loss": 1.0731, + "step": 4660 + }, + { + "epoch": 0.14, + "learning_rate": 4.841860522893534e-06, + "loss": 1.198, + "step": 4661 + }, + { + "epoch": 0.14, + "learning_rate": 4.841775136145719e-06, + "loss": 1.0816, + "step": 4662 + }, + { + "epoch": 0.14, + "learning_rate": 4.8416897271053305e-06, + "loss": 1.1332, + "step": 4663 + }, + { + "epoch": 0.14, + "learning_rate": 4.841604295773185e-06, + "loss": 1.1703, + "step": 4664 + }, + { + "epoch": 0.14, + "learning_rate": 4.841518842150092e-06, + "loss": 1.1851, + "step": 4665 + }, + { + "epoch": 0.14, + "learning_rate": 4.8414333662368694e-06, + "loss": 1.1062, + "step": 4666 + }, + { + "epoch": 0.14, + "learning_rate": 4.841347868034329e-06, + "loss": 1.2375, + "step": 4667 + }, + { + "epoch": 0.14, + "learning_rate": 4.841262347543283e-06, + "loss": 1.2281, + "step": 4668 + }, + { + "epoch": 0.14, + "learning_rate": 4.841176804764548e-06, + "loss": 1.03, + "step": 4669 + }, + { + "epoch": 0.14, + "learning_rate": 4.841091239698937e-06, + "loss": 1.1829, + "step": 4670 + }, + { + "epoch": 0.14, + "learning_rate": 4.841005652347266e-06, + "loss": 1.2353, + "step": 4671 + }, + { + "epoch": 0.14, + "learning_rate": 4.840920042710347e-06, + "loss": 1.2153, + "step": 4672 + }, + { + "epoch": 0.14, + "learning_rate": 4.840834410788998e-06, + "loss": 1.2988, + "step": 4673 + }, + { + "epoch": 0.14, + "learning_rate": 4.840748756584031e-06, + "loss": 1.309, + "step": 4674 + }, + { + "epoch": 0.14, + "learning_rate": 4.840663080096265e-06, + "loss": 1.2615, + "step": 4675 + }, + { + "epoch": 0.14, + "learning_rate": 4.840577381326513e-06, + "loss": 1.1895, + "step": 4676 + }, + { + "epoch": 0.14, + "learning_rate": 4.840491660275593e-06, + "loss": 1.1465, + "step": 4677 + }, + { + "epoch": 0.14, + "learning_rate": 4.840405916944317e-06, + "loss": 1.1753, + "step": 4678 + }, + { + "epoch": 0.14, + "learning_rate": 4.8403201513335065e-06, + "loss": 1.1925, + "step": 4679 + }, + { + "epoch": 0.14, + "learning_rate": 4.840234363443973e-06, + "loss": 1.2009, + "step": 4680 + }, + { + "epoch": 0.14, + "learning_rate": 4.840148553276537e-06, + "loss": 1.0724, + "step": 4681 + }, + { + "epoch": 0.14, + "learning_rate": 4.840062720832013e-06, + "loss": 1.1461, + "step": 4682 + }, + { + "epoch": 0.14, + "learning_rate": 4.83997686611122e-06, + "loss": 1.0833, + "step": 4683 + }, + { + "epoch": 0.14, + "learning_rate": 4.839890989114972e-06, + "loss": 1.1687, + "step": 4684 + }, + { + "epoch": 0.14, + "learning_rate": 4.83980508984409e-06, + "loss": 1.199, + "step": 4685 + }, + { + "epoch": 0.14, + "learning_rate": 4.839719168299392e-06, + "loss": 1.1369, + "step": 4686 + }, + { + "epoch": 0.14, + "learning_rate": 4.839633224481692e-06, + "loss": 1.1998, + "step": 4687 + }, + { + "epoch": 0.14, + "learning_rate": 4.839547258391812e-06, + "loss": 1.3625, + "step": 4688 + }, + { + "epoch": 0.14, + "learning_rate": 4.839461270030568e-06, + "loss": 1.1862, + "step": 4689 + }, + { + "epoch": 0.14, + "learning_rate": 4.83937525939878e-06, + "loss": 1.1451, + "step": 4690 + }, + { + "epoch": 0.14, + "learning_rate": 4.839289226497266e-06, + "loss": 1.0756, + "step": 4691 + }, + { + "epoch": 0.14, + "learning_rate": 4.839203171326845e-06, + "loss": 1.2166, + "step": 4692 + }, + { + "epoch": 0.14, + "learning_rate": 4.839117093888337e-06, + "loss": 1.1453, + "step": 4693 + }, + { + "epoch": 0.14, + "learning_rate": 4.8390309941825595e-06, + "loss": 1.1298, + "step": 4694 + }, + { + "epoch": 0.14, + "learning_rate": 4.838944872210335e-06, + "loss": 1.2223, + "step": 4695 + }, + { + "epoch": 0.14, + "learning_rate": 4.8388587279724805e-06, + "loss": 1.1928, + "step": 4696 + }, + { + "epoch": 0.14, + "learning_rate": 4.838772561469819e-06, + "loss": 1.1726, + "step": 4697 + }, + { + "epoch": 0.14, + "learning_rate": 4.838686372703168e-06, + "loss": 1.0573, + "step": 4698 + }, + { + "epoch": 0.14, + "learning_rate": 4.8386001616733495e-06, + "loss": 1.2316, + "step": 4699 + }, + { + "epoch": 0.14, + "learning_rate": 4.838513928381183e-06, + "loss": 1.0742, + "step": 4700 + }, + { + "epoch": 0.14, + "learning_rate": 4.838427672827491e-06, + "loss": 1.2354, + "step": 4701 + }, + { + "epoch": 0.14, + "learning_rate": 4.838341395013093e-06, + "loss": 1.2188, + "step": 4702 + }, + { + "epoch": 0.14, + "learning_rate": 4.838255094938811e-06, + "loss": 1.1667, + "step": 4703 + }, + { + "epoch": 0.14, + "learning_rate": 4.838168772605467e-06, + "loss": 1.0923, + "step": 4704 + }, + { + "epoch": 0.14, + "learning_rate": 4.8380824280138825e-06, + "loss": 1.1849, + "step": 4705 + }, + { + "epoch": 0.14, + "learning_rate": 4.837996061164879e-06, + "loss": 1.2236, + "step": 4706 + }, + { + "epoch": 0.14, + "learning_rate": 4.83790967205928e-06, + "loss": 1.1918, + "step": 4707 + }, + { + "epoch": 0.14, + "learning_rate": 4.837823260697907e-06, + "loss": 1.0723, + "step": 4708 + }, + { + "epoch": 0.14, + "learning_rate": 4.837736827081581e-06, + "loss": 1.173, + "step": 4709 + }, + { + "epoch": 0.14, + "learning_rate": 4.837650371211127e-06, + "loss": 1.2003, + "step": 4710 + }, + { + "epoch": 0.14, + "learning_rate": 4.8375638930873675e-06, + "loss": 1.1868, + "step": 4711 + }, + { + "epoch": 0.14, + "learning_rate": 4.837477392711125e-06, + "loss": 1.2026, + "step": 4712 + }, + { + "epoch": 0.14, + "learning_rate": 4.837390870083224e-06, + "loss": 1.0708, + "step": 4713 + }, + { + "epoch": 0.14, + "learning_rate": 4.837304325204488e-06, + "loss": 1.1433, + "step": 4714 + }, + { + "epoch": 0.14, + "learning_rate": 4.8372177580757394e-06, + "loss": 1.0849, + "step": 4715 + }, + { + "epoch": 0.14, + "learning_rate": 4.837131168697805e-06, + "loss": 1.085, + "step": 4716 + }, + { + "epoch": 0.14, + "learning_rate": 4.837044557071507e-06, + "loss": 1.187, + "step": 4717 + }, + { + "epoch": 0.14, + "learning_rate": 4.836957923197669e-06, + "loss": 1.2571, + "step": 4718 + }, + { + "epoch": 0.14, + "learning_rate": 4.8368712670771176e-06, + "loss": 1.2086, + "step": 4719 + }, + { + "epoch": 0.14, + "learning_rate": 4.836784588710678e-06, + "loss": 1.1207, + "step": 4720 + }, + { + "epoch": 0.14, + "learning_rate": 4.836697888099175e-06, + "loss": 1.1705, + "step": 4721 + }, + { + "epoch": 0.14, + "learning_rate": 4.836611165243432e-06, + "loss": 1.1424, + "step": 4722 + }, + { + "epoch": 0.14, + "learning_rate": 4.836524420144276e-06, + "loss": 1.1302, + "step": 4723 + }, + { + "epoch": 0.14, + "learning_rate": 4.836437652802534e-06, + "loss": 1.1801, + "step": 4724 + }, + { + "epoch": 0.14, + "learning_rate": 4.83635086321903e-06, + "loss": 1.1849, + "step": 4725 + }, + { + "epoch": 0.14, + "learning_rate": 4.836264051394592e-06, + "loss": 1.1172, + "step": 4726 + }, + { + "epoch": 0.14, + "learning_rate": 4.836177217330045e-06, + "loss": 1.1988, + "step": 4727 + }, + { + "epoch": 0.14, + "learning_rate": 4.836090361026216e-06, + "loss": 1.1881, + "step": 4728 + }, + { + "epoch": 0.14, + "learning_rate": 4.836003482483931e-06, + "loss": 1.1401, + "step": 4729 + }, + { + "epoch": 0.14, + "learning_rate": 4.835916581704019e-06, + "loss": 1.1794, + "step": 4730 + }, + { + "epoch": 0.14, + "learning_rate": 4.8358296586873056e-06, + "loss": 1.136, + "step": 4731 + }, + { + "epoch": 0.14, + "learning_rate": 4.835742713434619e-06, + "loss": 1.1617, + "step": 4732 + }, + { + "epoch": 0.14, + "learning_rate": 4.835655745946787e-06, + "loss": 1.0214, + "step": 4733 + }, + { + "epoch": 0.14, + "learning_rate": 4.835568756224636e-06, + "loss": 1.2534, + "step": 4734 + }, + { + "epoch": 0.14, + "learning_rate": 4.835481744268996e-06, + "loss": 1.2228, + "step": 4735 + }, + { + "epoch": 0.14, + "learning_rate": 4.835394710080695e-06, + "loss": 1.1185, + "step": 4736 + }, + { + "epoch": 0.14, + "learning_rate": 4.835307653660561e-06, + "loss": 1.0853, + "step": 4737 + }, + { + "epoch": 0.14, + "learning_rate": 4.835220575009423e-06, + "loss": 1.1703, + "step": 4738 + }, + { + "epoch": 0.14, + "learning_rate": 4.835133474128109e-06, + "loss": 1.1093, + "step": 4739 + }, + { + "epoch": 0.14, + "learning_rate": 4.835046351017449e-06, + "loss": 1.1158, + "step": 4740 + }, + { + "epoch": 0.14, + "learning_rate": 4.834959205678273e-06, + "loss": 1.0523, + "step": 4741 + }, + { + "epoch": 0.14, + "learning_rate": 4.83487203811141e-06, + "loss": 1.2347, + "step": 4742 + }, + { + "epoch": 0.14, + "learning_rate": 4.83478484831769e-06, + "loss": 1.2378, + "step": 4743 + }, + { + "epoch": 0.14, + "learning_rate": 4.834697636297941e-06, + "loss": 1.1355, + "step": 4744 + }, + { + "epoch": 0.14, + "learning_rate": 4.834610402052997e-06, + "loss": 1.2009, + "step": 4745 + }, + { + "epoch": 0.14, + "learning_rate": 4.834523145583685e-06, + "loss": 1.1351, + "step": 4746 + }, + { + "epoch": 0.14, + "learning_rate": 4.834435866890837e-06, + "loss": 1.0809, + "step": 4747 + }, + { + "epoch": 0.14, + "learning_rate": 4.834348565975285e-06, + "loss": 1.2297, + "step": 4748 + }, + { + "epoch": 0.14, + "learning_rate": 4.834261242837858e-06, + "loss": 1.28, + "step": 4749 + }, + { + "epoch": 0.14, + "learning_rate": 4.834173897479388e-06, + "loss": 1.2218, + "step": 4750 + }, + { + "epoch": 0.14, + "learning_rate": 4.8340865299007075e-06, + "loss": 1.1367, + "step": 4751 + }, + { + "epoch": 0.14, + "learning_rate": 4.833999140102647e-06, + "loss": 1.1096, + "step": 4752 + }, + { + "epoch": 0.14, + "learning_rate": 4.833911728086039e-06, + "loss": 1.074, + "step": 4753 + }, + { + "epoch": 0.14, + "learning_rate": 4.8338242938517155e-06, + "loss": 1.2277, + "step": 4754 + }, + { + "epoch": 0.14, + "learning_rate": 4.833736837400508e-06, + "loss": 1.1371, + "step": 4755 + }, + { + "epoch": 0.14, + "learning_rate": 4.83364935873325e-06, + "loss": 1.2201, + "step": 4756 + }, + { + "epoch": 0.14, + "learning_rate": 4.833561857850774e-06, + "loss": 1.223, + "step": 4757 + }, + { + "epoch": 0.14, + "learning_rate": 4.833474334753913e-06, + "loss": 1.2225, + "step": 4758 + }, + { + "epoch": 0.14, + "learning_rate": 4.8333867894435e-06, + "loss": 1.064, + "step": 4759 + }, + { + "epoch": 0.14, + "learning_rate": 4.8332992219203695e-06, + "loss": 1.1245, + "step": 4760 + }, + { + "epoch": 0.14, + "learning_rate": 4.833211632185354e-06, + "loss": 1.1398, + "step": 4761 + }, + { + "epoch": 0.14, + "learning_rate": 4.8331240202392875e-06, + "loss": 1.1443, + "step": 4762 + }, + { + "epoch": 0.14, + "learning_rate": 4.833036386083002e-06, + "loss": 1.0903, + "step": 4763 + }, + { + "epoch": 0.14, + "learning_rate": 4.832948729717336e-06, + "loss": 1.2303, + "step": 4764 + }, + { + "epoch": 0.14, + "learning_rate": 4.832861051143121e-06, + "loss": 1.0753, + "step": 4765 + }, + { + "epoch": 0.14, + "learning_rate": 4.832773350361192e-06, + "loss": 1.0717, + "step": 4766 + }, + { + "epoch": 0.14, + "learning_rate": 4.8326856273723845e-06, + "loss": 1.1832, + "step": 4767 + }, + { + "epoch": 0.14, + "learning_rate": 4.832597882177533e-06, + "loss": 1.2881, + "step": 4768 + }, + { + "epoch": 0.14, + "learning_rate": 4.832510114777474e-06, + "loss": 1.2025, + "step": 4769 + }, + { + "epoch": 0.14, + "learning_rate": 4.832422325173041e-06, + "loss": 1.1981, + "step": 4770 + }, + { + "epoch": 0.14, + "learning_rate": 4.832334513365071e-06, + "loss": 1.1319, + "step": 4771 + }, + { + "epoch": 0.14, + "learning_rate": 4.832246679354401e-06, + "loss": 1.1275, + "step": 4772 + }, + { + "epoch": 0.14, + "learning_rate": 4.832158823141864e-06, + "loss": 1.1152, + "step": 4773 + }, + { + "epoch": 0.14, + "learning_rate": 4.8320709447283e-06, + "loss": 1.1805, + "step": 4774 + }, + { + "epoch": 0.14, + "learning_rate": 4.831983044114542e-06, + "loss": 1.0646, + "step": 4775 + }, + { + "epoch": 0.14, + "learning_rate": 4.83189512130143e-06, + "loss": 1.155, + "step": 4776 + }, + { + "epoch": 0.14, + "learning_rate": 4.831807176289799e-06, + "loss": 1.0905, + "step": 4777 + }, + { + "epoch": 0.14, + "learning_rate": 4.8317192090804854e-06, + "loss": 1.0764, + "step": 4778 + }, + { + "epoch": 0.14, + "learning_rate": 4.83163121967433e-06, + "loss": 1.1705, + "step": 4779 + }, + { + "epoch": 0.14, + "learning_rate": 4.831543208072167e-06, + "loss": 1.2847, + "step": 4780 + }, + { + "epoch": 0.14, + "learning_rate": 4.831455174274836e-06, + "loss": 1.2447, + "step": 4781 + }, + { + "epoch": 0.14, + "learning_rate": 4.8313671182831745e-06, + "loss": 1.0786, + "step": 4782 + }, + { + "epoch": 0.14, + "learning_rate": 4.831279040098021e-06, + "loss": 1.1259, + "step": 4783 + }, + { + "epoch": 0.14, + "learning_rate": 4.831190939720214e-06, + "loss": 1.1417, + "step": 4784 + }, + { + "epoch": 0.14, + "learning_rate": 4.831102817150591e-06, + "loss": 1.1601, + "step": 4785 + }, + { + "epoch": 0.14, + "learning_rate": 4.831014672389993e-06, + "loss": 1.2255, + "step": 4786 + }, + { + "epoch": 0.14, + "learning_rate": 4.830926505439258e-06, + "loss": 1.2244, + "step": 4787 + }, + { + "epoch": 0.14, + "learning_rate": 4.830838316299225e-06, + "loss": 1.1673, + "step": 4788 + }, + { + "epoch": 0.14, + "learning_rate": 4.830750104970734e-06, + "loss": 1.2245, + "step": 4789 + }, + { + "epoch": 0.14, + "learning_rate": 4.830661871454624e-06, + "loss": 1.1392, + "step": 4790 + }, + { + "epoch": 0.14, + "learning_rate": 4.8305736157517355e-06, + "loss": 1.1854, + "step": 4791 + }, + { + "epoch": 0.14, + "learning_rate": 4.830485337862909e-06, + "loss": 1.1916, + "step": 4792 + }, + { + "epoch": 0.14, + "learning_rate": 4.830397037788984e-06, + "loss": 1.2249, + "step": 4793 + }, + { + "epoch": 0.14, + "learning_rate": 4.830308715530802e-06, + "loss": 1.184, + "step": 4794 + }, + { + "epoch": 0.14, + "learning_rate": 4.830220371089204e-06, + "loss": 1.0767, + "step": 4795 + }, + { + "epoch": 0.14, + "learning_rate": 4.830132004465029e-06, + "loss": 1.1578, + "step": 4796 + }, + { + "epoch": 0.14, + "learning_rate": 4.83004361565912e-06, + "loss": 1.0778, + "step": 4797 + }, + { + "epoch": 0.14, + "learning_rate": 4.829955204672318e-06, + "loss": 1.235, + "step": 4798 + }, + { + "epoch": 0.14, + "learning_rate": 4.829866771505465e-06, + "loss": 1.2532, + "step": 4799 + }, + { + "epoch": 0.14, + "learning_rate": 4.829778316159402e-06, + "loss": 1.0303, + "step": 4800 + }, + { + "epoch": 0.14, + "learning_rate": 4.829689838634972e-06, + "loss": 1.1094, + "step": 4801 + }, + { + "epoch": 0.14, + "learning_rate": 4.829601338933016e-06, + "loss": 1.106, + "step": 4802 + }, + { + "epoch": 0.14, + "learning_rate": 4.829512817054377e-06, + "loss": 1.0918, + "step": 4803 + }, + { + "epoch": 0.14, + "learning_rate": 4.829424272999899e-06, + "loss": 1.1361, + "step": 4804 + }, + { + "epoch": 0.14, + "learning_rate": 4.829335706770423e-06, + "loss": 1.1678, + "step": 4805 + }, + { + "epoch": 0.14, + "learning_rate": 4.8292471183667935e-06, + "loss": 1.2606, + "step": 4806 + }, + { + "epoch": 0.14, + "learning_rate": 4.829158507789853e-06, + "loss": 1.1961, + "step": 4807 + }, + { + "epoch": 0.14, + "learning_rate": 4.829069875040445e-06, + "loss": 1.111, + "step": 4808 + }, + { + "epoch": 0.14, + "learning_rate": 4.828981220119414e-06, + "loss": 1.1446, + "step": 4809 + }, + { + "epoch": 0.14, + "learning_rate": 4.828892543027603e-06, + "loss": 1.1014, + "step": 4810 + }, + { + "epoch": 0.14, + "learning_rate": 4.828803843765857e-06, + "loss": 1.1323, + "step": 4811 + }, + { + "epoch": 0.14, + "learning_rate": 4.82871512233502e-06, + "loss": 1.1598, + "step": 4812 + }, + { + "epoch": 0.14, + "learning_rate": 4.8286263787359365e-06, + "loss": 0.9788, + "step": 4813 + }, + { + "epoch": 0.15, + "learning_rate": 4.828537612969451e-06, + "loss": 1.2153, + "step": 4814 + }, + { + "epoch": 0.15, + "learning_rate": 4.8284488250364095e-06, + "loss": 1.1257, + "step": 4815 + }, + { + "epoch": 0.15, + "learning_rate": 4.828360014937656e-06, + "loss": 1.1124, + "step": 4816 + }, + { + "epoch": 0.15, + "learning_rate": 4.828271182674037e-06, + "loss": 1.2319, + "step": 4817 + }, + { + "epoch": 0.15, + "learning_rate": 4.828182328246398e-06, + "loss": 1.1606, + "step": 4818 + }, + { + "epoch": 0.15, + "learning_rate": 4.828093451655584e-06, + "loss": 1.0231, + "step": 4819 + }, + { + "epoch": 0.15, + "learning_rate": 4.828004552902441e-06, + "loss": 1.1147, + "step": 4820 + }, + { + "epoch": 0.15, + "learning_rate": 4.827915631987816e-06, + "loss": 1.0895, + "step": 4821 + }, + { + "epoch": 0.15, + "learning_rate": 4.827826688912556e-06, + "loss": 1.1294, + "step": 4822 + }, + { + "epoch": 0.15, + "learning_rate": 4.827737723677507e-06, + "loss": 1.178, + "step": 4823 + }, + { + "epoch": 0.15, + "learning_rate": 4.827648736283515e-06, + "loss": 1.1162, + "step": 4824 + }, + { + "epoch": 0.15, + "learning_rate": 4.82755972673143e-06, + "loss": 1.1953, + "step": 4825 + }, + { + "epoch": 0.15, + "learning_rate": 4.827470695022097e-06, + "loss": 1.1404, + "step": 4826 + }, + { + "epoch": 0.15, + "learning_rate": 4.827381641156363e-06, + "loss": 1.0623, + "step": 4827 + }, + { + "epoch": 0.15, + "learning_rate": 4.827292565135076e-06, + "loss": 1.2498, + "step": 4828 + }, + { + "epoch": 0.15, + "learning_rate": 4.827203466959086e-06, + "loss": 1.2373, + "step": 4829 + }, + { + "epoch": 0.15, + "learning_rate": 4.827114346629239e-06, + "loss": 1.1569, + "step": 4830 + }, + { + "epoch": 0.15, + "learning_rate": 4.827025204146384e-06, + "loss": 1.144, + "step": 4831 + }, + { + "epoch": 0.15, + "learning_rate": 4.826936039511371e-06, + "loss": 1.1399, + "step": 4832 + }, + { + "epoch": 0.15, + "learning_rate": 4.826846852725047e-06, + "loss": 1.1353, + "step": 4833 + }, + { + "epoch": 0.15, + "learning_rate": 4.8267576437882614e-06, + "loss": 1.0605, + "step": 4834 + }, + { + "epoch": 0.15, + "learning_rate": 4.8266684127018634e-06, + "loss": 1.1865, + "step": 4835 + }, + { + "epoch": 0.15, + "learning_rate": 4.826579159466703e-06, + "loss": 1.1809, + "step": 4836 + }, + { + "epoch": 0.15, + "learning_rate": 4.82648988408363e-06, + "loss": 1.2192, + "step": 4837 + }, + { + "epoch": 0.15, + "learning_rate": 4.826400586553493e-06, + "loss": 1.2599, + "step": 4838 + }, + { + "epoch": 0.15, + "learning_rate": 4.826311266877143e-06, + "loss": 1.2128, + "step": 4839 + }, + { + "epoch": 0.15, + "learning_rate": 4.82622192505543e-06, + "loss": 1.0716, + "step": 4840 + }, + { + "epoch": 0.15, + "learning_rate": 4.826132561089205e-06, + "loss": 1.183, + "step": 4841 + }, + { + "epoch": 0.15, + "learning_rate": 4.8260431749793185e-06, + "loss": 1.1667, + "step": 4842 + }, + { + "epoch": 0.15, + "learning_rate": 4.825953766726621e-06, + "loss": 1.3334, + "step": 4843 + }, + { + "epoch": 0.15, + "learning_rate": 4.825864336331964e-06, + "loss": 1.2532, + "step": 4844 + }, + { + "epoch": 0.15, + "learning_rate": 4.825774883796198e-06, + "loss": 1.1827, + "step": 4845 + }, + { + "epoch": 0.15, + "learning_rate": 4.825685409120176e-06, + "loss": 1.1385, + "step": 4846 + }, + { + "epoch": 0.15, + "learning_rate": 4.825595912304749e-06, + "loss": 1.1396, + "step": 4847 + }, + { + "epoch": 0.15, + "learning_rate": 4.825506393350769e-06, + "loss": 1.1131, + "step": 4848 + }, + { + "epoch": 0.15, + "learning_rate": 4.825416852259088e-06, + "loss": 1.1941, + "step": 4849 + }, + { + "epoch": 0.15, + "learning_rate": 4.825327289030558e-06, + "loss": 1.1577, + "step": 4850 + }, + { + "epoch": 0.15, + "learning_rate": 4.825237703666032e-06, + "loss": 1.0801, + "step": 4851 + }, + { + "epoch": 0.15, + "learning_rate": 4.825148096166365e-06, + "loss": 1.1577, + "step": 4852 + }, + { + "epoch": 0.15, + "learning_rate": 4.825058466532405e-06, + "loss": 1.0214, + "step": 4853 + }, + { + "epoch": 0.15, + "learning_rate": 4.82496881476501e-06, + "loss": 1.1328, + "step": 4854 + }, + { + "epoch": 0.15, + "learning_rate": 4.824879140865031e-06, + "loss": 1.2075, + "step": 4855 + }, + { + "epoch": 0.15, + "learning_rate": 4.824789444833323e-06, + "loss": 1.1596, + "step": 4856 + }, + { + "epoch": 0.15, + "learning_rate": 4.824699726670738e-06, + "loss": 1.214, + "step": 4857 + }, + { + "epoch": 0.15, + "learning_rate": 4.824609986378132e-06, + "loss": 1.145, + "step": 4858 + }, + { + "epoch": 0.15, + "learning_rate": 4.824520223956358e-06, + "loss": 1.1349, + "step": 4859 + }, + { + "epoch": 0.15, + "learning_rate": 4.824430439406272e-06, + "loss": 1.1147, + "step": 4860 + }, + { + "epoch": 0.15, + "learning_rate": 4.824340632728727e-06, + "loss": 1.208, + "step": 4861 + }, + { + "epoch": 0.15, + "learning_rate": 4.824250803924578e-06, + "loss": 1.2114, + "step": 4862 + }, + { + "epoch": 0.15, + "learning_rate": 4.824160952994682e-06, + "loss": 1.2214, + "step": 4863 + }, + { + "epoch": 0.15, + "learning_rate": 4.824071079939892e-06, + "loss": 1.2181, + "step": 4864 + }, + { + "epoch": 0.15, + "learning_rate": 4.823981184761065e-06, + "loss": 1.0046, + "step": 4865 + }, + { + "epoch": 0.15, + "learning_rate": 4.823891267459057e-06, + "loss": 1.1766, + "step": 4866 + }, + { + "epoch": 0.15, + "learning_rate": 4.823801328034723e-06, + "loss": 1.1367, + "step": 4867 + }, + { + "epoch": 0.15, + "learning_rate": 4.823711366488919e-06, + "loss": 1.1235, + "step": 4868 + }, + { + "epoch": 0.15, + "learning_rate": 4.823621382822503e-06, + "loss": 1.1583, + "step": 4869 + }, + { + "epoch": 0.15, + "learning_rate": 4.8235313770363295e-06, + "loss": 1.1982, + "step": 4870 + }, + { + "epoch": 0.15, + "learning_rate": 4.823441349131257e-06, + "loss": 1.076, + "step": 4871 + }, + { + "epoch": 0.15, + "learning_rate": 4.8233512991081414e-06, + "loss": 1.1746, + "step": 4872 + }, + { + "epoch": 0.15, + "learning_rate": 4.82326122696784e-06, + "loss": 1.1082, + "step": 4873 + }, + { + "epoch": 0.15, + "learning_rate": 4.823171132711212e-06, + "loss": 1.2612, + "step": 4874 + }, + { + "epoch": 0.15, + "learning_rate": 4.823081016339113e-06, + "loss": 1.2511, + "step": 4875 + }, + { + "epoch": 0.15, + "learning_rate": 4.8229908778524015e-06, + "loss": 1.2034, + "step": 4876 + }, + { + "epoch": 0.15, + "learning_rate": 4.822900717251935e-06, + "loss": 1.1731, + "step": 4877 + }, + { + "epoch": 0.15, + "learning_rate": 4.822810534538573e-06, + "loss": 1.1119, + "step": 4878 + }, + { + "epoch": 0.15, + "learning_rate": 4.822720329713174e-06, + "loss": 1.1327, + "step": 4879 + }, + { + "epoch": 0.15, + "learning_rate": 4.822630102776596e-06, + "loss": 1.2001, + "step": 4880 + }, + { + "epoch": 0.15, + "learning_rate": 4.822539853729697e-06, + "loss": 1.1786, + "step": 4881 + }, + { + "epoch": 0.15, + "learning_rate": 4.822449582573337e-06, + "loss": 1.0527, + "step": 4882 + }, + { + "epoch": 0.15, + "learning_rate": 4.822359289308377e-06, + "loss": 1.0919, + "step": 4883 + }, + { + "epoch": 0.15, + "learning_rate": 4.8222689739356745e-06, + "loss": 1.2002, + "step": 4884 + }, + { + "epoch": 0.15, + "learning_rate": 4.822178636456089e-06, + "loss": 1.1569, + "step": 4885 + }, + { + "epoch": 0.15, + "learning_rate": 4.822088276870482e-06, + "loss": 1.2329, + "step": 4886 + }, + { + "epoch": 0.15, + "learning_rate": 4.821997895179713e-06, + "loss": 1.1447, + "step": 4887 + }, + { + "epoch": 0.15, + "learning_rate": 4.821907491384642e-06, + "loss": 1.1481, + "step": 4888 + }, + { + "epoch": 0.15, + "learning_rate": 4.8218170654861305e-06, + "loss": 1.1714, + "step": 4889 + }, + { + "epoch": 0.15, + "learning_rate": 4.821726617485038e-06, + "loss": 1.1259, + "step": 4890 + }, + { + "epoch": 0.15, + "learning_rate": 4.821636147382227e-06, + "loss": 1.0792, + "step": 4891 + }, + { + "epoch": 0.15, + "learning_rate": 4.8215456551785575e-06, + "loss": 1.1902, + "step": 4892 + }, + { + "epoch": 0.15, + "learning_rate": 4.8214551408748925e-06, + "loss": 1.2142, + "step": 4893 + }, + { + "epoch": 0.15, + "learning_rate": 4.821364604472091e-06, + "loss": 1.1619, + "step": 4894 + }, + { + "epoch": 0.15, + "learning_rate": 4.821274045971017e-06, + "loss": 1.1453, + "step": 4895 + }, + { + "epoch": 0.15, + "learning_rate": 4.821183465372533e-06, + "loss": 1.182, + "step": 4896 + }, + { + "epoch": 0.15, + "learning_rate": 4.821092862677499e-06, + "loss": 1.09, + "step": 4897 + }, + { + "epoch": 0.15, + "learning_rate": 4.82100223788678e-06, + "loss": 1.1368, + "step": 4898 + }, + { + "epoch": 0.15, + "learning_rate": 4.820911591001237e-06, + "loss": 1.2705, + "step": 4899 + }, + { + "epoch": 0.15, + "learning_rate": 4.820820922021733e-06, + "loss": 1.1595, + "step": 4900 + }, + { + "epoch": 0.15, + "learning_rate": 4.820730230949132e-06, + "loss": 1.1378, + "step": 4901 + }, + { + "epoch": 0.15, + "learning_rate": 4.820639517784298e-06, + "loss": 1.1949, + "step": 4902 + }, + { + "epoch": 0.15, + "learning_rate": 4.820548782528092e-06, + "loss": 1.0546, + "step": 4903 + }, + { + "epoch": 0.15, + "learning_rate": 4.820458025181379e-06, + "loss": 1.1942, + "step": 4904 + }, + { + "epoch": 0.15, + "learning_rate": 4.820367245745024e-06, + "loss": 1.291, + "step": 4905 + }, + { + "epoch": 0.15, + "learning_rate": 4.8202764442198905e-06, + "loss": 1.2822, + "step": 4906 + }, + { + "epoch": 0.15, + "learning_rate": 4.820185620606842e-06, + "loss": 1.1308, + "step": 4907 + }, + { + "epoch": 0.15, + "learning_rate": 4.820094774906744e-06, + "loss": 1.1511, + "step": 4908 + }, + { + "epoch": 0.15, + "learning_rate": 4.820003907120461e-06, + "loss": 1.0804, + "step": 4909 + }, + { + "epoch": 0.15, + "learning_rate": 4.819913017248859e-06, + "loss": 1.2262, + "step": 4910 + }, + { + "epoch": 0.15, + "learning_rate": 4.8198221052928015e-06, + "loss": 1.1371, + "step": 4911 + }, + { + "epoch": 0.15, + "learning_rate": 4.819731171253156e-06, + "loss": 1.1498, + "step": 4912 + }, + { + "epoch": 0.15, + "learning_rate": 4.8196402151307856e-06, + "loss": 1.0912, + "step": 4913 + }, + { + "epoch": 0.15, + "learning_rate": 4.819549236926558e-06, + "loss": 1.153, + "step": 4914 + }, + { + "epoch": 0.15, + "learning_rate": 4.819458236641339e-06, + "loss": 1.0759, + "step": 4915 + }, + { + "epoch": 0.15, + "learning_rate": 4.819367214275994e-06, + "loss": 1.1168, + "step": 4916 + }, + { + "epoch": 0.15, + "learning_rate": 4.819276169831391e-06, + "loss": 1.063, + "step": 4917 + }, + { + "epoch": 0.15, + "learning_rate": 4.819185103308396e-06, + "loss": 1.3358, + "step": 4918 + }, + { + "epoch": 0.15, + "learning_rate": 4.819094014707875e-06, + "loss": 1.2311, + "step": 4919 + }, + { + "epoch": 0.15, + "learning_rate": 4.819002904030696e-06, + "loss": 1.2134, + "step": 4920 + }, + { + "epoch": 0.15, + "learning_rate": 4.818911771277727e-06, + "loss": 1.1468, + "step": 4921 + }, + { + "epoch": 0.15, + "learning_rate": 4.8188206164498335e-06, + "loss": 1.1392, + "step": 4922 + }, + { + "epoch": 0.15, + "learning_rate": 4.818729439547885e-06, + "loss": 1.1586, + "step": 4923 + }, + { + "epoch": 0.15, + "learning_rate": 4.81863824057275e-06, + "loss": 1.2313, + "step": 4924 + }, + { + "epoch": 0.15, + "learning_rate": 4.818547019525295e-06, + "loss": 1.1879, + "step": 4925 + }, + { + "epoch": 0.15, + "learning_rate": 4.818455776406388e-06, + "loss": 1.2172, + "step": 4926 + }, + { + "epoch": 0.15, + "learning_rate": 4.8183645112169e-06, + "loss": 1.2459, + "step": 4927 + }, + { + "epoch": 0.15, + "learning_rate": 4.818273223957698e-06, + "loss": 1.043, + "step": 4928 + }, + { + "epoch": 0.15, + "learning_rate": 4.818181914629651e-06, + "loss": 1.1876, + "step": 4929 + }, + { + "epoch": 0.15, + "learning_rate": 4.8180905832336285e-06, + "loss": 1.0429, + "step": 4930 + }, + { + "epoch": 0.15, + "learning_rate": 4.817999229770502e-06, + "loss": 1.2488, + "step": 4931 + }, + { + "epoch": 0.15, + "learning_rate": 4.817907854241137e-06, + "loss": 1.0491, + "step": 4932 + }, + { + "epoch": 0.15, + "learning_rate": 4.817816456646406e-06, + "loss": 1.0366, + "step": 4933 + }, + { + "epoch": 0.15, + "learning_rate": 4.817725036987179e-06, + "loss": 1.171, + "step": 4934 + }, + { + "epoch": 0.15, + "learning_rate": 4.817633595264326e-06, + "loss": 1.2132, + "step": 4935 + }, + { + "epoch": 0.15, + "learning_rate": 4.817542131478717e-06, + "loss": 1.1609, + "step": 4936 + }, + { + "epoch": 0.15, + "learning_rate": 4.817450645631223e-06, + "loss": 1.2845, + "step": 4937 + }, + { + "epoch": 0.15, + "learning_rate": 4.817359137722716e-06, + "loss": 1.1595, + "step": 4938 + }, + { + "epoch": 0.15, + "learning_rate": 4.8172676077540655e-06, + "loss": 1.1937, + "step": 4939 + }, + { + "epoch": 0.15, + "learning_rate": 4.817176055726143e-06, + "loss": 1.2899, + "step": 4940 + }, + { + "epoch": 0.15, + "learning_rate": 4.817084481639821e-06, + "loss": 1.1319, + "step": 4941 + }, + { + "epoch": 0.15, + "learning_rate": 4.81699288549597e-06, + "loss": 1.2631, + "step": 4942 + }, + { + "epoch": 0.15, + "learning_rate": 4.816901267295463e-06, + "loss": 1.189, + "step": 4943 + }, + { + "epoch": 0.15, + "learning_rate": 4.8168096270391715e-06, + "loss": 1.2044, + "step": 4944 + }, + { + "epoch": 0.15, + "learning_rate": 4.816717964727969e-06, + "loss": 1.0645, + "step": 4945 + }, + { + "epoch": 0.15, + "learning_rate": 4.816626280362728e-06, + "loss": 1.2051, + "step": 4946 + }, + { + "epoch": 0.15, + "learning_rate": 4.816534573944318e-06, + "loss": 1.0785, + "step": 4947 + }, + { + "epoch": 0.15, + "learning_rate": 4.8164428454736156e-06, + "loss": 1.1326, + "step": 4948 + }, + { + "epoch": 0.15, + "learning_rate": 4.816351094951493e-06, + "loss": 1.173, + "step": 4949 + }, + { + "epoch": 0.15, + "learning_rate": 4.816259322378825e-06, + "loss": 1.1928, + "step": 4950 + }, + { + "epoch": 0.15, + "learning_rate": 4.816167527756482e-06, + "loss": 1.2097, + "step": 4951 + }, + { + "epoch": 0.15, + "learning_rate": 4.81607571108534e-06, + "loss": 1.0623, + "step": 4952 + }, + { + "epoch": 0.15, + "learning_rate": 4.815983872366273e-06, + "loss": 1.149, + "step": 4953 + }, + { + "epoch": 0.15, + "learning_rate": 4.815892011600155e-06, + "loss": 1.1465, + "step": 4954 + }, + { + "epoch": 0.15, + "learning_rate": 4.815800128787859e-06, + "loss": 1.1523, + "step": 4955 + }, + { + "epoch": 0.15, + "learning_rate": 4.8157082239302634e-06, + "loss": 1.1624, + "step": 4956 + }, + { + "epoch": 0.15, + "learning_rate": 4.8156162970282395e-06, + "loss": 1.1255, + "step": 4957 + }, + { + "epoch": 0.15, + "learning_rate": 4.815524348082664e-06, + "loss": 1.2352, + "step": 4958 + }, + { + "epoch": 0.15, + "learning_rate": 4.8154323770944125e-06, + "loss": 1.0963, + "step": 4959 + }, + { + "epoch": 0.15, + "learning_rate": 4.815340384064359e-06, + "loss": 1.1776, + "step": 4960 + }, + { + "epoch": 0.15, + "learning_rate": 4.81524836899338e-06, + "loss": 1.1203, + "step": 4961 + }, + { + "epoch": 0.15, + "learning_rate": 4.815156331882353e-06, + "loss": 1.2274, + "step": 4962 + }, + { + "epoch": 0.15, + "learning_rate": 4.8150642727321506e-06, + "loss": 1.09, + "step": 4963 + }, + { + "epoch": 0.15, + "learning_rate": 4.814972191543653e-06, + "loss": 1.1463, + "step": 4964 + }, + { + "epoch": 0.15, + "learning_rate": 4.814880088317734e-06, + "loss": 1.0845, + "step": 4965 + }, + { + "epoch": 0.15, + "learning_rate": 4.814787963055273e-06, + "loss": 1.2043, + "step": 4966 + }, + { + "epoch": 0.15, + "learning_rate": 4.814695815757144e-06, + "loss": 1.1557, + "step": 4967 + }, + { + "epoch": 0.15, + "learning_rate": 4.814603646424226e-06, + "loss": 1.1121, + "step": 4968 + }, + { + "epoch": 0.15, + "learning_rate": 4.814511455057396e-06, + "loss": 1.2373, + "step": 4969 + }, + { + "epoch": 0.15, + "learning_rate": 4.814419241657531e-06, + "loss": 1.123, + "step": 4970 + }, + { + "epoch": 0.15, + "learning_rate": 4.814327006225511e-06, + "loss": 1.1134, + "step": 4971 + }, + { + "epoch": 0.15, + "learning_rate": 4.814234748762211e-06, + "loss": 1.095, + "step": 4972 + }, + { + "epoch": 0.15, + "learning_rate": 4.814142469268512e-06, + "loss": 1.2777, + "step": 4973 + }, + { + "epoch": 0.15, + "learning_rate": 4.81405016774529e-06, + "loss": 1.0357, + "step": 4974 + }, + { + "epoch": 0.15, + "learning_rate": 4.813957844193426e-06, + "loss": 1.2346, + "step": 4975 + }, + { + "epoch": 0.15, + "learning_rate": 4.813865498613797e-06, + "loss": 1.1519, + "step": 4976 + }, + { + "epoch": 0.15, + "learning_rate": 4.813773131007283e-06, + "loss": 1.1615, + "step": 4977 + }, + { + "epoch": 0.15, + "learning_rate": 4.8136807413747635e-06, + "loss": 1.121, + "step": 4978 + }, + { + "epoch": 0.15, + "learning_rate": 4.813588329717118e-06, + "loss": 1.1741, + "step": 4979 + }, + { + "epoch": 0.15, + "learning_rate": 4.813495896035225e-06, + "loss": 1.3403, + "step": 4980 + }, + { + "epoch": 0.15, + "learning_rate": 4.813403440329966e-06, + "loss": 1.02, + "step": 4981 + }, + { + "epoch": 0.15, + "learning_rate": 4.81331096260222e-06, + "loss": 1.1896, + "step": 4982 + }, + { + "epoch": 0.15, + "learning_rate": 4.8132184628528675e-06, + "loss": 1.2369, + "step": 4983 + }, + { + "epoch": 0.15, + "learning_rate": 4.81312594108279e-06, + "loss": 1.1497, + "step": 4984 + }, + { + "epoch": 0.15, + "learning_rate": 4.813033397292867e-06, + "loss": 1.1135, + "step": 4985 + }, + { + "epoch": 0.15, + "learning_rate": 4.812940831483981e-06, + "loss": 1.214, + "step": 4986 + }, + { + "epoch": 0.15, + "learning_rate": 4.812848243657011e-06, + "loss": 1.3073, + "step": 4987 + }, + { + "epoch": 0.15, + "learning_rate": 4.81275563381284e-06, + "loss": 1.3121, + "step": 4988 + }, + { + "epoch": 0.15, + "learning_rate": 4.812663001952349e-06, + "loss": 1.0705, + "step": 4989 + }, + { + "epoch": 0.15, + "learning_rate": 4.812570348076421e-06, + "loss": 1.2297, + "step": 4990 + }, + { + "epoch": 0.15, + "learning_rate": 4.812477672185936e-06, + "loss": 1.0856, + "step": 4991 + }, + { + "epoch": 0.15, + "learning_rate": 4.812384974281778e-06, + "loss": 1.039, + "step": 4992 + }, + { + "epoch": 0.15, + "learning_rate": 4.812292254364829e-06, + "loss": 1.2058, + "step": 4993 + }, + { + "epoch": 0.15, + "learning_rate": 4.81219951243597e-06, + "loss": 1.1547, + "step": 4994 + }, + { + "epoch": 0.15, + "learning_rate": 4.8121067484960856e-06, + "loss": 1.1648, + "step": 4995 + }, + { + "epoch": 0.15, + "learning_rate": 4.8120139625460596e-06, + "loss": 1.1292, + "step": 4996 + }, + { + "epoch": 0.15, + "learning_rate": 4.8119211545867735e-06, + "loss": 1.1588, + "step": 4997 + }, + { + "epoch": 0.15, + "learning_rate": 4.811828324619112e-06, + "loss": 1.1927, + "step": 4998 + }, + { + "epoch": 0.15, + "learning_rate": 4.811735472643958e-06, + "loss": 1.1909, + "step": 4999 + }, + { + "epoch": 0.15, + "learning_rate": 4.8116425986621955e-06, + "loss": 1.0789, + "step": 5000 + }, + { + "epoch": 0.15, + "learning_rate": 4.811549702674708e-06, + "loss": 1.1527, + "step": 5001 + }, + { + "epoch": 0.15, + "learning_rate": 4.811456784682381e-06, + "loss": 1.1495, + "step": 5002 + }, + { + "epoch": 0.15, + "learning_rate": 4.8113638446861e-06, + "loss": 1.1155, + "step": 5003 + }, + { + "epoch": 0.15, + "learning_rate": 4.811270882686747e-06, + "loss": 1.1055, + "step": 5004 + }, + { + "epoch": 0.15, + "learning_rate": 4.811177898685209e-06, + "loss": 1.1334, + "step": 5005 + }, + { + "epoch": 0.15, + "learning_rate": 4.81108489268237e-06, + "loss": 1.2993, + "step": 5006 + }, + { + "epoch": 0.15, + "learning_rate": 4.810991864679116e-06, + "loss": 1.1677, + "step": 5007 + }, + { + "epoch": 0.15, + "learning_rate": 4.810898814676332e-06, + "loss": 1.1292, + "step": 5008 + }, + { + "epoch": 0.15, + "learning_rate": 4.810805742674905e-06, + "loss": 1.1346, + "step": 5009 + }, + { + "epoch": 0.15, + "learning_rate": 4.81071264867572e-06, + "loss": 1.1223, + "step": 5010 + }, + { + "epoch": 0.15, + "learning_rate": 4.810619532679665e-06, + "loss": 1.0984, + "step": 5011 + }, + { + "epoch": 0.15, + "learning_rate": 4.810526394687623e-06, + "loss": 1.1603, + "step": 5012 + }, + { + "epoch": 0.15, + "learning_rate": 4.8104332347004825e-06, + "loss": 1.0208, + "step": 5013 + }, + { + "epoch": 0.15, + "learning_rate": 4.8103400527191305e-06, + "loss": 1.0662, + "step": 5014 + }, + { + "epoch": 0.15, + "learning_rate": 4.8102468487444545e-06, + "loss": 1.1199, + "step": 5015 + }, + { + "epoch": 0.15, + "learning_rate": 4.810153622777341e-06, + "loss": 1.2205, + "step": 5016 + }, + { + "epoch": 0.15, + "learning_rate": 4.810060374818677e-06, + "loss": 1.214, + "step": 5017 + }, + { + "epoch": 0.15, + "learning_rate": 4.809967104869352e-06, + "loss": 1.0439, + "step": 5018 + }, + { + "epoch": 0.15, + "learning_rate": 4.809873812930251e-06, + "loss": 1.0739, + "step": 5019 + }, + { + "epoch": 0.15, + "learning_rate": 4.809780499002265e-06, + "loss": 1.0901, + "step": 5020 + }, + { + "epoch": 0.15, + "learning_rate": 4.8096871630862805e-06, + "loss": 1.0663, + "step": 5021 + }, + { + "epoch": 0.15, + "learning_rate": 4.809593805183188e-06, + "loss": 1.2134, + "step": 5022 + }, + { + "epoch": 0.15, + "learning_rate": 4.8095004252938734e-06, + "loss": 1.2107, + "step": 5023 + }, + { + "epoch": 0.15, + "learning_rate": 4.809407023419227e-06, + "loss": 1.2422, + "step": 5024 + }, + { + "epoch": 0.15, + "learning_rate": 4.809313599560138e-06, + "loss": 1.1893, + "step": 5025 + }, + { + "epoch": 0.15, + "learning_rate": 4.809220153717496e-06, + "loss": 1.1165, + "step": 5026 + }, + { + "epoch": 0.15, + "learning_rate": 4.809126685892191e-06, + "loss": 1.2026, + "step": 5027 + }, + { + "epoch": 0.15, + "learning_rate": 4.809033196085111e-06, + "loss": 1.2147, + "step": 5028 + }, + { + "epoch": 0.15, + "learning_rate": 4.808939684297148e-06, + "loss": 1.1351, + "step": 5029 + }, + { + "epoch": 0.15, + "learning_rate": 4.808846150529191e-06, + "loss": 1.1105, + "step": 5030 + }, + { + "epoch": 0.15, + "learning_rate": 4.808752594782129e-06, + "loss": 1.4191, + "step": 5031 + }, + { + "epoch": 0.15, + "learning_rate": 4.8086590170568555e-06, + "loss": 1.1785, + "step": 5032 + }, + { + "epoch": 0.15, + "learning_rate": 4.808565417354261e-06, + "loss": 1.1122, + "step": 5033 + }, + { + "epoch": 0.15, + "learning_rate": 4.808471795675234e-06, + "loss": 1.0389, + "step": 5034 + }, + { + "epoch": 0.15, + "learning_rate": 4.808378152020668e-06, + "loss": 1.1638, + "step": 5035 + }, + { + "epoch": 0.15, + "learning_rate": 4.808284486391454e-06, + "loss": 1.1989, + "step": 5036 + }, + { + "epoch": 0.15, + "learning_rate": 4.808190798788483e-06, + "loss": 1.1152, + "step": 5037 + }, + { + "epoch": 0.15, + "learning_rate": 4.808097089212648e-06, + "loss": 1.224, + "step": 5038 + }, + { + "epoch": 0.15, + "learning_rate": 4.808003357664839e-06, + "loss": 1.1389, + "step": 5039 + }, + { + "epoch": 0.15, + "learning_rate": 4.80790960414595e-06, + "loss": 1.1191, + "step": 5040 + }, + { + "epoch": 0.15, + "learning_rate": 4.807815828656874e-06, + "loss": 1.1243, + "step": 5041 + }, + { + "epoch": 0.15, + "learning_rate": 4.807722031198503e-06, + "loss": 1.1681, + "step": 5042 + }, + { + "epoch": 0.15, + "learning_rate": 4.807628211771728e-06, + "loss": 1.2104, + "step": 5043 + }, + { + "epoch": 0.15, + "learning_rate": 4.807534370377445e-06, + "loss": 1.1375, + "step": 5044 + }, + { + "epoch": 0.15, + "learning_rate": 4.8074405070165455e-06, + "loss": 1.1595, + "step": 5045 + }, + { + "epoch": 0.15, + "learning_rate": 4.807346621689925e-06, + "loss": 1.0242, + "step": 5046 + }, + { + "epoch": 0.15, + "learning_rate": 4.807252714398474e-06, + "loss": 1.0185, + "step": 5047 + }, + { + "epoch": 0.15, + "learning_rate": 4.807158785143089e-06, + "loss": 1.1443, + "step": 5048 + }, + { + "epoch": 0.15, + "learning_rate": 4.807064833924664e-06, + "loss": 1.2345, + "step": 5049 + }, + { + "epoch": 0.15, + "learning_rate": 4.806970860744093e-06, + "loss": 1.147, + "step": 5050 + }, + { + "epoch": 0.15, + "learning_rate": 4.80687686560227e-06, + "loss": 1.2158, + "step": 5051 + }, + { + "epoch": 0.15, + "learning_rate": 4.806782848500091e-06, + "loss": 1.1522, + "step": 5052 + }, + { + "epoch": 0.15, + "learning_rate": 4.806688809438449e-06, + "loss": 1.136, + "step": 5053 + }, + { + "epoch": 0.15, + "learning_rate": 4.806594748418242e-06, + "loss": 1.262, + "step": 5054 + }, + { + "epoch": 0.15, + "learning_rate": 4.806500665440363e-06, + "loss": 1.2354, + "step": 5055 + }, + { + "epoch": 0.15, + "learning_rate": 4.806406560505709e-06, + "loss": 1.2668, + "step": 5056 + }, + { + "epoch": 0.15, + "learning_rate": 4.806312433615174e-06, + "loss": 1.2189, + "step": 5057 + }, + { + "epoch": 0.15, + "learning_rate": 4.806218284769657e-06, + "loss": 1.1194, + "step": 5058 + }, + { + "epoch": 0.15, + "learning_rate": 4.806124113970052e-06, + "loss": 1.1742, + "step": 5059 + }, + { + "epoch": 0.15, + "learning_rate": 4.806029921217255e-06, + "loss": 1.0375, + "step": 5060 + }, + { + "epoch": 0.15, + "learning_rate": 4.805935706512166e-06, + "loss": 1.1276, + "step": 5061 + }, + { + "epoch": 0.15, + "learning_rate": 4.805841469855679e-06, + "loss": 1.1486, + "step": 5062 + }, + { + "epoch": 0.15, + "learning_rate": 4.80574721124869e-06, + "loss": 1.1151, + "step": 5063 + }, + { + "epoch": 0.15, + "learning_rate": 4.805652930692099e-06, + "loss": 1.1364, + "step": 5064 + }, + { + "epoch": 0.15, + "learning_rate": 4.805558628186804e-06, + "loss": 1.1827, + "step": 5065 + }, + { + "epoch": 0.15, + "learning_rate": 4.8054643037337e-06, + "loss": 1.1951, + "step": 5066 + }, + { + "epoch": 0.15, + "learning_rate": 4.805369957333687e-06, + "loss": 1.222, + "step": 5067 + }, + { + "epoch": 0.15, + "learning_rate": 4.805275588987661e-06, + "loss": 1.3074, + "step": 5068 + }, + { + "epoch": 0.15, + "learning_rate": 4.805181198696523e-06, + "loss": 1.1169, + "step": 5069 + }, + { + "epoch": 0.15, + "learning_rate": 4.805086786461168e-06, + "loss": 1.0183, + "step": 5070 + }, + { + "epoch": 0.15, + "learning_rate": 4.804992352282499e-06, + "loss": 1.1468, + "step": 5071 + }, + { + "epoch": 0.15, + "learning_rate": 4.804897896161413e-06, + "loss": 1.1483, + "step": 5072 + }, + { + "epoch": 0.15, + "learning_rate": 4.804803418098808e-06, + "loss": 1.1509, + "step": 5073 + }, + { + "epoch": 0.15, + "learning_rate": 4.804708918095585e-06, + "loss": 1.2374, + "step": 5074 + }, + { + "epoch": 0.15, + "learning_rate": 4.804614396152643e-06, + "loss": 1.1105, + "step": 5075 + }, + { + "epoch": 0.15, + "learning_rate": 4.804519852270881e-06, + "loss": 1.144, + "step": 5076 + }, + { + "epoch": 0.15, + "learning_rate": 4.8044252864512015e-06, + "loss": 1.1907, + "step": 5077 + }, + { + "epoch": 0.15, + "learning_rate": 4.804330698694503e-06, + "loss": 1.1226, + "step": 5078 + }, + { + "epoch": 0.15, + "learning_rate": 4.804236089001685e-06, + "loss": 1.1998, + "step": 5079 + }, + { + "epoch": 0.15, + "learning_rate": 4.804141457373649e-06, + "loss": 1.1606, + "step": 5080 + }, + { + "epoch": 0.15, + "learning_rate": 4.804046803811297e-06, + "loss": 1.1799, + "step": 5081 + }, + { + "epoch": 0.15, + "learning_rate": 4.803952128315529e-06, + "loss": 1.1535, + "step": 5082 + }, + { + "epoch": 0.15, + "learning_rate": 4.8038574308872465e-06, + "loss": 1.1377, + "step": 5083 + }, + { + "epoch": 0.15, + "learning_rate": 4.80376271152735e-06, + "loss": 1.0872, + "step": 5084 + }, + { + "epoch": 0.15, + "learning_rate": 4.803667970236743e-06, + "loss": 1.1593, + "step": 5085 + }, + { + "epoch": 0.15, + "learning_rate": 4.803573207016326e-06, + "loss": 1.1462, + "step": 5086 + }, + { + "epoch": 0.15, + "learning_rate": 4.803478421867001e-06, + "loss": 1.2089, + "step": 5087 + }, + { + "epoch": 0.15, + "learning_rate": 4.8033836147896716e-06, + "loss": 1.108, + "step": 5088 + }, + { + "epoch": 0.15, + "learning_rate": 4.803288785785239e-06, + "loss": 1.1132, + "step": 5089 + }, + { + "epoch": 0.15, + "learning_rate": 4.8031939348546065e-06, + "loss": 1.087, + "step": 5090 + }, + { + "epoch": 0.15, + "learning_rate": 4.803099061998677e-06, + "loss": 1.2229, + "step": 5091 + }, + { + "epoch": 0.15, + "learning_rate": 4.803004167218354e-06, + "loss": 1.2051, + "step": 5092 + }, + { + "epoch": 0.15, + "learning_rate": 4.80290925051454e-06, + "loss": 1.1635, + "step": 5093 + }, + { + "epoch": 0.15, + "learning_rate": 4.80281431188814e-06, + "loss": 1.1368, + "step": 5094 + }, + { + "epoch": 0.15, + "learning_rate": 4.802719351340056e-06, + "loss": 1.1089, + "step": 5095 + }, + { + "epoch": 0.15, + "learning_rate": 4.802624368871193e-06, + "loss": 1.0936, + "step": 5096 + }, + { + "epoch": 0.15, + "learning_rate": 4.802529364482454e-06, + "loss": 1.0743, + "step": 5097 + }, + { + "epoch": 0.15, + "learning_rate": 4.802434338174746e-06, + "loss": 1.1782, + "step": 5098 + }, + { + "epoch": 0.15, + "learning_rate": 4.802339289948972e-06, + "loss": 1.1799, + "step": 5099 + }, + { + "epoch": 0.15, + "learning_rate": 4.802244219806036e-06, + "loss": 1.0917, + "step": 5100 + }, + { + "epoch": 0.15, + "learning_rate": 4.8021491277468435e-06, + "loss": 1.205, + "step": 5101 + }, + { + "epoch": 0.15, + "learning_rate": 4.8020540137723e-06, + "loss": 1.2088, + "step": 5102 + }, + { + "epoch": 0.15, + "learning_rate": 4.801958877883312e-06, + "loss": 1.1582, + "step": 5103 + }, + { + "epoch": 0.15, + "learning_rate": 4.8018637200807835e-06, + "loss": 1.2324, + "step": 5104 + }, + { + "epoch": 0.15, + "learning_rate": 4.801768540365621e-06, + "loss": 1.2178, + "step": 5105 + }, + { + "epoch": 0.15, + "learning_rate": 4.801673338738732e-06, + "loss": 1.209, + "step": 5106 + }, + { + "epoch": 0.15, + "learning_rate": 4.801578115201019e-06, + "loss": 1.1141, + "step": 5107 + }, + { + "epoch": 0.15, + "learning_rate": 4.801482869753392e-06, + "loss": 1.1453, + "step": 5108 + }, + { + "epoch": 0.15, + "learning_rate": 4.801387602396756e-06, + "loss": 1.166, + "step": 5109 + }, + { + "epoch": 0.15, + "learning_rate": 4.801292313132019e-06, + "loss": 1.0884, + "step": 5110 + }, + { + "epoch": 0.15, + "learning_rate": 4.801197001960088e-06, + "loss": 1.0355, + "step": 5111 + }, + { + "epoch": 0.15, + "learning_rate": 4.801101668881869e-06, + "loss": 1.1458, + "step": 5112 + }, + { + "epoch": 0.15, + "learning_rate": 4.80100631389827e-06, + "loss": 1.1725, + "step": 5113 + }, + { + "epoch": 0.15, + "learning_rate": 4.8009109370102e-06, + "loss": 1.1165, + "step": 5114 + }, + { + "epoch": 0.15, + "learning_rate": 4.800815538218566e-06, + "loss": 1.1827, + "step": 5115 + }, + { + "epoch": 0.15, + "learning_rate": 4.800720117524276e-06, + "loss": 1.1402, + "step": 5116 + }, + { + "epoch": 0.15, + "learning_rate": 4.800624674928238e-06, + "loss": 1.216, + "step": 5117 + }, + { + "epoch": 0.15, + "learning_rate": 4.800529210431362e-06, + "loss": 1.3055, + "step": 5118 + }, + { + "epoch": 0.15, + "learning_rate": 4.8004337240345545e-06, + "loss": 1.2327, + "step": 5119 + }, + { + "epoch": 0.15, + "learning_rate": 4.800338215738727e-06, + "loss": 1.1867, + "step": 5120 + }, + { + "epoch": 0.15, + "learning_rate": 4.800242685544787e-06, + "loss": 1.0835, + "step": 5121 + }, + { + "epoch": 0.15, + "learning_rate": 4.800147133453645e-06, + "loss": 1.1528, + "step": 5122 + }, + { + "epoch": 0.15, + "learning_rate": 4.80005155946621e-06, + "loss": 1.1261, + "step": 5123 + }, + { + "epoch": 0.15, + "learning_rate": 4.799955963583392e-06, + "loss": 1.3672, + "step": 5124 + }, + { + "epoch": 0.15, + "learning_rate": 4.7998603458061e-06, + "loss": 0.9269, + "step": 5125 + }, + { + "epoch": 0.15, + "learning_rate": 4.799764706135246e-06, + "loss": 1.2244, + "step": 5126 + }, + { + "epoch": 0.15, + "learning_rate": 4.7996690445717395e-06, + "loss": 1.1081, + "step": 5127 + }, + { + "epoch": 0.15, + "learning_rate": 4.799573361116492e-06, + "loss": 1.1327, + "step": 5128 + }, + { + "epoch": 0.15, + "learning_rate": 4.799477655770412e-06, + "loss": 1.1406, + "step": 5129 + }, + { + "epoch": 0.15, + "learning_rate": 4.799381928534413e-06, + "loss": 1.2645, + "step": 5130 + }, + { + "epoch": 0.15, + "learning_rate": 4.799286179409406e-06, + "loss": 1.1198, + "step": 5131 + }, + { + "epoch": 0.15, + "learning_rate": 4.799190408396302e-06, + "loss": 1.18, + "step": 5132 + }, + { + "epoch": 0.15, + "learning_rate": 4.7990946154960115e-06, + "loss": 1.187, + "step": 5133 + }, + { + "epoch": 0.15, + "learning_rate": 4.798998800709448e-06, + "loss": 1.1383, + "step": 5134 + }, + { + "epoch": 0.15, + "learning_rate": 4.798902964037523e-06, + "loss": 1.1651, + "step": 5135 + }, + { + "epoch": 0.15, + "learning_rate": 4.798807105481149e-06, + "loss": 1.223, + "step": 5136 + }, + { + "epoch": 0.15, + "learning_rate": 4.798711225041239e-06, + "loss": 1.2248, + "step": 5137 + }, + { + "epoch": 0.15, + "learning_rate": 4.7986153227187045e-06, + "loss": 1.1514, + "step": 5138 + }, + { + "epoch": 0.15, + "learning_rate": 4.79851939851446e-06, + "loss": 1.1865, + "step": 5139 + }, + { + "epoch": 0.15, + "learning_rate": 4.798423452429417e-06, + "loss": 1.1107, + "step": 5140 + }, + { + "epoch": 0.15, + "learning_rate": 4.798327484464491e-06, + "loss": 1.3209, + "step": 5141 + }, + { + "epoch": 0.15, + "learning_rate": 4.798231494620593e-06, + "loss": 1.2887, + "step": 5142 + }, + { + "epoch": 0.15, + "learning_rate": 4.798135482898639e-06, + "loss": 1.1479, + "step": 5143 + }, + { + "epoch": 0.15, + "learning_rate": 4.79803944929954e-06, + "loss": 1.2063, + "step": 5144 + }, + { + "epoch": 0.15, + "learning_rate": 4.797943393824215e-06, + "loss": 1.1616, + "step": 5145 + }, + { + "epoch": 0.16, + "learning_rate": 4.797847316473574e-06, + "loss": 1.1306, + "step": 5146 + }, + { + "epoch": 0.16, + "learning_rate": 4.797751217248534e-06, + "loss": 1.0566, + "step": 5147 + }, + { + "epoch": 0.16, + "learning_rate": 4.797655096150008e-06, + "loss": 1.2606, + "step": 5148 + }, + { + "epoch": 0.16, + "learning_rate": 4.797558953178913e-06, + "loss": 1.1158, + "step": 5149 + }, + { + "epoch": 0.16, + "learning_rate": 4.797462788336163e-06, + "loss": 1.0999, + "step": 5150 + }, + { + "epoch": 0.16, + "learning_rate": 4.797366601622674e-06, + "loss": 1.2336, + "step": 5151 + }, + { + "epoch": 0.16, + "learning_rate": 4.79727039303936e-06, + "loss": 1.16, + "step": 5152 + }, + { + "epoch": 0.16, + "learning_rate": 4.79717416258714e-06, + "loss": 1.1582, + "step": 5153 + }, + { + "epoch": 0.16, + "learning_rate": 4.797077910266928e-06, + "loss": 1.2222, + "step": 5154 + }, + { + "epoch": 0.16, + "learning_rate": 4.7969816360796404e-06, + "loss": 1.2292, + "step": 5155 + }, + { + "epoch": 0.16, + "learning_rate": 4.796885340026194e-06, + "loss": 1.1233, + "step": 5156 + }, + { + "epoch": 0.16, + "learning_rate": 4.796789022107505e-06, + "loss": 1.1117, + "step": 5157 + }, + { + "epoch": 0.16, + "learning_rate": 4.796692682324491e-06, + "loss": 1.0991, + "step": 5158 + }, + { + "epoch": 0.16, + "learning_rate": 4.796596320678069e-06, + "loss": 1.0634, + "step": 5159 + }, + { + "epoch": 0.16, + "learning_rate": 4.796499937169156e-06, + "loss": 1.1321, + "step": 5160 + }, + { + "epoch": 0.16, + "learning_rate": 4.796403531798669e-06, + "loss": 1.087, + "step": 5161 + }, + { + "epoch": 0.16, + "learning_rate": 4.796307104567526e-06, + "loss": 1.2208, + "step": 5162 + }, + { + "epoch": 0.16, + "learning_rate": 4.796210655476646e-06, + "loss": 1.1945, + "step": 5163 + }, + { + "epoch": 0.16, + "learning_rate": 4.796114184526946e-06, + "loss": 1.1485, + "step": 5164 + }, + { + "epoch": 0.16, + "learning_rate": 4.796017691719346e-06, + "loss": 1.1069, + "step": 5165 + }, + { + "epoch": 0.16, + "learning_rate": 4.795921177054763e-06, + "loss": 1.0988, + "step": 5166 + }, + { + "epoch": 0.16, + "learning_rate": 4.795824640534116e-06, + "loss": 1.1996, + "step": 5167 + }, + { + "epoch": 0.16, + "learning_rate": 4.795728082158324e-06, + "loss": 1.2009, + "step": 5168 + }, + { + "epoch": 0.16, + "learning_rate": 4.795631501928306e-06, + "loss": 1.1311, + "step": 5169 + }, + { + "epoch": 0.16, + "learning_rate": 4.795534899844983e-06, + "loss": 1.2148, + "step": 5170 + }, + { + "epoch": 0.16, + "learning_rate": 4.795438275909272e-06, + "loss": 1.1984, + "step": 5171 + }, + { + "epoch": 0.16, + "learning_rate": 4.795341630122094e-06, + "loss": 1.1733, + "step": 5172 + }, + { + "epoch": 0.16, + "learning_rate": 4.79524496248437e-06, + "loss": 1.1032, + "step": 5173 + }, + { + "epoch": 0.16, + "learning_rate": 4.795148272997019e-06, + "loss": 1.222, + "step": 5174 + }, + { + "epoch": 0.16, + "learning_rate": 4.795051561660962e-06, + "loss": 1.2019, + "step": 5175 + }, + { + "epoch": 0.16, + "learning_rate": 4.794954828477118e-06, + "loss": 1.2465, + "step": 5176 + }, + { + "epoch": 0.16, + "learning_rate": 4.794858073446411e-06, + "loss": 1.1713, + "step": 5177 + }, + { + "epoch": 0.16, + "learning_rate": 4.7947612965697605e-06, + "loss": 1.108, + "step": 5178 + }, + { + "epoch": 0.16, + "learning_rate": 4.794664497848087e-06, + "loss": 1.319, + "step": 5179 + }, + { + "epoch": 0.16, + "learning_rate": 4.794567677282312e-06, + "loss": 1.2516, + "step": 5180 + }, + { + "epoch": 0.16, + "learning_rate": 4.794470834873359e-06, + "loss": 1.1625, + "step": 5181 + }, + { + "epoch": 0.16, + "learning_rate": 4.794373970622149e-06, + "loss": 1.0878, + "step": 5182 + }, + { + "epoch": 0.16, + "learning_rate": 4.7942770845296026e-06, + "loss": 1.1326, + "step": 5183 + }, + { + "epoch": 0.16, + "learning_rate": 4.794180176596645e-06, + "loss": 1.1215, + "step": 5184 + }, + { + "epoch": 0.16, + "learning_rate": 4.794083246824195e-06, + "loss": 1.1087, + "step": 5185 + }, + { + "epoch": 0.16, + "learning_rate": 4.793986295213178e-06, + "loss": 1.1684, + "step": 5186 + }, + { + "epoch": 0.16, + "learning_rate": 4.793889321764516e-06, + "loss": 1.1422, + "step": 5187 + }, + { + "epoch": 0.16, + "learning_rate": 4.7937923264791336e-06, + "loss": 1.0951, + "step": 5188 + }, + { + "epoch": 0.16, + "learning_rate": 4.793695309357952e-06, + "loss": 1.2001, + "step": 5189 + }, + { + "epoch": 0.16, + "learning_rate": 4.793598270401896e-06, + "loss": 1.0921, + "step": 5190 + }, + { + "epoch": 0.16, + "learning_rate": 4.793501209611889e-06, + "loss": 1.1958, + "step": 5191 + }, + { + "epoch": 0.16, + "learning_rate": 4.7934041269888556e-06, + "loss": 1.0997, + "step": 5192 + }, + { + "epoch": 0.16, + "learning_rate": 4.7933070225337195e-06, + "loss": 1.2867, + "step": 5193 + }, + { + "epoch": 0.16, + "learning_rate": 4.793209896247404e-06, + "loss": 1.2368, + "step": 5194 + }, + { + "epoch": 0.16, + "learning_rate": 4.793112748130836e-06, + "loss": 1.1237, + "step": 5195 + }, + { + "epoch": 0.16, + "learning_rate": 4.793015578184939e-06, + "loss": 1.1047, + "step": 5196 + }, + { + "epoch": 0.16, + "learning_rate": 4.792918386410636e-06, + "loss": 1.1479, + "step": 5197 + }, + { + "epoch": 0.16, + "learning_rate": 4.7928211728088566e-06, + "loss": 1.1693, + "step": 5198 + }, + { + "epoch": 0.16, + "learning_rate": 4.7927239373805225e-06, + "loss": 1.207, + "step": 5199 + }, + { + "epoch": 0.16, + "learning_rate": 4.792626680126562e-06, + "loss": 1.0853, + "step": 5200 + }, + { + "epoch": 0.16, + "learning_rate": 4.7925294010478985e-06, + "loss": 1.2275, + "step": 5201 + }, + { + "epoch": 0.16, + "learning_rate": 4.79243210014546e-06, + "loss": 1.1014, + "step": 5202 + }, + { + "epoch": 0.16, + "learning_rate": 4.792334777420171e-06, + "loss": 1.1152, + "step": 5203 + }, + { + "epoch": 0.16, + "learning_rate": 4.79223743287296e-06, + "loss": 1.0895, + "step": 5204 + }, + { + "epoch": 0.16, + "learning_rate": 4.7921400665047525e-06, + "loss": 1.1561, + "step": 5205 + }, + { + "epoch": 0.16, + "learning_rate": 4.7920426783164744e-06, + "loss": 1.0991, + "step": 5206 + }, + { + "epoch": 0.16, + "learning_rate": 4.791945268309055e-06, + "loss": 1.0561, + "step": 5207 + }, + { + "epoch": 0.16, + "learning_rate": 4.791847836483419e-06, + "loss": 1.0544, + "step": 5208 + }, + { + "epoch": 0.16, + "learning_rate": 4.7917503828404975e-06, + "loss": 1.0611, + "step": 5209 + }, + { + "epoch": 0.16, + "learning_rate": 4.791652907381215e-06, + "loss": 1.1123, + "step": 5210 + }, + { + "epoch": 0.16, + "learning_rate": 4.791555410106501e-06, + "loss": 1.2568, + "step": 5211 + }, + { + "epoch": 0.16, + "learning_rate": 4.7914578910172825e-06, + "loss": 1.1375, + "step": 5212 + }, + { + "epoch": 0.16, + "learning_rate": 4.791360350114489e-06, + "loss": 1.2201, + "step": 5213 + }, + { + "epoch": 0.16, + "learning_rate": 4.791262787399048e-06, + "loss": 1.1583, + "step": 5214 + }, + { + "epoch": 0.16, + "learning_rate": 4.79116520287189e-06, + "loss": 1.1538, + "step": 5215 + }, + { + "epoch": 0.16, + "learning_rate": 4.791067596533941e-06, + "loss": 1.1772, + "step": 5216 + }, + { + "epoch": 0.16, + "learning_rate": 4.790969968386133e-06, + "loss": 1.2493, + "step": 5217 + }, + { + "epoch": 0.16, + "learning_rate": 4.790872318429394e-06, + "loss": 1.244, + "step": 5218 + }, + { + "epoch": 0.16, + "learning_rate": 4.790774646664654e-06, + "loss": 1.2781, + "step": 5219 + }, + { + "epoch": 0.16, + "learning_rate": 4.790676953092842e-06, + "loss": 1.0705, + "step": 5220 + }, + { + "epoch": 0.16, + "learning_rate": 4.790579237714889e-06, + "loss": 1.1285, + "step": 5221 + }, + { + "epoch": 0.16, + "learning_rate": 4.790481500531725e-06, + "loss": 1.1677, + "step": 5222 + }, + { + "epoch": 0.16, + "learning_rate": 4.790383741544281e-06, + "loss": 1.2615, + "step": 5223 + }, + { + "epoch": 0.16, + "learning_rate": 4.790285960753485e-06, + "loss": 1.1738, + "step": 5224 + }, + { + "epoch": 0.16, + "learning_rate": 4.790188158160271e-06, + "loss": 1.2207, + "step": 5225 + }, + { + "epoch": 0.16, + "learning_rate": 4.790090333765569e-06, + "loss": 1.1785, + "step": 5226 + }, + { + "epoch": 0.16, + "learning_rate": 4.789992487570309e-06, + "loss": 1.2112, + "step": 5227 + }, + { + "epoch": 0.16, + "learning_rate": 4.789894619575424e-06, + "loss": 1.0961, + "step": 5228 + }, + { + "epoch": 0.16, + "learning_rate": 4.789796729781845e-06, + "loss": 1.1276, + "step": 5229 + }, + { + "epoch": 0.16, + "learning_rate": 4.789698818190504e-06, + "loss": 1.2294, + "step": 5230 + }, + { + "epoch": 0.16, + "learning_rate": 4.789600884802333e-06, + "loss": 1.225, + "step": 5231 + }, + { + "epoch": 0.16, + "learning_rate": 4.789502929618264e-06, + "loss": 1.1672, + "step": 5232 + }, + { + "epoch": 0.16, + "learning_rate": 4.78940495263923e-06, + "loss": 1.1528, + "step": 5233 + }, + { + "epoch": 0.16, + "learning_rate": 4.789306953866163e-06, + "loss": 1.137, + "step": 5234 + }, + { + "epoch": 0.16, + "learning_rate": 4.789208933299997e-06, + "loss": 1.0794, + "step": 5235 + }, + { + "epoch": 0.16, + "learning_rate": 4.789110890941664e-06, + "loss": 1.1237, + "step": 5236 + }, + { + "epoch": 0.16, + "learning_rate": 4.789012826792099e-06, + "loss": 1.1015, + "step": 5237 + }, + { + "epoch": 0.16, + "learning_rate": 4.7889147408522326e-06, + "loss": 1.1232, + "step": 5238 + }, + { + "epoch": 0.16, + "learning_rate": 4.788816633123001e-06, + "loss": 1.1031, + "step": 5239 + }, + { + "epoch": 0.16, + "learning_rate": 4.788718503605338e-06, + "loss": 1.1666, + "step": 5240 + }, + { + "epoch": 0.16, + "learning_rate": 4.788620352300176e-06, + "loss": 1.1739, + "step": 5241 + }, + { + "epoch": 0.16, + "learning_rate": 4.7885221792084515e-06, + "loss": 1.2026, + "step": 5242 + }, + { + "epoch": 0.16, + "learning_rate": 4.788423984331098e-06, + "loss": 1.2251, + "step": 5243 + }, + { + "epoch": 0.16, + "learning_rate": 4.788325767669049e-06, + "loss": 1.1105, + "step": 5244 + }, + { + "epoch": 0.16, + "learning_rate": 4.788227529223242e-06, + "loss": 1.1141, + "step": 5245 + }, + { + "epoch": 0.16, + "learning_rate": 4.7881292689946105e-06, + "loss": 1.1154, + "step": 5246 + }, + { + "epoch": 0.16, + "learning_rate": 4.788030986984091e-06, + "loss": 1.1874, + "step": 5247 + }, + { + "epoch": 0.16, + "learning_rate": 4.787932683192617e-06, + "loss": 1.2575, + "step": 5248 + }, + { + "epoch": 0.16, + "learning_rate": 4.787834357621127e-06, + "loss": 1.3188, + "step": 5249 + }, + { + "epoch": 0.16, + "learning_rate": 4.787736010270556e-06, + "loss": 1.2408, + "step": 5250 + }, + { + "epoch": 0.16, + "learning_rate": 4.787637641141839e-06, + "loss": 1.1522, + "step": 5251 + }, + { + "epoch": 0.16, + "learning_rate": 4.787539250235914e-06, + "loss": 1.0325, + "step": 5252 + }, + { + "epoch": 0.16, + "learning_rate": 4.787440837553717e-06, + "loss": 0.9888, + "step": 5253 + }, + { + "epoch": 0.16, + "learning_rate": 4.7873424030961845e-06, + "loss": 1.114, + "step": 5254 + }, + { + "epoch": 0.16, + "learning_rate": 4.7872439468642544e-06, + "loss": 1.2681, + "step": 5255 + }, + { + "epoch": 0.16, + "learning_rate": 4.787145468858864e-06, + "loss": 1.1019, + "step": 5256 + }, + { + "epoch": 0.16, + "learning_rate": 4.78704696908095e-06, + "loss": 1.2061, + "step": 5257 + }, + { + "epoch": 0.16, + "learning_rate": 4.78694844753145e-06, + "loss": 1.1344, + "step": 5258 + }, + { + "epoch": 0.16, + "learning_rate": 4.786849904211301e-06, + "loss": 1.1289, + "step": 5259 + }, + { + "epoch": 0.16, + "learning_rate": 4.786751339121444e-06, + "loss": 1.0967, + "step": 5260 + }, + { + "epoch": 0.16, + "learning_rate": 4.786652752262815e-06, + "loss": 1.1772, + "step": 5261 + }, + { + "epoch": 0.16, + "learning_rate": 4.786554143636353e-06, + "loss": 1.2552, + "step": 5262 + }, + { + "epoch": 0.16, + "learning_rate": 4.7864555132429965e-06, + "loss": 1.1265, + "step": 5263 + }, + { + "epoch": 0.16, + "learning_rate": 4.786356861083686e-06, + "loss": 1.1558, + "step": 5264 + }, + { + "epoch": 0.16, + "learning_rate": 4.7862581871593585e-06, + "loss": 1.2089, + "step": 5265 + }, + { + "epoch": 0.16, + "learning_rate": 4.786159491470954e-06, + "loss": 1.079, + "step": 5266 + }, + { + "epoch": 0.16, + "learning_rate": 4.786060774019412e-06, + "loss": 1.1916, + "step": 5267 + }, + { + "epoch": 0.16, + "learning_rate": 4.785962034805674e-06, + "loss": 1.1199, + "step": 5268 + }, + { + "epoch": 0.16, + "learning_rate": 4.785863273830676e-06, + "loss": 1.045, + "step": 5269 + }, + { + "epoch": 0.16, + "learning_rate": 4.7857644910953615e-06, + "loss": 1.1873, + "step": 5270 + }, + { + "epoch": 0.16, + "learning_rate": 4.785665686600671e-06, + "loss": 1.1522, + "step": 5271 + }, + { + "epoch": 0.16, + "learning_rate": 4.785566860347543e-06, + "loss": 1.1927, + "step": 5272 + }, + { + "epoch": 0.16, + "learning_rate": 4.785468012336919e-06, + "loss": 1.1454, + "step": 5273 + }, + { + "epoch": 0.16, + "learning_rate": 4.785369142569741e-06, + "loss": 1.0884, + "step": 5274 + }, + { + "epoch": 0.16, + "learning_rate": 4.785270251046949e-06, + "loss": 1.0565, + "step": 5275 + }, + { + "epoch": 0.16, + "learning_rate": 4.785171337769485e-06, + "loss": 1.1556, + "step": 5276 + }, + { + "epoch": 0.16, + "learning_rate": 4.78507240273829e-06, + "loss": 1.0682, + "step": 5277 + }, + { + "epoch": 0.16, + "learning_rate": 4.784973445954306e-06, + "loss": 1.1536, + "step": 5278 + }, + { + "epoch": 0.16, + "learning_rate": 4.784874467418477e-06, + "loss": 1.1824, + "step": 5279 + }, + { + "epoch": 0.16, + "learning_rate": 4.784775467131741e-06, + "loss": 1.2235, + "step": 5280 + }, + { + "epoch": 0.16, + "learning_rate": 4.784676445095045e-06, + "loss": 1.1268, + "step": 5281 + }, + { + "epoch": 0.16, + "learning_rate": 4.784577401309329e-06, + "loss": 1.1758, + "step": 5282 + }, + { + "epoch": 0.16, + "learning_rate": 4.784478335775536e-06, + "loss": 1.1127, + "step": 5283 + }, + { + "epoch": 0.16, + "learning_rate": 4.784379248494609e-06, + "loss": 1.1038, + "step": 5284 + }, + { + "epoch": 0.16, + "learning_rate": 4.784280139467493e-06, + "loss": 1.1663, + "step": 5285 + }, + { + "epoch": 0.16, + "learning_rate": 4.78418100869513e-06, + "loss": 1.1868, + "step": 5286 + }, + { + "epoch": 0.16, + "learning_rate": 4.784081856178464e-06, + "loss": 1.1778, + "step": 5287 + }, + { + "epoch": 0.16, + "learning_rate": 4.783982681918438e-06, + "loss": 1.0251, + "step": 5288 + }, + { + "epoch": 0.16, + "learning_rate": 4.783883485915998e-06, + "loss": 1.2044, + "step": 5289 + }, + { + "epoch": 0.16, + "learning_rate": 4.783784268172086e-06, + "loss": 1.08, + "step": 5290 + }, + { + "epoch": 0.16, + "learning_rate": 4.7836850286876475e-06, + "loss": 1.2081, + "step": 5291 + }, + { + "epoch": 0.16, + "learning_rate": 4.7835857674636285e-06, + "loss": 1.1421, + "step": 5292 + }, + { + "epoch": 0.16, + "learning_rate": 4.783486484500972e-06, + "loss": 1.2043, + "step": 5293 + }, + { + "epoch": 0.16, + "learning_rate": 4.783387179800625e-06, + "loss": 1.1685, + "step": 5294 + }, + { + "epoch": 0.16, + "learning_rate": 4.783287853363531e-06, + "loss": 1.1776, + "step": 5295 + }, + { + "epoch": 0.16, + "learning_rate": 4.783188505190636e-06, + "loss": 1.1613, + "step": 5296 + }, + { + "epoch": 0.16, + "learning_rate": 4.783089135282887e-06, + "loss": 1.0831, + "step": 5297 + }, + { + "epoch": 0.16, + "learning_rate": 4.782989743641227e-06, + "loss": 1.1448, + "step": 5298 + }, + { + "epoch": 0.16, + "learning_rate": 4.782890330266606e-06, + "loss": 1.1146, + "step": 5299 + }, + { + "epoch": 0.16, + "learning_rate": 4.782790895159969e-06, + "loss": 1.0209, + "step": 5300 + }, + { + "epoch": 0.16, + "learning_rate": 4.782691438322261e-06, + "loss": 1.0817, + "step": 5301 + }, + { + "epoch": 0.16, + "learning_rate": 4.78259195975443e-06, + "loss": 1.1447, + "step": 5302 + }, + { + "epoch": 0.16, + "learning_rate": 4.782492459457423e-06, + "loss": 1.1526, + "step": 5303 + }, + { + "epoch": 0.16, + "learning_rate": 4.782392937432186e-06, + "loss": 1.0887, + "step": 5304 + }, + { + "epoch": 0.16, + "learning_rate": 4.782293393679669e-06, + "loss": 1.1536, + "step": 5305 + }, + { + "epoch": 0.16, + "learning_rate": 4.782193828200818e-06, + "loss": 1.1808, + "step": 5306 + }, + { + "epoch": 0.16, + "learning_rate": 4.782094240996581e-06, + "loss": 1.2277, + "step": 5307 + }, + { + "epoch": 0.16, + "learning_rate": 4.781994632067905e-06, + "loss": 1.131, + "step": 5308 + }, + { + "epoch": 0.16, + "learning_rate": 4.78189500141574e-06, + "loss": 1.0908, + "step": 5309 + }, + { + "epoch": 0.16, + "learning_rate": 4.781795349041033e-06, + "loss": 1.1775, + "step": 5310 + }, + { + "epoch": 0.16, + "learning_rate": 4.781695674944733e-06, + "loss": 1.2023, + "step": 5311 + }, + { + "epoch": 0.16, + "learning_rate": 4.781595979127789e-06, + "loss": 1.2087, + "step": 5312 + }, + { + "epoch": 0.16, + "learning_rate": 4.781496261591151e-06, + "loss": 1.1953, + "step": 5313 + }, + { + "epoch": 0.16, + "learning_rate": 4.781396522335768e-06, + "loss": 1.12, + "step": 5314 + }, + { + "epoch": 0.16, + "learning_rate": 4.781296761362587e-06, + "loss": 1.0356, + "step": 5315 + }, + { + "epoch": 0.16, + "learning_rate": 4.78119697867256e-06, + "loss": 1.1041, + "step": 5316 + }, + { + "epoch": 0.16, + "learning_rate": 4.781097174266637e-06, + "loss": 1.1564, + "step": 5317 + }, + { + "epoch": 0.16, + "learning_rate": 4.780997348145767e-06, + "loss": 1.2321, + "step": 5318 + }, + { + "epoch": 0.16, + "learning_rate": 4.780897500310902e-06, + "loss": 1.1462, + "step": 5319 + }, + { + "epoch": 0.16, + "learning_rate": 4.78079763076299e-06, + "loss": 1.0704, + "step": 5320 + }, + { + "epoch": 0.16, + "learning_rate": 4.780697739502984e-06, + "loss": 1.0896, + "step": 5321 + }, + { + "epoch": 0.16, + "learning_rate": 4.780597826531833e-06, + "loss": 1.1222, + "step": 5322 + }, + { + "epoch": 0.16, + "learning_rate": 4.78049789185049e-06, + "loss": 1.1356, + "step": 5323 + }, + { + "epoch": 0.16, + "learning_rate": 4.780397935459904e-06, + "loss": 1.1606, + "step": 5324 + }, + { + "epoch": 0.16, + "learning_rate": 4.780297957361029e-06, + "loss": 1.178, + "step": 5325 + }, + { + "epoch": 0.16, + "learning_rate": 4.7801979575548156e-06, + "loss": 1.1563, + "step": 5326 + }, + { + "epoch": 0.16, + "learning_rate": 4.780097936042216e-06, + "loss": 1.1714, + "step": 5327 + }, + { + "epoch": 0.16, + "learning_rate": 4.779997892824182e-06, + "loss": 1.1, + "step": 5328 + }, + { + "epoch": 0.16, + "learning_rate": 4.779897827901665e-06, + "loss": 1.1573, + "step": 5329 + }, + { + "epoch": 0.16, + "learning_rate": 4.77979774127562e-06, + "loss": 1.1453, + "step": 5330 + }, + { + "epoch": 0.16, + "learning_rate": 4.779697632946998e-06, + "loss": 1.1511, + "step": 5331 + }, + { + "epoch": 0.16, + "learning_rate": 4.779597502916753e-06, + "loss": 1.1876, + "step": 5332 + }, + { + "epoch": 0.16, + "learning_rate": 4.779497351185838e-06, + "loss": 1.2491, + "step": 5333 + }, + { + "epoch": 0.16, + "learning_rate": 4.779397177755205e-06, + "loss": 1.1668, + "step": 5334 + }, + { + "epoch": 0.16, + "learning_rate": 4.7792969826258095e-06, + "loss": 1.1007, + "step": 5335 + }, + { + "epoch": 0.16, + "learning_rate": 4.779196765798604e-06, + "loss": 1.0799, + "step": 5336 + }, + { + "epoch": 0.16, + "learning_rate": 4.779096527274542e-06, + "loss": 1.1678, + "step": 5337 + }, + { + "epoch": 0.16, + "learning_rate": 4.778996267054581e-06, + "loss": 1.1607, + "step": 5338 + }, + { + "epoch": 0.16, + "learning_rate": 4.778895985139672e-06, + "loss": 1.0276, + "step": 5339 + }, + { + "epoch": 0.16, + "learning_rate": 4.77879568153077e-06, + "loss": 1.2162, + "step": 5340 + }, + { + "epoch": 0.16, + "learning_rate": 4.778695356228832e-06, + "loss": 1.1226, + "step": 5341 + }, + { + "epoch": 0.16, + "learning_rate": 4.778595009234811e-06, + "loss": 1.1016, + "step": 5342 + }, + { + "epoch": 0.16, + "learning_rate": 4.778494640549663e-06, + "loss": 1.1871, + "step": 5343 + }, + { + "epoch": 0.16, + "learning_rate": 4.778394250174343e-06, + "loss": 1.2682, + "step": 5344 + }, + { + "epoch": 0.16, + "learning_rate": 4.778293838109807e-06, + "loss": 1.1648, + "step": 5345 + }, + { + "epoch": 0.16, + "learning_rate": 4.778193404357011e-06, + "loss": 1.1085, + "step": 5346 + }, + { + "epoch": 0.16, + "learning_rate": 4.778092948916912e-06, + "loss": 1.152, + "step": 5347 + }, + { + "epoch": 0.16, + "learning_rate": 4.777992471790465e-06, + "loss": 1.2927, + "step": 5348 + }, + { + "epoch": 0.16, + "learning_rate": 4.777891972978625e-06, + "loss": 1.1566, + "step": 5349 + }, + { + "epoch": 0.16, + "learning_rate": 4.777791452482352e-06, + "loss": 1.151, + "step": 5350 + }, + { + "epoch": 0.16, + "learning_rate": 4.777690910302601e-06, + "loss": 1.2119, + "step": 5351 + }, + { + "epoch": 0.16, + "learning_rate": 4.77759034644033e-06, + "loss": 1.1797, + "step": 5352 + }, + { + "epoch": 0.16, + "learning_rate": 4.777489760896496e-06, + "loss": 1.1379, + "step": 5353 + }, + { + "epoch": 0.16, + "learning_rate": 4.777389153672056e-06, + "loss": 1.3248, + "step": 5354 + }, + { + "epoch": 0.16, + "learning_rate": 4.777288524767968e-06, + "loss": 1.2123, + "step": 5355 + }, + { + "epoch": 0.16, + "learning_rate": 4.77718787418519e-06, + "loss": 1.2628, + "step": 5356 + }, + { + "epoch": 0.16, + "learning_rate": 4.77708720192468e-06, + "loss": 1.1442, + "step": 5357 + }, + { + "epoch": 0.16, + "learning_rate": 4.776986507987397e-06, + "loss": 1.0754, + "step": 5358 + }, + { + "epoch": 0.16, + "learning_rate": 4.776885792374298e-06, + "loss": 1.1536, + "step": 5359 + }, + { + "epoch": 0.16, + "learning_rate": 4.776785055086344e-06, + "loss": 1.1243, + "step": 5360 + }, + { + "epoch": 0.16, + "learning_rate": 4.776684296124493e-06, + "loss": 1.2088, + "step": 5361 + }, + { + "epoch": 0.16, + "learning_rate": 4.776583515489703e-06, + "loss": 1.0699, + "step": 5362 + }, + { + "epoch": 0.16, + "learning_rate": 4.776482713182935e-06, + "loss": 1.0712, + "step": 5363 + }, + { + "epoch": 0.16, + "learning_rate": 4.7763818892051475e-06, + "loss": 1.0496, + "step": 5364 + }, + { + "epoch": 0.16, + "learning_rate": 4.776281043557301e-06, + "loss": 1.1468, + "step": 5365 + }, + { + "epoch": 0.16, + "learning_rate": 4.776180176240356e-06, + "loss": 1.1855, + "step": 5366 + }, + { + "epoch": 0.16, + "learning_rate": 4.776079287255271e-06, + "loss": 1.2054, + "step": 5367 + }, + { + "epoch": 0.16, + "learning_rate": 4.775978376603008e-06, + "loss": 1.0211, + "step": 5368 + }, + { + "epoch": 0.16, + "learning_rate": 4.775877444284525e-06, + "loss": 1.1472, + "step": 5369 + }, + { + "epoch": 0.16, + "learning_rate": 4.7757764903007875e-06, + "loss": 1.1555, + "step": 5370 + }, + { + "epoch": 0.16, + "learning_rate": 4.775675514652753e-06, + "loss": 1.1387, + "step": 5371 + }, + { + "epoch": 0.16, + "learning_rate": 4.775574517341383e-06, + "loss": 1.0247, + "step": 5372 + }, + { + "epoch": 0.16, + "learning_rate": 4.775473498367641e-06, + "loss": 1.2135, + "step": 5373 + }, + { + "epoch": 0.16, + "learning_rate": 4.775372457732486e-06, + "loss": 1.197, + "step": 5374 + }, + { + "epoch": 0.16, + "learning_rate": 4.7752713954368805e-06, + "loss": 1.1605, + "step": 5375 + }, + { + "epoch": 0.16, + "learning_rate": 4.775170311481788e-06, + "loss": 1.147, + "step": 5376 + }, + { + "epoch": 0.16, + "learning_rate": 4.77506920586817e-06, + "loss": 1.1115, + "step": 5377 + }, + { + "epoch": 0.16, + "learning_rate": 4.7749680785969885e-06, + "loss": 1.1384, + "step": 5378 + }, + { + "epoch": 0.16, + "learning_rate": 4.7748669296692064e-06, + "loss": 1.1132, + "step": 5379 + }, + { + "epoch": 0.16, + "learning_rate": 4.774765759085788e-06, + "loss": 1.1562, + "step": 5380 + }, + { + "epoch": 0.16, + "learning_rate": 4.774664566847693e-06, + "loss": 0.9844, + "step": 5381 + }, + { + "epoch": 0.16, + "learning_rate": 4.7745633529558886e-06, + "loss": 1.0771, + "step": 5382 + }, + { + "epoch": 0.16, + "learning_rate": 4.774462117411336e-06, + "loss": 1.1809, + "step": 5383 + }, + { + "epoch": 0.16, + "learning_rate": 4.774360860214999e-06, + "loss": 1.0482, + "step": 5384 + }, + { + "epoch": 0.16, + "learning_rate": 4.774259581367843e-06, + "loss": 1.1602, + "step": 5385 + }, + { + "epoch": 0.16, + "learning_rate": 4.774158280870831e-06, + "loss": 1.2123, + "step": 5386 + }, + { + "epoch": 0.16, + "learning_rate": 4.774056958724926e-06, + "loss": 1.0468, + "step": 5387 + }, + { + "epoch": 0.16, + "learning_rate": 4.773955614931095e-06, + "loss": 1.1891, + "step": 5388 + }, + { + "epoch": 0.16, + "learning_rate": 4.773854249490302e-06, + "loss": 1.187, + "step": 5389 + }, + { + "epoch": 0.16, + "learning_rate": 4.7737528624035115e-06, + "loss": 1.0966, + "step": 5390 + }, + { + "epoch": 0.16, + "learning_rate": 4.773651453671688e-06, + "loss": 1.106, + "step": 5391 + }, + { + "epoch": 0.16, + "learning_rate": 4.773550023295799e-06, + "loss": 1.19, + "step": 5392 + }, + { + "epoch": 0.16, + "learning_rate": 4.773448571276808e-06, + "loss": 1.1473, + "step": 5393 + }, + { + "epoch": 0.16, + "learning_rate": 4.773347097615682e-06, + "loss": 1.1584, + "step": 5394 + }, + { + "epoch": 0.16, + "learning_rate": 4.773245602313386e-06, + "loss": 1.1149, + "step": 5395 + }, + { + "epoch": 0.16, + "learning_rate": 4.773144085370887e-06, + "loss": 1.1511, + "step": 5396 + }, + { + "epoch": 0.16, + "learning_rate": 4.773042546789151e-06, + "loss": 1.2075, + "step": 5397 + }, + { + "epoch": 0.16, + "learning_rate": 4.772940986569144e-06, + "loss": 1.1573, + "step": 5398 + }, + { + "epoch": 0.16, + "learning_rate": 4.772839404711834e-06, + "loss": 1.1473, + "step": 5399 + }, + { + "epoch": 0.16, + "learning_rate": 4.772737801218188e-06, + "loss": 1.1362, + "step": 5400 + }, + { + "epoch": 0.16, + "learning_rate": 4.772636176089172e-06, + "loss": 1.2113, + "step": 5401 + }, + { + "epoch": 0.16, + "learning_rate": 4.772534529325754e-06, + "loss": 1.1597, + "step": 5402 + }, + { + "epoch": 0.16, + "learning_rate": 4.7724328609289025e-06, + "loss": 1.1023, + "step": 5403 + }, + { + "epoch": 0.16, + "learning_rate": 4.772331170899585e-06, + "loss": 1.1264, + "step": 5404 + }, + { + "epoch": 0.16, + "learning_rate": 4.772229459238768e-06, + "loss": 1.1823, + "step": 5405 + }, + { + "epoch": 0.16, + "learning_rate": 4.772127725947422e-06, + "loss": 1.1116, + "step": 5406 + }, + { + "epoch": 0.16, + "learning_rate": 4.7720259710265135e-06, + "loss": 1.2021, + "step": 5407 + }, + { + "epoch": 0.16, + "learning_rate": 4.771924194477012e-06, + "loss": 1.1749, + "step": 5408 + }, + { + "epoch": 0.16, + "learning_rate": 4.771822396299886e-06, + "loss": 1.1956, + "step": 5409 + }, + { + "epoch": 0.16, + "learning_rate": 4.771720576496106e-06, + "loss": 1.0889, + "step": 5410 + }, + { + "epoch": 0.16, + "learning_rate": 4.7716187350666395e-06, + "loss": 1.1818, + "step": 5411 + }, + { + "epoch": 0.16, + "learning_rate": 4.7715168720124575e-06, + "loss": 1.3383, + "step": 5412 + }, + { + "epoch": 0.16, + "learning_rate": 4.771414987334528e-06, + "loss": 1.2205, + "step": 5413 + }, + { + "epoch": 0.16, + "learning_rate": 4.771313081033822e-06, + "loss": 1.227, + "step": 5414 + }, + { + "epoch": 0.16, + "learning_rate": 4.771211153111309e-06, + "loss": 1.1069, + "step": 5415 + }, + { + "epoch": 0.16, + "learning_rate": 4.7711092035679606e-06, + "loss": 1.1944, + "step": 5416 + }, + { + "epoch": 0.16, + "learning_rate": 4.771007232404746e-06, + "loss": 1.0537, + "step": 5417 + }, + { + "epoch": 0.16, + "learning_rate": 4.7709052396226365e-06, + "loss": 1.2496, + "step": 5418 + }, + { + "epoch": 0.16, + "learning_rate": 4.770803225222602e-06, + "loss": 1.0325, + "step": 5419 + }, + { + "epoch": 0.16, + "learning_rate": 4.7707011892056154e-06, + "loss": 1.1899, + "step": 5420 + }, + { + "epoch": 0.16, + "learning_rate": 4.770599131572646e-06, + "loss": 1.0698, + "step": 5421 + }, + { + "epoch": 0.16, + "learning_rate": 4.770497052324667e-06, + "loss": 1.1249, + "step": 5422 + }, + { + "epoch": 0.16, + "learning_rate": 4.77039495146265e-06, + "loss": 1.1851, + "step": 5423 + }, + { + "epoch": 0.16, + "learning_rate": 4.7702928289875664e-06, + "loss": 1.2783, + "step": 5424 + }, + { + "epoch": 0.16, + "learning_rate": 4.7701906849003886e-06, + "loss": 1.1509, + "step": 5425 + }, + { + "epoch": 0.16, + "learning_rate": 4.770088519202088e-06, + "loss": 1.2329, + "step": 5426 + }, + { + "epoch": 0.16, + "learning_rate": 4.769986331893639e-06, + "loss": 1.1951, + "step": 5427 + }, + { + "epoch": 0.16, + "learning_rate": 4.769884122976013e-06, + "loss": 1.118, + "step": 5428 + }, + { + "epoch": 0.16, + "learning_rate": 4.769781892450182e-06, + "loss": 1.1973, + "step": 5429 + }, + { + "epoch": 0.16, + "learning_rate": 4.769679640317123e-06, + "loss": 1.2823, + "step": 5430 + }, + { + "epoch": 0.16, + "learning_rate": 4.7695773665778055e-06, + "loss": 1.0839, + "step": 5431 + }, + { + "epoch": 0.16, + "learning_rate": 4.769475071233205e-06, + "loss": 1.2162, + "step": 5432 + }, + { + "epoch": 0.16, + "learning_rate": 4.769372754284294e-06, + "loss": 1.1572, + "step": 5433 + }, + { + "epoch": 0.16, + "learning_rate": 4.769270415732048e-06, + "loss": 1.1249, + "step": 5434 + }, + { + "epoch": 0.16, + "learning_rate": 4.769168055577441e-06, + "loss": 1.1385, + "step": 5435 + }, + { + "epoch": 0.16, + "learning_rate": 4.769065673821447e-06, + "loss": 1.2587, + "step": 5436 + }, + { + "epoch": 0.16, + "learning_rate": 4.768963270465039e-06, + "loss": 1.3349, + "step": 5437 + }, + { + "epoch": 0.16, + "learning_rate": 4.768860845509196e-06, + "loss": 1.1644, + "step": 5438 + }, + { + "epoch": 0.16, + "learning_rate": 4.768758398954888e-06, + "loss": 1.1409, + "step": 5439 + }, + { + "epoch": 0.16, + "learning_rate": 4.768655930803095e-06, + "loss": 1.183, + "step": 5440 + }, + { + "epoch": 0.16, + "learning_rate": 4.768553441054788e-06, + "loss": 1.0802, + "step": 5441 + }, + { + "epoch": 0.16, + "learning_rate": 4.768450929710946e-06, + "loss": 1.1511, + "step": 5442 + }, + { + "epoch": 0.16, + "learning_rate": 4.768348396772543e-06, + "loss": 1.1215, + "step": 5443 + }, + { + "epoch": 0.16, + "learning_rate": 4.768245842240556e-06, + "loss": 1.2521, + "step": 5444 + }, + { + "epoch": 0.16, + "learning_rate": 4.768143266115961e-06, + "loss": 1.1791, + "step": 5445 + }, + { + "epoch": 0.16, + "learning_rate": 4.768040668399735e-06, + "loss": 1.1354, + "step": 5446 + }, + { + "epoch": 0.16, + "learning_rate": 4.767938049092854e-06, + "loss": 1.1523, + "step": 5447 + }, + { + "epoch": 0.16, + "learning_rate": 4.767835408196295e-06, + "loss": 1.0944, + "step": 5448 + }, + { + "epoch": 0.16, + "learning_rate": 4.767732745711035e-06, + "loss": 1.2213, + "step": 5449 + }, + { + "epoch": 0.16, + "learning_rate": 4.767630061638051e-06, + "loss": 1.2251, + "step": 5450 + }, + { + "epoch": 0.16, + "learning_rate": 4.767527355978321e-06, + "loss": 1.0949, + "step": 5451 + }, + { + "epoch": 0.16, + "learning_rate": 4.767424628732823e-06, + "loss": 1.1921, + "step": 5452 + }, + { + "epoch": 0.16, + "learning_rate": 4.767321879902534e-06, + "loss": 1.1176, + "step": 5453 + }, + { + "epoch": 0.16, + "learning_rate": 4.767219109488434e-06, + "loss": 1.1275, + "step": 5454 + }, + { + "epoch": 0.16, + "learning_rate": 4.767116317491499e-06, + "loss": 1.2115, + "step": 5455 + }, + { + "epoch": 0.16, + "learning_rate": 4.767013503912709e-06, + "loss": 1.2869, + "step": 5456 + }, + { + "epoch": 0.16, + "learning_rate": 4.766910668753042e-06, + "loss": 1.2646, + "step": 5457 + }, + { + "epoch": 0.16, + "learning_rate": 4.766807812013478e-06, + "loss": 1.1493, + "step": 5458 + }, + { + "epoch": 0.16, + "learning_rate": 4.766704933694994e-06, + "loss": 1.1353, + "step": 5459 + }, + { + "epoch": 0.16, + "learning_rate": 4.766602033798572e-06, + "loss": 1.2301, + "step": 5460 + }, + { + "epoch": 0.16, + "learning_rate": 4.766499112325189e-06, + "loss": 1.1783, + "step": 5461 + }, + { + "epoch": 0.16, + "learning_rate": 4.766396169275827e-06, + "loss": 1.1494, + "step": 5462 + }, + { + "epoch": 0.16, + "learning_rate": 4.766293204651464e-06, + "loss": 1.1046, + "step": 5463 + }, + { + "epoch": 0.16, + "learning_rate": 4.766190218453082e-06, + "loss": 1.1412, + "step": 5464 + }, + { + "epoch": 0.16, + "learning_rate": 4.766087210681661e-06, + "loss": 1.1451, + "step": 5465 + }, + { + "epoch": 0.16, + "learning_rate": 4.76598418133818e-06, + "loss": 1.1232, + "step": 5466 + }, + { + "epoch": 0.16, + "learning_rate": 4.765881130423622e-06, + "loss": 1.0959, + "step": 5467 + }, + { + "epoch": 0.16, + "learning_rate": 4.765778057938966e-06, + "loss": 1.1891, + "step": 5468 + }, + { + "epoch": 0.16, + "learning_rate": 4.765674963885194e-06, + "loss": 1.1757, + "step": 5469 + }, + { + "epoch": 0.16, + "learning_rate": 4.7655718482632884e-06, + "loss": 1.1753, + "step": 5470 + }, + { + "epoch": 0.16, + "learning_rate": 4.76546871107423e-06, + "loss": 1.0906, + "step": 5471 + }, + { + "epoch": 0.16, + "learning_rate": 4.765365552319e-06, + "loss": 1.0641, + "step": 5472 + }, + { + "epoch": 0.16, + "learning_rate": 4.7652623719985814e-06, + "loss": 1.0712, + "step": 5473 + }, + { + "epoch": 0.16, + "learning_rate": 4.765159170113955e-06, + "loss": 1.2418, + "step": 5474 + }, + { + "epoch": 0.16, + "learning_rate": 4.7650559466661054e-06, + "loss": 1.2037, + "step": 5475 + }, + { + "epoch": 0.16, + "learning_rate": 4.764952701656014e-06, + "loss": 1.1654, + "step": 5476 + }, + { + "epoch": 0.16, + "learning_rate": 4.764849435084663e-06, + "loss": 1.1675, + "step": 5477 + }, + { + "epoch": 0.17, + "learning_rate": 4.764746146953036e-06, + "loss": 1.0486, + "step": 5478 + }, + { + "epoch": 0.17, + "learning_rate": 4.764642837262118e-06, + "loss": 1.1371, + "step": 5479 + }, + { + "epoch": 0.17, + "learning_rate": 4.76453950601289e-06, + "loss": 1.1205, + "step": 5480 + }, + { + "epoch": 0.17, + "learning_rate": 4.764436153206335e-06, + "loss": 1.1147, + "step": 5481 + }, + { + "epoch": 0.17, + "learning_rate": 4.76433277884344e-06, + "loss": 1.163, + "step": 5482 + }, + { + "epoch": 0.17, + "learning_rate": 4.764229382925187e-06, + "loss": 1.1936, + "step": 5483 + }, + { + "epoch": 0.17, + "learning_rate": 4.764125965452562e-06, + "loss": 1.1791, + "step": 5484 + }, + { + "epoch": 0.17, + "learning_rate": 4.764022526426547e-06, + "loss": 1.0843, + "step": 5485 + }, + { + "epoch": 0.17, + "learning_rate": 4.7639190658481284e-06, + "loss": 1.2407, + "step": 5486 + }, + { + "epoch": 0.17, + "learning_rate": 4.76381558371829e-06, + "loss": 1.2131, + "step": 5487 + }, + { + "epoch": 0.17, + "learning_rate": 4.763712080038018e-06, + "loss": 1.171, + "step": 5488 + }, + { + "epoch": 0.17, + "learning_rate": 4.763608554808298e-06, + "loss": 1.1984, + "step": 5489 + }, + { + "epoch": 0.17, + "learning_rate": 4.7635050080301135e-06, + "loss": 0.9995, + "step": 5490 + }, + { + "epoch": 0.17, + "learning_rate": 4.763401439704452e-06, + "loss": 0.9451, + "step": 5491 + }, + { + "epoch": 0.17, + "learning_rate": 4.763297849832299e-06, + "loss": 1.239, + "step": 5492 + }, + { + "epoch": 0.17, + "learning_rate": 4.7631942384146405e-06, + "loss": 1.1317, + "step": 5493 + }, + { + "epoch": 0.17, + "learning_rate": 4.763090605452462e-06, + "loss": 1.1398, + "step": 5494 + }, + { + "epoch": 0.17, + "learning_rate": 4.762986950946752e-06, + "loss": 1.1049, + "step": 5495 + }, + { + "epoch": 0.17, + "learning_rate": 4.762883274898495e-06, + "loss": 1.1964, + "step": 5496 + }, + { + "epoch": 0.17, + "learning_rate": 4.76277957730868e-06, + "loss": 1.1031, + "step": 5497 + }, + { + "epoch": 0.17, + "learning_rate": 4.762675858178293e-06, + "loss": 1.0951, + "step": 5498 + }, + { + "epoch": 0.17, + "learning_rate": 4.762572117508322e-06, + "loss": 1.1815, + "step": 5499 + }, + { + "epoch": 0.17, + "learning_rate": 4.762468355299753e-06, + "loss": 1.1891, + "step": 5500 + }, + { + "epoch": 0.17, + "learning_rate": 4.762364571553576e-06, + "loss": 1.1494, + "step": 5501 + }, + { + "epoch": 0.17, + "learning_rate": 4.762260766270777e-06, + "loss": 1.0777, + "step": 5502 + }, + { + "epoch": 0.17, + "learning_rate": 4.762156939452346e-06, + "loss": 1.1251, + "step": 5503 + }, + { + "epoch": 0.17, + "learning_rate": 4.7620530910992705e-06, + "loss": 1.0833, + "step": 5504 + }, + { + "epoch": 0.17, + "learning_rate": 4.761949221212538e-06, + "loss": 1.2542, + "step": 5505 + }, + { + "epoch": 0.17, + "learning_rate": 4.761845329793139e-06, + "loss": 1.1104, + "step": 5506 + }, + { + "epoch": 0.17, + "learning_rate": 4.761741416842061e-06, + "loss": 1.1059, + "step": 5507 + }, + { + "epoch": 0.17, + "learning_rate": 4.7616374823602944e-06, + "loss": 1.1764, + "step": 5508 + }, + { + "epoch": 0.17, + "learning_rate": 4.761533526348828e-06, + "loss": 1.1451, + "step": 5509 + }, + { + "epoch": 0.17, + "learning_rate": 4.761429548808653e-06, + "loss": 1.0889, + "step": 5510 + }, + { + "epoch": 0.17, + "learning_rate": 4.7613255497407564e-06, + "loss": 1.1285, + "step": 5511 + }, + { + "epoch": 0.17, + "learning_rate": 4.76122152914613e-06, + "loss": 1.2294, + "step": 5512 + }, + { + "epoch": 0.17, + "learning_rate": 4.761117487025764e-06, + "loss": 1.0236, + "step": 5513 + }, + { + "epoch": 0.17, + "learning_rate": 4.761013423380648e-06, + "loss": 1.0816, + "step": 5514 + }, + { + "epoch": 0.17, + "learning_rate": 4.760909338211773e-06, + "loss": 1.2247, + "step": 5515 + }, + { + "epoch": 0.17, + "learning_rate": 4.760805231520131e-06, + "loss": 1.0948, + "step": 5516 + }, + { + "epoch": 0.17, + "learning_rate": 4.760701103306711e-06, + "loss": 1.1859, + "step": 5517 + }, + { + "epoch": 0.17, + "learning_rate": 4.760596953572506e-06, + "loss": 1.1523, + "step": 5518 + }, + { + "epoch": 0.17, + "learning_rate": 4.760492782318506e-06, + "loss": 1.222, + "step": 5519 + }, + { + "epoch": 0.17, + "learning_rate": 4.7603885895457046e-06, + "loss": 1.2451, + "step": 5520 + }, + { + "epoch": 0.17, + "learning_rate": 4.760284375255091e-06, + "loss": 1.1495, + "step": 5521 + }, + { + "epoch": 0.17, + "learning_rate": 4.76018013944766e-06, + "loss": 1.1998, + "step": 5522 + }, + { + "epoch": 0.17, + "learning_rate": 4.760075882124402e-06, + "loss": 1.1263, + "step": 5523 + }, + { + "epoch": 0.17, + "learning_rate": 4.7599716032863104e-06, + "loss": 1.1927, + "step": 5524 + }, + { + "epoch": 0.17, + "learning_rate": 4.759867302934377e-06, + "loss": 1.0515, + "step": 5525 + }, + { + "epoch": 0.17, + "learning_rate": 4.759762981069596e-06, + "loss": 1.1926, + "step": 5526 + }, + { + "epoch": 0.17, + "learning_rate": 4.7596586376929595e-06, + "loss": 1.1282, + "step": 5527 + }, + { + "epoch": 0.17, + "learning_rate": 4.759554272805461e-06, + "loss": 1.115, + "step": 5528 + }, + { + "epoch": 0.17, + "learning_rate": 4.759449886408094e-06, + "loss": 1.028, + "step": 5529 + }, + { + "epoch": 0.17, + "learning_rate": 4.759345478501852e-06, + "loss": 1.0951, + "step": 5530 + }, + { + "epoch": 0.17, + "learning_rate": 4.759241049087729e-06, + "loss": 1.1705, + "step": 5531 + }, + { + "epoch": 0.17, + "learning_rate": 4.7591365981667205e-06, + "loss": 1.1973, + "step": 5532 + }, + { + "epoch": 0.17, + "learning_rate": 4.759032125739819e-06, + "loss": 1.1824, + "step": 5533 + }, + { + "epoch": 0.17, + "learning_rate": 4.758927631808019e-06, + "loss": 1.1444, + "step": 5534 + }, + { + "epoch": 0.17, + "learning_rate": 4.758823116372316e-06, + "loss": 1.1345, + "step": 5535 + }, + { + "epoch": 0.17, + "learning_rate": 4.758718579433705e-06, + "loss": 1.2357, + "step": 5536 + }, + { + "epoch": 0.17, + "learning_rate": 4.758614020993182e-06, + "loss": 1.1138, + "step": 5537 + }, + { + "epoch": 0.17, + "learning_rate": 4.758509441051741e-06, + "loss": 1.0947, + "step": 5538 + }, + { + "epoch": 0.17, + "learning_rate": 4.7584048396103765e-06, + "loss": 1.16, + "step": 5539 + }, + { + "epoch": 0.17, + "learning_rate": 4.758300216670087e-06, + "loss": 1.1573, + "step": 5540 + }, + { + "epoch": 0.17, + "learning_rate": 4.758195572231866e-06, + "loss": 1.3029, + "step": 5541 + }, + { + "epoch": 0.17, + "learning_rate": 4.7580909062967115e-06, + "loss": 1.1651, + "step": 5542 + }, + { + "epoch": 0.17, + "learning_rate": 4.757986218865619e-06, + "loss": 1.2864, + "step": 5543 + }, + { + "epoch": 0.17, + "learning_rate": 4.757881509939584e-06, + "loss": 1.1047, + "step": 5544 + }, + { + "epoch": 0.17, + "learning_rate": 4.757776779519607e-06, + "loss": 1.1647, + "step": 5545 + }, + { + "epoch": 0.17, + "learning_rate": 4.757672027606681e-06, + "loss": 1.1021, + "step": 5546 + }, + { + "epoch": 0.17, + "learning_rate": 4.757567254201804e-06, + "loss": 1.1719, + "step": 5547 + }, + { + "epoch": 0.17, + "learning_rate": 4.757462459305975e-06, + "loss": 1.0784, + "step": 5548 + }, + { + "epoch": 0.17, + "learning_rate": 4.75735764292019e-06, + "loss": 1.1243, + "step": 5549 + }, + { + "epoch": 0.17, + "learning_rate": 4.757252805045448e-06, + "loss": 1.2317, + "step": 5550 + }, + { + "epoch": 0.17, + "learning_rate": 4.757147945682746e-06, + "loss": 1.1694, + "step": 5551 + }, + { + "epoch": 0.17, + "learning_rate": 4.757043064833082e-06, + "loss": 1.1854, + "step": 5552 + }, + { + "epoch": 0.17, + "learning_rate": 4.756938162497457e-06, + "loss": 1.1379, + "step": 5553 + }, + { + "epoch": 0.17, + "learning_rate": 4.756833238676865e-06, + "loss": 1.3041, + "step": 5554 + }, + { + "epoch": 0.17, + "learning_rate": 4.75672829337231e-06, + "loss": 1.2023, + "step": 5555 + }, + { + "epoch": 0.17, + "learning_rate": 4.756623326584787e-06, + "loss": 1.2273, + "step": 5556 + }, + { + "epoch": 0.17, + "learning_rate": 4.756518338315297e-06, + "loss": 1.2153, + "step": 5557 + }, + { + "epoch": 0.17, + "learning_rate": 4.75641332856484e-06, + "loss": 1.1773, + "step": 5558 + }, + { + "epoch": 0.17, + "learning_rate": 4.756308297334414e-06, + "loss": 1.0905, + "step": 5559 + }, + { + "epoch": 0.17, + "learning_rate": 4.75620324462502e-06, + "loss": 1.1643, + "step": 5560 + }, + { + "epoch": 0.17, + "learning_rate": 4.756098170437658e-06, + "loss": 1.0793, + "step": 5561 + }, + { + "epoch": 0.17, + "learning_rate": 4.7559930747733275e-06, + "loss": 1.2568, + "step": 5562 + }, + { + "epoch": 0.17, + "learning_rate": 4.75588795763303e-06, + "loss": 1.1686, + "step": 5563 + }, + { + "epoch": 0.17, + "learning_rate": 4.755782819017765e-06, + "loss": 1.1465, + "step": 5564 + }, + { + "epoch": 0.17, + "learning_rate": 4.755677658928534e-06, + "loss": 1.1726, + "step": 5565 + }, + { + "epoch": 0.17, + "learning_rate": 4.755572477366338e-06, + "loss": 1.1271, + "step": 5566 + }, + { + "epoch": 0.17, + "learning_rate": 4.7554672743321785e-06, + "loss": 1.1533, + "step": 5567 + }, + { + "epoch": 0.17, + "learning_rate": 4.755362049827057e-06, + "loss": 1.131, + "step": 5568 + }, + { + "epoch": 0.17, + "learning_rate": 4.7552568038519755e-06, + "loss": 1.1957, + "step": 5569 + }, + { + "epoch": 0.17, + "learning_rate": 4.755151536407935e-06, + "loss": 1.1061, + "step": 5570 + }, + { + "epoch": 0.17, + "learning_rate": 4.755046247495937e-06, + "loss": 1.019, + "step": 5571 + }, + { + "epoch": 0.17, + "learning_rate": 4.754940937116986e-06, + "loss": 1.1337, + "step": 5572 + }, + { + "epoch": 0.17, + "learning_rate": 4.754835605272083e-06, + "loss": 1.1583, + "step": 5573 + }, + { + "epoch": 0.17, + "learning_rate": 4.75473025196223e-06, + "loss": 1.148, + "step": 5574 + }, + { + "epoch": 0.17, + "learning_rate": 4.754624877188433e-06, + "loss": 1.1705, + "step": 5575 + }, + { + "epoch": 0.17, + "learning_rate": 4.754519480951692e-06, + "loss": 1.0773, + "step": 5576 + }, + { + "epoch": 0.17, + "learning_rate": 4.754414063253011e-06, + "loss": 1.2249, + "step": 5577 + }, + { + "epoch": 0.17, + "learning_rate": 4.754308624093393e-06, + "loss": 1.1351, + "step": 5578 + }, + { + "epoch": 0.17, + "learning_rate": 4.7542031634738445e-06, + "loss": 1.261, + "step": 5579 + }, + { + "epoch": 0.17, + "learning_rate": 4.7540976813953665e-06, + "loss": 1.0437, + "step": 5580 + }, + { + "epoch": 0.17, + "learning_rate": 4.753992177858965e-06, + "loss": 1.2554, + "step": 5581 + }, + { + "epoch": 0.17, + "learning_rate": 4.753886652865642e-06, + "loss": 1.1823, + "step": 5582 + }, + { + "epoch": 0.17, + "learning_rate": 4.753781106416406e-06, + "loss": 1.1661, + "step": 5583 + }, + { + "epoch": 0.17, + "learning_rate": 4.753675538512257e-06, + "loss": 1.1055, + "step": 5584 + }, + { + "epoch": 0.17, + "learning_rate": 4.753569949154203e-06, + "loss": 1.0463, + "step": 5585 + }, + { + "epoch": 0.17, + "learning_rate": 4.753464338343249e-06, + "loss": 1.334, + "step": 5586 + }, + { + "epoch": 0.17, + "learning_rate": 4.7533587060803995e-06, + "loss": 1.177, + "step": 5587 + }, + { + "epoch": 0.17, + "learning_rate": 4.75325305236666e-06, + "loss": 1.1965, + "step": 5588 + }, + { + "epoch": 0.17, + "learning_rate": 4.753147377203037e-06, + "loss": 1.2778, + "step": 5589 + }, + { + "epoch": 0.17, + "learning_rate": 4.753041680590536e-06, + "loss": 1.0715, + "step": 5590 + }, + { + "epoch": 0.17, + "learning_rate": 4.752935962530163e-06, + "loss": 1.1509, + "step": 5591 + }, + { + "epoch": 0.17, + "learning_rate": 4.7528302230229255e-06, + "loss": 1.0578, + "step": 5592 + }, + { + "epoch": 0.17, + "learning_rate": 4.752724462069829e-06, + "loss": 1.1758, + "step": 5593 + }, + { + "epoch": 0.17, + "learning_rate": 4.75261867967188e-06, + "loss": 1.101, + "step": 5594 + }, + { + "epoch": 0.17, + "learning_rate": 4.752512875830086e-06, + "loss": 1.2196, + "step": 5595 + }, + { + "epoch": 0.17, + "learning_rate": 4.752407050545455e-06, + "loss": 1.1905, + "step": 5596 + }, + { + "epoch": 0.17, + "learning_rate": 4.752301203818993e-06, + "loss": 1.0438, + "step": 5597 + }, + { + "epoch": 0.17, + "learning_rate": 4.752195335651709e-06, + "loss": 1.0852, + "step": 5598 + }, + { + "epoch": 0.17, + "learning_rate": 4.75208944604461e-06, + "loss": 1.0823, + "step": 5599 + }, + { + "epoch": 0.17, + "learning_rate": 4.7519835349987045e-06, + "loss": 1.1755, + "step": 5600 + }, + { + "epoch": 0.17, + "learning_rate": 4.7518776025149995e-06, + "loss": 1.1517, + "step": 5601 + }, + { + "epoch": 0.17, + "learning_rate": 4.751771648594504e-06, + "loss": 1.1878, + "step": 5602 + }, + { + "epoch": 0.17, + "learning_rate": 4.751665673238227e-06, + "loss": 1.1071, + "step": 5603 + }, + { + "epoch": 0.17, + "learning_rate": 4.7515596764471786e-06, + "loss": 1.26, + "step": 5604 + }, + { + "epoch": 0.17, + "learning_rate": 4.751453658222364e-06, + "loss": 1.1903, + "step": 5605 + }, + { + "epoch": 0.17, + "learning_rate": 4.751347618564798e-06, + "loss": 1.1828, + "step": 5606 + }, + { + "epoch": 0.17, + "learning_rate": 4.751241557475485e-06, + "loss": 1.1083, + "step": 5607 + }, + { + "epoch": 0.17, + "learning_rate": 4.751135474955437e-06, + "loss": 1.2148, + "step": 5608 + }, + { + "epoch": 0.17, + "learning_rate": 4.751029371005663e-06, + "loss": 1.1254, + "step": 5609 + }, + { + "epoch": 0.17, + "learning_rate": 4.750923245627175e-06, + "loss": 1.1856, + "step": 5610 + }, + { + "epoch": 0.17, + "learning_rate": 4.75081709882098e-06, + "loss": 1.2283, + "step": 5611 + }, + { + "epoch": 0.17, + "learning_rate": 4.7507109305880905e-06, + "loss": 1.0801, + "step": 5612 + }, + { + "epoch": 0.17, + "learning_rate": 4.7506047409295176e-06, + "loss": 1.1501, + "step": 5613 + }, + { + "epoch": 0.17, + "learning_rate": 4.750498529846271e-06, + "loss": 1.1226, + "step": 5614 + }, + { + "epoch": 0.17, + "learning_rate": 4.750392297339363e-06, + "loss": 1.1188, + "step": 5615 + }, + { + "epoch": 0.17, + "learning_rate": 4.750286043409803e-06, + "loss": 1.1716, + "step": 5616 + }, + { + "epoch": 0.17, + "learning_rate": 4.750179768058605e-06, + "loss": 1.2239, + "step": 5617 + }, + { + "epoch": 0.17, + "learning_rate": 4.750073471286779e-06, + "loss": 1.2557, + "step": 5618 + }, + { + "epoch": 0.17, + "learning_rate": 4.749967153095337e-06, + "loss": 1.1658, + "step": 5619 + }, + { + "epoch": 0.17, + "learning_rate": 4.749860813485291e-06, + "loss": 1.1968, + "step": 5620 + }, + { + "epoch": 0.17, + "learning_rate": 4.749754452457654e-06, + "loss": 1.0991, + "step": 5621 + }, + { + "epoch": 0.17, + "learning_rate": 4.749648070013438e-06, + "loss": 1.0633, + "step": 5622 + }, + { + "epoch": 0.17, + "learning_rate": 4.749541666153655e-06, + "loss": 1.0375, + "step": 5623 + }, + { + "epoch": 0.17, + "learning_rate": 4.749435240879321e-06, + "loss": 1.2314, + "step": 5624 + }, + { + "epoch": 0.17, + "learning_rate": 4.749328794191444e-06, + "loss": 1.2667, + "step": 5625 + }, + { + "epoch": 0.17, + "learning_rate": 4.7492223260910426e-06, + "loss": 1.2006, + "step": 5626 + }, + { + "epoch": 0.17, + "learning_rate": 4.749115836579127e-06, + "loss": 1.0361, + "step": 5627 + }, + { + "epoch": 0.17, + "learning_rate": 4.749009325656712e-06, + "loss": 1.0674, + "step": 5628 + }, + { + "epoch": 0.17, + "learning_rate": 4.748902793324811e-06, + "loss": 1.2126, + "step": 5629 + }, + { + "epoch": 0.17, + "learning_rate": 4.748796239584438e-06, + "loss": 1.2399, + "step": 5630 + }, + { + "epoch": 0.17, + "learning_rate": 4.748689664436609e-06, + "loss": 1.2193, + "step": 5631 + }, + { + "epoch": 0.17, + "learning_rate": 4.748583067882337e-06, + "loss": 1.1544, + "step": 5632 + }, + { + "epoch": 0.17, + "learning_rate": 4.748476449922637e-06, + "loss": 1.1277, + "step": 5633 + }, + { + "epoch": 0.17, + "learning_rate": 4.748369810558524e-06, + "loss": 1.0797, + "step": 5634 + }, + { + "epoch": 0.17, + "learning_rate": 4.7482631497910135e-06, + "loss": 1.1199, + "step": 5635 + }, + { + "epoch": 0.17, + "learning_rate": 4.748156467621121e-06, + "loss": 1.1504, + "step": 5636 + }, + { + "epoch": 0.17, + "learning_rate": 4.748049764049861e-06, + "loss": 1.2773, + "step": 5637 + }, + { + "epoch": 0.17, + "learning_rate": 4.7479430390782504e-06, + "loss": 1.0963, + "step": 5638 + }, + { + "epoch": 0.17, + "learning_rate": 4.747836292707304e-06, + "loss": 1.1708, + "step": 5639 + }, + { + "epoch": 0.17, + "learning_rate": 4.74772952493804e-06, + "loss": 1.1245, + "step": 5640 + }, + { + "epoch": 0.17, + "learning_rate": 4.747622735771473e-06, + "loss": 1.1228, + "step": 5641 + }, + { + "epoch": 0.17, + "learning_rate": 4.747515925208619e-06, + "loss": 1.2231, + "step": 5642 + }, + { + "epoch": 0.17, + "learning_rate": 4.747409093250497e-06, + "loss": 1.0825, + "step": 5643 + }, + { + "epoch": 0.17, + "learning_rate": 4.747302239898122e-06, + "loss": 1.2039, + "step": 5644 + }, + { + "epoch": 0.17, + "learning_rate": 4.747195365152513e-06, + "loss": 1.1577, + "step": 5645 + }, + { + "epoch": 0.17, + "learning_rate": 4.747088469014685e-06, + "loss": 1.1284, + "step": 5646 + }, + { + "epoch": 0.17, + "learning_rate": 4.746981551485659e-06, + "loss": 1.1266, + "step": 5647 + }, + { + "epoch": 0.17, + "learning_rate": 4.746874612566449e-06, + "loss": 1.2972, + "step": 5648 + }, + { + "epoch": 0.17, + "learning_rate": 4.746767652258075e-06, + "loss": 1.173, + "step": 5649 + }, + { + "epoch": 0.17, + "learning_rate": 4.746660670561556e-06, + "loss": 1.1385, + "step": 5650 + }, + { + "epoch": 0.17, + "learning_rate": 4.746553667477909e-06, + "loss": 1.0917, + "step": 5651 + }, + { + "epoch": 0.17, + "learning_rate": 4.746446643008153e-06, + "loss": 1.1332, + "step": 5652 + }, + { + "epoch": 0.17, + "learning_rate": 4.746339597153306e-06, + "loss": 1.0562, + "step": 5653 + }, + { + "epoch": 0.17, + "learning_rate": 4.74623252991439e-06, + "loss": 1.1658, + "step": 5654 + }, + { + "epoch": 0.17, + "learning_rate": 4.746125441292421e-06, + "loss": 1.0948, + "step": 5655 + }, + { + "epoch": 0.17, + "learning_rate": 4.746018331288419e-06, + "loss": 1.2433, + "step": 5656 + }, + { + "epoch": 0.17, + "learning_rate": 4.745911199903405e-06, + "loss": 1.1439, + "step": 5657 + }, + { + "epoch": 0.17, + "learning_rate": 4.745804047138398e-06, + "loss": 1.1919, + "step": 5658 + }, + { + "epoch": 0.17, + "learning_rate": 4.745696872994417e-06, + "loss": 1.0989, + "step": 5659 + }, + { + "epoch": 0.17, + "learning_rate": 4.745589677472485e-06, + "loss": 1.1573, + "step": 5660 + }, + { + "epoch": 0.17, + "learning_rate": 4.745482460573619e-06, + "loss": 1.0975, + "step": 5661 + }, + { + "epoch": 0.17, + "learning_rate": 4.745375222298843e-06, + "loss": 1.1874, + "step": 5662 + }, + { + "epoch": 0.17, + "learning_rate": 4.745267962649176e-06, + "loss": 1.2371, + "step": 5663 + }, + { + "epoch": 0.17, + "learning_rate": 4.745160681625639e-06, + "loss": 1.2135, + "step": 5664 + }, + { + "epoch": 0.17, + "learning_rate": 4.745053379229253e-06, + "loss": 1.0303, + "step": 5665 + }, + { + "epoch": 0.17, + "learning_rate": 4.744946055461041e-06, + "loss": 1.1893, + "step": 5666 + }, + { + "epoch": 0.17, + "learning_rate": 4.744838710322024e-06, + "loss": 1.1832, + "step": 5667 + }, + { + "epoch": 0.17, + "learning_rate": 4.744731343813222e-06, + "loss": 1.134, + "step": 5668 + }, + { + "epoch": 0.17, + "learning_rate": 4.744623955935661e-06, + "loss": 1.1515, + "step": 5669 + }, + { + "epoch": 0.17, + "learning_rate": 4.7445165466903595e-06, + "loss": 1.0977, + "step": 5670 + }, + { + "epoch": 0.17, + "learning_rate": 4.7444091160783415e-06, + "loss": 1.1093, + "step": 5671 + }, + { + "epoch": 0.17, + "learning_rate": 4.74430166410063e-06, + "loss": 1.1086, + "step": 5672 + }, + { + "epoch": 0.17, + "learning_rate": 4.7441941907582475e-06, + "loss": 1.113, + "step": 5673 + }, + { + "epoch": 0.17, + "learning_rate": 4.744086696052217e-06, + "loss": 1.1486, + "step": 5674 + }, + { + "epoch": 0.17, + "learning_rate": 4.7439791799835626e-06, + "loss": 1.1107, + "step": 5675 + }, + { + "epoch": 0.17, + "learning_rate": 4.743871642553306e-06, + "loss": 1.1326, + "step": 5676 + }, + { + "epoch": 0.17, + "learning_rate": 4.743764083762473e-06, + "loss": 1.186, + "step": 5677 + }, + { + "epoch": 0.17, + "learning_rate": 4.743656503612087e-06, + "loss": 1.1031, + "step": 5678 + }, + { + "epoch": 0.17, + "learning_rate": 4.74354890210317e-06, + "loss": 1.1702, + "step": 5679 + }, + { + "epoch": 0.17, + "learning_rate": 4.743441279236749e-06, + "loss": 1.2367, + "step": 5680 + }, + { + "epoch": 0.17, + "learning_rate": 4.743333635013847e-06, + "loss": 1.1442, + "step": 5681 + }, + { + "epoch": 0.17, + "learning_rate": 4.7432259694354895e-06, + "loss": 1.0792, + "step": 5682 + }, + { + "epoch": 0.17, + "learning_rate": 4.743118282502703e-06, + "loss": 1.2863, + "step": 5683 + }, + { + "epoch": 0.17, + "learning_rate": 4.743010574216508e-06, + "loss": 1.0743, + "step": 5684 + }, + { + "epoch": 0.17, + "learning_rate": 4.742902844577934e-06, + "loss": 1.2258, + "step": 5685 + }, + { + "epoch": 0.17, + "learning_rate": 4.742795093588004e-06, + "loss": 1.1952, + "step": 5686 + }, + { + "epoch": 0.17, + "learning_rate": 4.742687321247746e-06, + "loss": 1.1269, + "step": 5687 + }, + { + "epoch": 0.17, + "learning_rate": 4.742579527558185e-06, + "loss": 1.1504, + "step": 5688 + }, + { + "epoch": 0.17, + "learning_rate": 4.742471712520346e-06, + "loss": 1.1103, + "step": 5689 + }, + { + "epoch": 0.17, + "learning_rate": 4.742363876135256e-06, + "loss": 1.062, + "step": 5690 + }, + { + "epoch": 0.17, + "learning_rate": 4.742256018403943e-06, + "loss": 1.2657, + "step": 5691 + }, + { + "epoch": 0.17, + "learning_rate": 4.7421481393274326e-06, + "loss": 1.1396, + "step": 5692 + }, + { + "epoch": 0.17, + "learning_rate": 4.742040238906751e-06, + "loss": 1.1133, + "step": 5693 + }, + { + "epoch": 0.17, + "learning_rate": 4.741932317142926e-06, + "loss": 1.1678, + "step": 5694 + }, + { + "epoch": 0.17, + "learning_rate": 4.741824374036986e-06, + "loss": 1.1683, + "step": 5695 + }, + { + "epoch": 0.17, + "learning_rate": 4.741716409589958e-06, + "loss": 1.1197, + "step": 5696 + }, + { + "epoch": 0.17, + "learning_rate": 4.741608423802868e-06, + "loss": 1.1317, + "step": 5697 + }, + { + "epoch": 0.17, + "learning_rate": 4.741500416676746e-06, + "loss": 1.1918, + "step": 5698 + }, + { + "epoch": 0.17, + "learning_rate": 4.74139238821262e-06, + "loss": 1.2187, + "step": 5699 + }, + { + "epoch": 0.17, + "learning_rate": 4.741284338411518e-06, + "loss": 1.2037, + "step": 5700 + }, + { + "epoch": 0.17, + "learning_rate": 4.7411762672744675e-06, + "loss": 1.1311, + "step": 5701 + }, + { + "epoch": 0.17, + "learning_rate": 4.7410681748024995e-06, + "loss": 1.1329, + "step": 5702 + }, + { + "epoch": 0.17, + "learning_rate": 4.740960060996641e-06, + "loss": 1.0681, + "step": 5703 + }, + { + "epoch": 0.17, + "learning_rate": 4.740851925857922e-06, + "loss": 1.213, + "step": 5704 + }, + { + "epoch": 0.17, + "learning_rate": 4.740743769387373e-06, + "loss": 1.1732, + "step": 5705 + }, + { + "epoch": 0.17, + "learning_rate": 4.7406355915860215e-06, + "loss": 1.2332, + "step": 5706 + }, + { + "epoch": 0.17, + "learning_rate": 4.740527392454898e-06, + "loss": 1.1642, + "step": 5707 + }, + { + "epoch": 0.17, + "learning_rate": 4.740419171995033e-06, + "loss": 1.2925, + "step": 5708 + }, + { + "epoch": 0.17, + "learning_rate": 4.740310930207458e-06, + "loss": 1.1591, + "step": 5709 + }, + { + "epoch": 0.17, + "learning_rate": 4.7402026670932e-06, + "loss": 1.1331, + "step": 5710 + }, + { + "epoch": 0.17, + "learning_rate": 4.740094382653292e-06, + "loss": 1.0693, + "step": 5711 + }, + { + "epoch": 0.17, + "learning_rate": 4.739986076888765e-06, + "loss": 1.2311, + "step": 5712 + }, + { + "epoch": 0.17, + "learning_rate": 4.739877749800648e-06, + "loss": 1.2762, + "step": 5713 + }, + { + "epoch": 0.17, + "learning_rate": 4.739769401389975e-06, + "loss": 1.1754, + "step": 5714 + }, + { + "epoch": 0.17, + "learning_rate": 4.7396610316577765e-06, + "loss": 1.0999, + "step": 5715 + }, + { + "epoch": 0.17, + "learning_rate": 4.739552640605082e-06, + "loss": 1.1145, + "step": 5716 + }, + { + "epoch": 0.17, + "learning_rate": 4.739444228232925e-06, + "loss": 1.1238, + "step": 5717 + }, + { + "epoch": 0.17, + "learning_rate": 4.739335794542339e-06, + "loss": 1.165, + "step": 5718 + }, + { + "epoch": 0.17, + "learning_rate": 4.739227339534354e-06, + "loss": 1.2449, + "step": 5719 + }, + { + "epoch": 0.17, + "learning_rate": 4.739118863210003e-06, + "loss": 1.1027, + "step": 5720 + }, + { + "epoch": 0.17, + "learning_rate": 4.739010365570318e-06, + "loss": 1.1255, + "step": 5721 + }, + { + "epoch": 0.17, + "learning_rate": 4.738901846616334e-06, + "loss": 1.0936, + "step": 5722 + }, + { + "epoch": 0.17, + "learning_rate": 4.738793306349082e-06, + "loss": 1.1193, + "step": 5723 + }, + { + "epoch": 0.17, + "learning_rate": 4.738684744769597e-06, + "loss": 1.0358, + "step": 5724 + }, + { + "epoch": 0.17, + "learning_rate": 4.73857616187891e-06, + "loss": 1.1431, + "step": 5725 + }, + { + "epoch": 0.17, + "learning_rate": 4.738467557678057e-06, + "loss": 1.1904, + "step": 5726 + }, + { + "epoch": 0.17, + "learning_rate": 4.738358932168071e-06, + "loss": 1.146, + "step": 5727 + }, + { + "epoch": 0.17, + "learning_rate": 4.738250285349985e-06, + "loss": 1.2111, + "step": 5728 + }, + { + "epoch": 0.17, + "learning_rate": 4.738141617224835e-06, + "loss": 1.1447, + "step": 5729 + }, + { + "epoch": 0.17, + "learning_rate": 4.7380329277936545e-06, + "loss": 1.1174, + "step": 5730 + }, + { + "epoch": 0.17, + "learning_rate": 4.737924217057479e-06, + "loss": 1.261, + "step": 5731 + }, + { + "epoch": 0.17, + "learning_rate": 4.737815485017342e-06, + "loss": 1.1846, + "step": 5732 + }, + { + "epoch": 0.17, + "learning_rate": 4.73770673167428e-06, + "loss": 1.1707, + "step": 5733 + }, + { + "epoch": 0.17, + "learning_rate": 4.737597957029327e-06, + "loss": 1.1704, + "step": 5734 + }, + { + "epoch": 0.17, + "learning_rate": 4.737489161083519e-06, + "loss": 1.1062, + "step": 5735 + }, + { + "epoch": 0.17, + "learning_rate": 4.737380343837893e-06, + "loss": 1.1597, + "step": 5736 + }, + { + "epoch": 0.17, + "learning_rate": 4.737271505293482e-06, + "loss": 1.1838, + "step": 5737 + }, + { + "epoch": 0.17, + "learning_rate": 4.7371626454513255e-06, + "loss": 1.1434, + "step": 5738 + }, + { + "epoch": 0.17, + "learning_rate": 4.737053764312457e-06, + "loss": 1.25, + "step": 5739 + }, + { + "epoch": 0.17, + "learning_rate": 4.736944861877914e-06, + "loss": 1.1146, + "step": 5740 + }, + { + "epoch": 0.17, + "learning_rate": 4.736835938148734e-06, + "loss": 1.202, + "step": 5741 + }, + { + "epoch": 0.17, + "learning_rate": 4.736726993125953e-06, + "loss": 1.2382, + "step": 5742 + }, + { + "epoch": 0.17, + "learning_rate": 4.736618026810608e-06, + "loss": 1.1831, + "step": 5743 + }, + { + "epoch": 0.17, + "learning_rate": 4.736509039203736e-06, + "loss": 1.0616, + "step": 5744 + }, + { + "epoch": 0.17, + "learning_rate": 4.736400030306376e-06, + "loss": 1.1375, + "step": 5745 + }, + { + "epoch": 0.17, + "learning_rate": 4.736291000119564e-06, + "loss": 1.241, + "step": 5746 + }, + { + "epoch": 0.17, + "learning_rate": 4.7361819486443395e-06, + "loss": 0.999, + "step": 5747 + }, + { + "epoch": 0.17, + "learning_rate": 4.736072875881739e-06, + "loss": 1.087, + "step": 5748 + }, + { + "epoch": 0.17, + "learning_rate": 4.735963781832802e-06, + "loss": 1.2711, + "step": 5749 + }, + { + "epoch": 0.17, + "learning_rate": 4.735854666498567e-06, + "loss": 1.2129, + "step": 5750 + }, + { + "epoch": 0.17, + "learning_rate": 4.735745529880073e-06, + "loss": 1.1536, + "step": 5751 + }, + { + "epoch": 0.17, + "learning_rate": 4.735636371978357e-06, + "loss": 1.0687, + "step": 5752 + }, + { + "epoch": 0.17, + "learning_rate": 4.73552719279446e-06, + "loss": 1.0732, + "step": 5753 + }, + { + "epoch": 0.17, + "learning_rate": 4.735417992329421e-06, + "loss": 1.2078, + "step": 5754 + }, + { + "epoch": 0.17, + "learning_rate": 4.735308770584279e-06, + "loss": 1.1682, + "step": 5755 + }, + { + "epoch": 0.17, + "learning_rate": 4.735199527560074e-06, + "loss": 1.0764, + "step": 5756 + }, + { + "epoch": 0.17, + "learning_rate": 4.735090263257847e-06, + "loss": 1.1951, + "step": 5757 + }, + { + "epoch": 0.17, + "learning_rate": 4.7349809776786355e-06, + "loss": 1.2082, + "step": 5758 + }, + { + "epoch": 0.17, + "learning_rate": 4.734871670823482e-06, + "loss": 1.1208, + "step": 5759 + }, + { + "epoch": 0.17, + "learning_rate": 4.734762342693428e-06, + "loss": 1.1242, + "step": 5760 + }, + { + "epoch": 0.17, + "learning_rate": 4.734652993289511e-06, + "loss": 1.1287, + "step": 5761 + }, + { + "epoch": 0.17, + "learning_rate": 4.734543622612774e-06, + "loss": 1.3248, + "step": 5762 + }, + { + "epoch": 0.17, + "learning_rate": 4.734434230664259e-06, + "loss": 1.1852, + "step": 5763 + }, + { + "epoch": 0.17, + "learning_rate": 4.734324817445005e-06, + "loss": 1.1759, + "step": 5764 + }, + { + "epoch": 0.17, + "learning_rate": 4.734215382956056e-06, + "loss": 1.1897, + "step": 5765 + }, + { + "epoch": 0.17, + "learning_rate": 4.7341059271984515e-06, + "loss": 1.1834, + "step": 5766 + }, + { + "epoch": 0.17, + "learning_rate": 4.733996450173235e-06, + "loss": 1.1854, + "step": 5767 + }, + { + "epoch": 0.17, + "learning_rate": 4.733886951881449e-06, + "loss": 1.1725, + "step": 5768 + }, + { + "epoch": 0.17, + "learning_rate": 4.733777432324134e-06, + "loss": 1.1677, + "step": 5769 + }, + { + "epoch": 0.17, + "learning_rate": 4.7336678915023335e-06, + "loss": 1.1814, + "step": 5770 + }, + { + "epoch": 0.17, + "learning_rate": 4.7335583294170915e-06, + "loss": 1.1287, + "step": 5771 + }, + { + "epoch": 0.17, + "learning_rate": 4.73344874606945e-06, + "loss": 1.1235, + "step": 5772 + }, + { + "epoch": 0.17, + "learning_rate": 4.733339141460451e-06, + "loss": 1.1462, + "step": 5773 + }, + { + "epoch": 0.17, + "learning_rate": 4.7332295155911395e-06, + "loss": 1.1841, + "step": 5774 + }, + { + "epoch": 0.17, + "learning_rate": 4.733119868462559e-06, + "loss": 1.1931, + "step": 5775 + }, + { + "epoch": 0.17, + "learning_rate": 4.733010200075752e-06, + "loss": 1.0857, + "step": 5776 + }, + { + "epoch": 0.17, + "learning_rate": 4.732900510431764e-06, + "loss": 1.0972, + "step": 5777 + }, + { + "epoch": 0.17, + "learning_rate": 4.732790799531638e-06, + "loss": 1.1199, + "step": 5778 + }, + { + "epoch": 0.17, + "learning_rate": 4.732681067376419e-06, + "loss": 1.1638, + "step": 5779 + }, + { + "epoch": 0.17, + "learning_rate": 4.732571313967152e-06, + "loss": 1.1811, + "step": 5780 + }, + { + "epoch": 0.17, + "learning_rate": 4.732461539304881e-06, + "loss": 1.3009, + "step": 5781 + }, + { + "epoch": 0.17, + "learning_rate": 4.732351743390652e-06, + "loss": 1.0652, + "step": 5782 + }, + { + "epoch": 0.17, + "learning_rate": 4.732241926225509e-06, + "loss": 1.0646, + "step": 5783 + }, + { + "epoch": 0.17, + "learning_rate": 4.732132087810498e-06, + "loss": 1.2261, + "step": 5784 + }, + { + "epoch": 0.17, + "learning_rate": 4.732022228146664e-06, + "loss": 1.1785, + "step": 5785 + }, + { + "epoch": 0.17, + "learning_rate": 4.7319123472350546e-06, + "loss": 1.1472, + "step": 5786 + }, + { + "epoch": 0.17, + "learning_rate": 4.731802445076714e-06, + "loss": 1.0569, + "step": 5787 + }, + { + "epoch": 0.17, + "learning_rate": 4.731692521672688e-06, + "loss": 1.1716, + "step": 5788 + }, + { + "epoch": 0.17, + "learning_rate": 4.731582577024026e-06, + "loss": 1.2284, + "step": 5789 + }, + { + "epoch": 0.17, + "learning_rate": 4.7314726111317714e-06, + "loss": 1.0691, + "step": 5790 + }, + { + "epoch": 0.17, + "learning_rate": 4.731362623996972e-06, + "loss": 1.2162, + "step": 5791 + }, + { + "epoch": 0.17, + "learning_rate": 4.731252615620675e-06, + "loss": 1.3097, + "step": 5792 + }, + { + "epoch": 0.17, + "learning_rate": 4.731142586003928e-06, + "loss": 1.1086, + "step": 5793 + }, + { + "epoch": 0.17, + "learning_rate": 4.731032535147779e-06, + "loss": 1.0952, + "step": 5794 + }, + { + "epoch": 0.17, + "learning_rate": 4.730922463053274e-06, + "loss": 1.037, + "step": 5795 + }, + { + "epoch": 0.17, + "learning_rate": 4.730812369721461e-06, + "loss": 1.1378, + "step": 5796 + }, + { + "epoch": 0.17, + "learning_rate": 4.73070225515339e-06, + "loss": 1.2426, + "step": 5797 + }, + { + "epoch": 0.17, + "learning_rate": 4.730592119350107e-06, + "loss": 1.0581, + "step": 5798 + }, + { + "epoch": 0.17, + "learning_rate": 4.730481962312662e-06, + "loss": 1.1022, + "step": 5799 + }, + { + "epoch": 0.17, + "learning_rate": 4.730371784042102e-06, + "loss": 1.069, + "step": 5800 + }, + { + "epoch": 0.17, + "learning_rate": 4.730261584539478e-06, + "loss": 1.1367, + "step": 5801 + }, + { + "epoch": 0.17, + "learning_rate": 4.730151363805836e-06, + "loss": 1.1285, + "step": 5802 + }, + { + "epoch": 0.17, + "learning_rate": 4.730041121842229e-06, + "loss": 1.0363, + "step": 5803 + }, + { + "epoch": 0.17, + "learning_rate": 4.729930858649703e-06, + "loss": 1.2523, + "step": 5804 + }, + { + "epoch": 0.17, + "learning_rate": 4.72982057422931e-06, + "loss": 1.1599, + "step": 5805 + }, + { + "epoch": 0.17, + "learning_rate": 4.7297102685821e-06, + "loss": 1.1196, + "step": 5806 + }, + { + "epoch": 0.17, + "learning_rate": 4.72959994170912e-06, + "loss": 1.095, + "step": 5807 + }, + { + "epoch": 0.17, + "learning_rate": 4.729489593611424e-06, + "loss": 1.1554, + "step": 5808 + }, + { + "epoch": 0.17, + "learning_rate": 4.7293792242900605e-06, + "loss": 1.1395, + "step": 5809 + }, + { + "epoch": 0.18, + "learning_rate": 4.72926883374608e-06, + "loss": 1.2498, + "step": 5810 + }, + { + "epoch": 0.18, + "learning_rate": 4.729158421980534e-06, + "loss": 1.1956, + "step": 5811 + }, + { + "epoch": 0.18, + "learning_rate": 4.729047988994473e-06, + "loss": 1.0873, + "step": 5812 + }, + { + "epoch": 0.18, + "learning_rate": 4.72893753478895e-06, + "loss": 1.1592, + "step": 5813 + }, + { + "epoch": 0.18, + "learning_rate": 4.728827059365014e-06, + "loss": 1.1088, + "step": 5814 + }, + { + "epoch": 0.18, + "learning_rate": 4.728716562723718e-06, + "loss": 1.0882, + "step": 5815 + }, + { + "epoch": 0.18, + "learning_rate": 4.728606044866114e-06, + "loss": 1.0612, + "step": 5816 + }, + { + "epoch": 0.18, + "learning_rate": 4.728495505793254e-06, + "loss": 1.2762, + "step": 5817 + }, + { + "epoch": 0.18, + "learning_rate": 4.72838494550619e-06, + "loss": 1.1875, + "step": 5818 + }, + { + "epoch": 0.18, + "learning_rate": 4.728274364005974e-06, + "loss": 1.2311, + "step": 5819 + }, + { + "epoch": 0.18, + "learning_rate": 4.72816376129366e-06, + "loss": 1.1604, + "step": 5820 + }, + { + "epoch": 0.18, + "learning_rate": 4.7280531373703e-06, + "loss": 1.0126, + "step": 5821 + }, + { + "epoch": 0.18, + "learning_rate": 4.727942492236947e-06, + "loss": 1.0026, + "step": 5822 + }, + { + "epoch": 0.18, + "learning_rate": 4.7278318258946536e-06, + "loss": 1.1952, + "step": 5823 + }, + { + "epoch": 0.18, + "learning_rate": 4.7277211383444755e-06, + "loss": 1.0819, + "step": 5824 + }, + { + "epoch": 0.18, + "learning_rate": 4.727610429587464e-06, + "loss": 1.1707, + "step": 5825 + }, + { + "epoch": 0.18, + "learning_rate": 4.727499699624675e-06, + "loss": 1.1978, + "step": 5826 + }, + { + "epoch": 0.18, + "learning_rate": 4.7273889484571614e-06, + "loss": 1.1458, + "step": 5827 + }, + { + "epoch": 0.18, + "learning_rate": 4.727278176085977e-06, + "loss": 1.1665, + "step": 5828 + }, + { + "epoch": 0.18, + "learning_rate": 4.727167382512178e-06, + "loss": 1.1516, + "step": 5829 + }, + { + "epoch": 0.18, + "learning_rate": 4.7270565677368176e-06, + "loss": 1.1589, + "step": 5830 + }, + { + "epoch": 0.18, + "learning_rate": 4.726945731760951e-06, + "loss": 1.2101, + "step": 5831 + }, + { + "epoch": 0.18, + "learning_rate": 4.726834874585635e-06, + "loss": 1.2144, + "step": 5832 + }, + { + "epoch": 0.18, + "learning_rate": 4.726723996211922e-06, + "loss": 1.2242, + "step": 5833 + }, + { + "epoch": 0.18, + "learning_rate": 4.72661309664087e-06, + "loss": 1.0941, + "step": 5834 + }, + { + "epoch": 0.18, + "learning_rate": 4.726502175873533e-06, + "loss": 1.1106, + "step": 5835 + }, + { + "epoch": 0.18, + "learning_rate": 4.726391233910967e-06, + "loss": 1.1439, + "step": 5836 + }, + { + "epoch": 0.18, + "learning_rate": 4.72628027075423e-06, + "loss": 1.2582, + "step": 5837 + }, + { + "epoch": 0.18, + "learning_rate": 4.726169286404376e-06, + "loss": 1.2261, + "step": 5838 + }, + { + "epoch": 0.18, + "learning_rate": 4.726058280862464e-06, + "loss": 1.126, + "step": 5839 + }, + { + "epoch": 0.18, + "learning_rate": 4.725947254129548e-06, + "loss": 1.1648, + "step": 5840 + }, + { + "epoch": 0.18, + "learning_rate": 4.725836206206686e-06, + "loss": 1.1178, + "step": 5841 + }, + { + "epoch": 0.18, + "learning_rate": 4.725725137094937e-06, + "loss": 1.1511, + "step": 5842 + }, + { + "epoch": 0.18, + "learning_rate": 4.725614046795355e-06, + "loss": 1.194, + "step": 5843 + }, + { + "epoch": 0.18, + "learning_rate": 4.725502935309e-06, + "loss": 1.0922, + "step": 5844 + }, + { + "epoch": 0.18, + "learning_rate": 4.725391802636928e-06, + "loss": 1.2018, + "step": 5845 + }, + { + "epoch": 0.18, + "learning_rate": 4.725280648780199e-06, + "loss": 1.1652, + "step": 5846 + }, + { + "epoch": 0.18, + "learning_rate": 4.7251694737398695e-06, + "loss": 1.2025, + "step": 5847 + }, + { + "epoch": 0.18, + "learning_rate": 4.7250582775169985e-06, + "loss": 1.2555, + "step": 5848 + }, + { + "epoch": 0.18, + "learning_rate": 4.724947060112644e-06, + "loss": 1.1037, + "step": 5849 + }, + { + "epoch": 0.18, + "learning_rate": 4.7248358215278645e-06, + "loss": 1.1866, + "step": 5850 + }, + { + "epoch": 0.18, + "learning_rate": 4.724724561763721e-06, + "loss": 1.1566, + "step": 5851 + }, + { + "epoch": 0.18, + "learning_rate": 4.72461328082127e-06, + "loss": 1.0645, + "step": 5852 + }, + { + "epoch": 0.18, + "learning_rate": 4.7245019787015716e-06, + "loss": 1.1954, + "step": 5853 + }, + { + "epoch": 0.18, + "learning_rate": 4.724390655405686e-06, + "loss": 1.1046, + "step": 5854 + }, + { + "epoch": 0.18, + "learning_rate": 4.724279310934673e-06, + "loss": 1.1263, + "step": 5855 + }, + { + "epoch": 0.18, + "learning_rate": 4.724167945289593e-06, + "loss": 1.1925, + "step": 5856 + }, + { + "epoch": 0.18, + "learning_rate": 4.724056558471504e-06, + "loss": 1.1782, + "step": 5857 + }, + { + "epoch": 0.18, + "learning_rate": 4.723945150481468e-06, + "loss": 1.2637, + "step": 5858 + }, + { + "epoch": 0.18, + "learning_rate": 4.7238337213205455e-06, + "loss": 1.0854, + "step": 5859 + }, + { + "epoch": 0.18, + "learning_rate": 4.723722270989797e-06, + "loss": 1.1824, + "step": 5860 + }, + { + "epoch": 0.18, + "learning_rate": 4.723610799490284e-06, + "loss": 1.2516, + "step": 5861 + }, + { + "epoch": 0.18, + "learning_rate": 4.723499306823066e-06, + "loss": 1.1423, + "step": 5862 + }, + { + "epoch": 0.18, + "learning_rate": 4.723387792989206e-06, + "loss": 1.2233, + "step": 5863 + }, + { + "epoch": 0.18, + "learning_rate": 4.723276257989765e-06, + "loss": 1.2269, + "step": 5864 + }, + { + "epoch": 0.18, + "learning_rate": 4.723164701825805e-06, + "loss": 1.1316, + "step": 5865 + }, + { + "epoch": 0.18, + "learning_rate": 4.723053124498388e-06, + "loss": 0.9932, + "step": 5866 + }, + { + "epoch": 0.18, + "learning_rate": 4.7229415260085756e-06, + "loss": 1.1011, + "step": 5867 + }, + { + "epoch": 0.18, + "learning_rate": 4.72282990635743e-06, + "loss": 1.2937, + "step": 5868 + }, + { + "epoch": 0.18, + "learning_rate": 4.722718265546015e-06, + "loss": 1.1452, + "step": 5869 + }, + { + "epoch": 0.18, + "learning_rate": 4.722606603575392e-06, + "loss": 1.1683, + "step": 5870 + }, + { + "epoch": 0.18, + "learning_rate": 4.722494920446625e-06, + "loss": 1.1415, + "step": 5871 + }, + { + "epoch": 0.18, + "learning_rate": 4.722383216160776e-06, + "loss": 1.2638, + "step": 5872 + }, + { + "epoch": 0.18, + "learning_rate": 4.72227149071891e-06, + "loss": 1.2326, + "step": 5873 + }, + { + "epoch": 0.18, + "learning_rate": 4.722159744122089e-06, + "loss": 1.2415, + "step": 5874 + }, + { + "epoch": 0.18, + "learning_rate": 4.722047976371378e-06, + "loss": 1.0273, + "step": 5875 + }, + { + "epoch": 0.18, + "learning_rate": 4.721936187467841e-06, + "loss": 1.1956, + "step": 5876 + }, + { + "epoch": 0.18, + "learning_rate": 4.721824377412541e-06, + "loss": 1.142, + "step": 5877 + }, + { + "epoch": 0.18, + "learning_rate": 4.721712546206543e-06, + "loss": 1.1826, + "step": 5878 + }, + { + "epoch": 0.18, + "learning_rate": 4.72160069385091e-06, + "loss": 1.1519, + "step": 5879 + }, + { + "epoch": 0.18, + "learning_rate": 4.72148882034671e-06, + "loss": 1.2303, + "step": 5880 + }, + { + "epoch": 0.18, + "learning_rate": 4.721376925695007e-06, + "loss": 1.1583, + "step": 5881 + }, + { + "epoch": 0.18, + "learning_rate": 4.721265009896865e-06, + "loss": 1.1541, + "step": 5882 + }, + { + "epoch": 0.18, + "learning_rate": 4.72115307295335e-06, + "loss": 1.1366, + "step": 5883 + }, + { + "epoch": 0.18, + "learning_rate": 4.721041114865526e-06, + "loss": 1.0782, + "step": 5884 + }, + { + "epoch": 0.18, + "learning_rate": 4.720929135634462e-06, + "loss": 1.1221, + "step": 5885 + }, + { + "epoch": 0.18, + "learning_rate": 4.7208171352612205e-06, + "loss": 1.2039, + "step": 5886 + }, + { + "epoch": 0.18, + "learning_rate": 4.720705113746871e-06, + "loss": 1.1702, + "step": 5887 + }, + { + "epoch": 0.18, + "learning_rate": 4.720593071092478e-06, + "loss": 1.1021, + "step": 5888 + }, + { + "epoch": 0.18, + "learning_rate": 4.720481007299109e-06, + "loss": 1.1957, + "step": 5889 + }, + { + "epoch": 0.18, + "learning_rate": 4.7203689223678294e-06, + "loss": 1.1887, + "step": 5890 + }, + { + "epoch": 0.18, + "learning_rate": 4.720256816299707e-06, + "loss": 1.115, + "step": 5891 + }, + { + "epoch": 0.18, + "learning_rate": 4.720144689095809e-06, + "loss": 1.0497, + "step": 5892 + }, + { + "epoch": 0.18, + "learning_rate": 4.720032540757203e-06, + "loss": 1.1153, + "step": 5893 + }, + { + "epoch": 0.18, + "learning_rate": 4.719920371284957e-06, + "loss": 1.1725, + "step": 5894 + }, + { + "epoch": 0.18, + "learning_rate": 4.7198081806801375e-06, + "loss": 1.1414, + "step": 5895 + }, + { + "epoch": 0.18, + "learning_rate": 4.719695968943813e-06, + "loss": 1.1683, + "step": 5896 + }, + { + "epoch": 0.18, + "learning_rate": 4.719583736077053e-06, + "loss": 1.1725, + "step": 5897 + }, + { + "epoch": 0.18, + "learning_rate": 4.719471482080924e-06, + "loss": 1.2302, + "step": 5898 + }, + { + "epoch": 0.18, + "learning_rate": 4.7193592069564956e-06, + "loss": 1.2582, + "step": 5899 + }, + { + "epoch": 0.18, + "learning_rate": 4.719246910704836e-06, + "loss": 1.3387, + "step": 5900 + }, + { + "epoch": 0.18, + "learning_rate": 4.719134593327015e-06, + "loss": 1.1791, + "step": 5901 + }, + { + "epoch": 0.18, + "learning_rate": 4.719022254824102e-06, + "loss": 1.0442, + "step": 5902 + }, + { + "epoch": 0.18, + "learning_rate": 4.7189098951971645e-06, + "loss": 1.1228, + "step": 5903 + }, + { + "epoch": 0.18, + "learning_rate": 4.718797514447275e-06, + "loss": 1.1472, + "step": 5904 + }, + { + "epoch": 0.18, + "learning_rate": 4.718685112575501e-06, + "loss": 1.1407, + "step": 5905 + }, + { + "epoch": 0.18, + "learning_rate": 4.718572689582913e-06, + "loss": 1.1459, + "step": 5906 + }, + { + "epoch": 0.18, + "learning_rate": 4.718460245470582e-06, + "loss": 1.187, + "step": 5907 + }, + { + "epoch": 0.18, + "learning_rate": 4.718347780239578e-06, + "loss": 1.0871, + "step": 5908 + }, + { + "epoch": 0.18, + "learning_rate": 4.718235293890971e-06, + "loss": 1.1013, + "step": 5909 + }, + { + "epoch": 0.18, + "learning_rate": 4.718122786425833e-06, + "loss": 1.1567, + "step": 5910 + }, + { + "epoch": 0.18, + "learning_rate": 4.718010257845234e-06, + "loss": 1.088, + "step": 5911 + }, + { + "epoch": 0.18, + "learning_rate": 4.717897708150245e-06, + "loss": 1.2122, + "step": 5912 + }, + { + "epoch": 0.18, + "learning_rate": 4.7177851373419385e-06, + "loss": 1.174, + "step": 5913 + }, + { + "epoch": 0.18, + "learning_rate": 4.717672545421386e-06, + "loss": 1.2136, + "step": 5914 + }, + { + "epoch": 0.18, + "learning_rate": 4.717559932389658e-06, + "loss": 1.1838, + "step": 5915 + }, + { + "epoch": 0.18, + "learning_rate": 4.7174472982478285e-06, + "loss": 1.1885, + "step": 5916 + }, + { + "epoch": 0.18, + "learning_rate": 4.717334642996968e-06, + "loss": 1.1937, + "step": 5917 + }, + { + "epoch": 0.18, + "learning_rate": 4.71722196663815e-06, + "loss": 1.2341, + "step": 5918 + }, + { + "epoch": 0.18, + "learning_rate": 4.717109269172446e-06, + "loss": 1.1198, + "step": 5919 + }, + { + "epoch": 0.18, + "learning_rate": 4.71699655060093e-06, + "loss": 1.0998, + "step": 5920 + }, + { + "epoch": 0.18, + "learning_rate": 4.716883810924675e-06, + "loss": 1.0839, + "step": 5921 + }, + { + "epoch": 0.18, + "learning_rate": 4.716771050144754e-06, + "loss": 1.1141, + "step": 5922 + }, + { + "epoch": 0.18, + "learning_rate": 4.71665826826224e-06, + "loss": 1.1157, + "step": 5923 + }, + { + "epoch": 0.18, + "learning_rate": 4.716545465278206e-06, + "loss": 1.1772, + "step": 5924 + }, + { + "epoch": 0.18, + "learning_rate": 4.716432641193728e-06, + "loss": 1.1701, + "step": 5925 + }, + { + "epoch": 0.18, + "learning_rate": 4.7163197960098775e-06, + "loss": 1.0554, + "step": 5926 + }, + { + "epoch": 0.18, + "learning_rate": 4.716206929727731e-06, + "loss": 1.0982, + "step": 5927 + }, + { + "epoch": 0.18, + "learning_rate": 4.716094042348362e-06, + "loss": 1.1037, + "step": 5928 + }, + { + "epoch": 0.18, + "learning_rate": 4.715981133872843e-06, + "loss": 1.0888, + "step": 5929 + }, + { + "epoch": 0.18, + "learning_rate": 4.715868204302253e-06, + "loss": 1.1555, + "step": 5930 + }, + { + "epoch": 0.18, + "learning_rate": 4.715755253637664e-06, + "loss": 1.0562, + "step": 5931 + }, + { + "epoch": 0.18, + "learning_rate": 4.7156422818801525e-06, + "loss": 1.1284, + "step": 5932 + }, + { + "epoch": 0.18, + "learning_rate": 4.715529289030793e-06, + "loss": 1.1382, + "step": 5933 + }, + { + "epoch": 0.18, + "learning_rate": 4.715416275090662e-06, + "loss": 1.1376, + "step": 5934 + }, + { + "epoch": 0.18, + "learning_rate": 4.715303240060835e-06, + "loss": 1.0914, + "step": 5935 + }, + { + "epoch": 0.18, + "learning_rate": 4.715190183942388e-06, + "loss": 1.1653, + "step": 5936 + }, + { + "epoch": 0.18, + "learning_rate": 4.7150771067363975e-06, + "loss": 1.1833, + "step": 5937 + }, + { + "epoch": 0.18, + "learning_rate": 4.714964008443941e-06, + "loss": 1.152, + "step": 5938 + }, + { + "epoch": 0.18, + "learning_rate": 4.714850889066092e-06, + "loss": 1.0626, + "step": 5939 + }, + { + "epoch": 0.18, + "learning_rate": 4.7147377486039295e-06, + "loss": 1.158, + "step": 5940 + }, + { + "epoch": 0.18, + "learning_rate": 4.714624587058531e-06, + "loss": 1.1371, + "step": 5941 + }, + { + "epoch": 0.18, + "learning_rate": 4.714511404430973e-06, + "loss": 1.1638, + "step": 5942 + }, + { + "epoch": 0.18, + "learning_rate": 4.714398200722332e-06, + "loss": 1.2308, + "step": 5943 + }, + { + "epoch": 0.18, + "learning_rate": 4.714284975933687e-06, + "loss": 1.1569, + "step": 5944 + }, + { + "epoch": 0.18, + "learning_rate": 4.714171730066116e-06, + "loss": 1.1705, + "step": 5945 + }, + { + "epoch": 0.18, + "learning_rate": 4.714058463120696e-06, + "loss": 1.1975, + "step": 5946 + }, + { + "epoch": 0.18, + "learning_rate": 4.7139451750985065e-06, + "loss": 1.0565, + "step": 5947 + }, + { + "epoch": 0.18, + "learning_rate": 4.713831866000625e-06, + "loss": 1.249, + "step": 5948 + }, + { + "epoch": 0.18, + "learning_rate": 4.71371853582813e-06, + "loss": 1.1062, + "step": 5949 + }, + { + "epoch": 0.18, + "learning_rate": 4.713605184582101e-06, + "loss": 1.2361, + "step": 5950 + }, + { + "epoch": 0.18, + "learning_rate": 4.713491812263616e-06, + "loss": 1.1357, + "step": 5951 + }, + { + "epoch": 0.18, + "learning_rate": 4.713378418873757e-06, + "loss": 1.1362, + "step": 5952 + }, + { + "epoch": 0.18, + "learning_rate": 4.713265004413599e-06, + "loss": 1.1105, + "step": 5953 + }, + { + "epoch": 0.18, + "learning_rate": 4.713151568884226e-06, + "loss": 1.2318, + "step": 5954 + }, + { + "epoch": 0.18, + "learning_rate": 4.7130381122867145e-06, + "loss": 1.1411, + "step": 5955 + }, + { + "epoch": 0.18, + "learning_rate": 4.712924634622147e-06, + "loss": 1.0914, + "step": 5956 + }, + { + "epoch": 0.18, + "learning_rate": 4.7128111358916016e-06, + "loss": 1.2146, + "step": 5957 + }, + { + "epoch": 0.18, + "learning_rate": 4.7126976160961616e-06, + "loss": 1.2012, + "step": 5958 + }, + { + "epoch": 0.18, + "learning_rate": 4.7125840752369045e-06, + "loss": 1.2228, + "step": 5959 + }, + { + "epoch": 0.18, + "learning_rate": 4.712470513314913e-06, + "loss": 1.2043, + "step": 5960 + }, + { + "epoch": 0.18, + "learning_rate": 4.712356930331268e-06, + "loss": 1.1747, + "step": 5961 + }, + { + "epoch": 0.18, + "learning_rate": 4.71224332628705e-06, + "loss": 1.2228, + "step": 5962 + }, + { + "epoch": 0.18, + "learning_rate": 4.712129701183341e-06, + "loss": 1.2073, + "step": 5963 + }, + { + "epoch": 0.18, + "learning_rate": 4.7120160550212235e-06, + "loss": 1.2031, + "step": 5964 + }, + { + "epoch": 0.18, + "learning_rate": 4.7119023878017785e-06, + "loss": 1.1962, + "step": 5965 + }, + { + "epoch": 0.18, + "learning_rate": 4.711788699526087e-06, + "loss": 1.1194, + "step": 5966 + }, + { + "epoch": 0.18, + "learning_rate": 4.711674990195234e-06, + "loss": 1.1819, + "step": 5967 + }, + { + "epoch": 0.18, + "learning_rate": 4.711561259810299e-06, + "loss": 1.314, + "step": 5968 + }, + { + "epoch": 0.18, + "learning_rate": 4.711447508372366e-06, + "loss": 1.1962, + "step": 5969 + }, + { + "epoch": 0.18, + "learning_rate": 4.711333735882518e-06, + "loss": 1.1121, + "step": 5970 + }, + { + "epoch": 0.18, + "learning_rate": 4.711219942341838e-06, + "loss": 1.0791, + "step": 5971 + }, + { + "epoch": 0.18, + "learning_rate": 4.711106127751408e-06, + "loss": 1.0894, + "step": 5972 + }, + { + "epoch": 0.18, + "learning_rate": 4.710992292112314e-06, + "loss": 1.0952, + "step": 5973 + }, + { + "epoch": 0.18, + "learning_rate": 4.710878435425637e-06, + "loss": 1.0672, + "step": 5974 + }, + { + "epoch": 0.18, + "learning_rate": 4.710764557692463e-06, + "loss": 1.1289, + "step": 5975 + }, + { + "epoch": 0.18, + "learning_rate": 4.710650658913876e-06, + "loss": 1.1295, + "step": 5976 + }, + { + "epoch": 0.18, + "learning_rate": 4.710536739090958e-06, + "loss": 1.1186, + "step": 5977 + }, + { + "epoch": 0.18, + "learning_rate": 4.7104227982247955e-06, + "loss": 1.0634, + "step": 5978 + }, + { + "epoch": 0.18, + "learning_rate": 4.710308836316472e-06, + "loss": 1.1255, + "step": 5979 + }, + { + "epoch": 0.18, + "learning_rate": 4.710194853367074e-06, + "loss": 1.2563, + "step": 5980 + }, + { + "epoch": 0.18, + "learning_rate": 4.710080849377684e-06, + "loss": 1.3062, + "step": 5981 + }, + { + "epoch": 0.18, + "learning_rate": 4.709966824349389e-06, + "loss": 1.0984, + "step": 5982 + }, + { + "epoch": 0.18, + "learning_rate": 4.709852778283275e-06, + "loss": 1.2363, + "step": 5983 + }, + { + "epoch": 0.18, + "learning_rate": 4.709738711180426e-06, + "loss": 1.1016, + "step": 5984 + }, + { + "epoch": 0.18, + "learning_rate": 4.70962462304193e-06, + "loss": 1.1327, + "step": 5985 + }, + { + "epoch": 0.18, + "learning_rate": 4.70951051386887e-06, + "loss": 1.2665, + "step": 5986 + }, + { + "epoch": 0.18, + "learning_rate": 4.709396383662334e-06, + "loss": 1.2076, + "step": 5987 + }, + { + "epoch": 0.18, + "learning_rate": 4.7092822324234105e-06, + "loss": 1.202, + "step": 5988 + }, + { + "epoch": 0.18, + "learning_rate": 4.709168060153183e-06, + "loss": 1.0997, + "step": 5989 + }, + { + "epoch": 0.18, + "learning_rate": 4.70905386685274e-06, + "loss": 1.1981, + "step": 5990 + }, + { + "epoch": 0.18, + "learning_rate": 4.7089396525231676e-06, + "loss": 1.0938, + "step": 5991 + }, + { + "epoch": 0.18, + "learning_rate": 4.708825417165553e-06, + "loss": 1.0494, + "step": 5992 + }, + { + "epoch": 0.18, + "learning_rate": 4.708711160780986e-06, + "loss": 1.2291, + "step": 5993 + }, + { + "epoch": 0.18, + "learning_rate": 4.708596883370551e-06, + "loss": 1.107, + "step": 5994 + }, + { + "epoch": 0.18, + "learning_rate": 4.708482584935338e-06, + "loss": 1.2523, + "step": 5995 + }, + { + "epoch": 0.18, + "learning_rate": 4.708368265476434e-06, + "loss": 1.054, + "step": 5996 + }, + { + "epoch": 0.18, + "learning_rate": 4.708253924994928e-06, + "loss": 1.049, + "step": 5997 + }, + { + "epoch": 0.18, + "learning_rate": 4.708139563491908e-06, + "loss": 1.2289, + "step": 5998 + }, + { + "epoch": 0.18, + "learning_rate": 4.7080251809684635e-06, + "loss": 1.4247, + "step": 5999 + }, + { + "epoch": 0.18, + "learning_rate": 4.707910777425681e-06, + "loss": 1.1728, + "step": 6000 + }, + { + "epoch": 0.18, + "learning_rate": 4.707796352864653e-06, + "loss": 1.2828, + "step": 6001 + }, + { + "epoch": 0.18, + "learning_rate": 4.707681907286467e-06, + "loss": 1.1046, + "step": 6002 + }, + { + "epoch": 0.18, + "learning_rate": 4.707567440692212e-06, + "loss": 1.1583, + "step": 6003 + }, + { + "epoch": 0.18, + "learning_rate": 4.707452953082978e-06, + "loss": 1.2365, + "step": 6004 + }, + { + "epoch": 0.18, + "learning_rate": 4.707338444459855e-06, + "loss": 1.1747, + "step": 6005 + }, + { + "epoch": 0.18, + "learning_rate": 4.707223914823933e-06, + "loss": 1.196, + "step": 6006 + }, + { + "epoch": 0.18, + "learning_rate": 4.707109364176303e-06, + "loss": 1.1561, + "step": 6007 + }, + { + "epoch": 0.18, + "learning_rate": 4.706994792518054e-06, + "loss": 1.1918, + "step": 6008 + }, + { + "epoch": 0.18, + "learning_rate": 4.706880199850279e-06, + "loss": 1.1, + "step": 6009 + }, + { + "epoch": 0.18, + "learning_rate": 4.706765586174066e-06, + "loss": 1.1268, + "step": 6010 + }, + { + "epoch": 0.18, + "learning_rate": 4.706650951490508e-06, + "loss": 1.1573, + "step": 6011 + }, + { + "epoch": 0.18, + "learning_rate": 4.706536295800696e-06, + "loss": 1.2206, + "step": 6012 + }, + { + "epoch": 0.18, + "learning_rate": 4.70642161910572e-06, + "loss": 1.1268, + "step": 6013 + }, + { + "epoch": 0.18, + "learning_rate": 4.706306921406673e-06, + "loss": 1.1986, + "step": 6014 + }, + { + "epoch": 0.18, + "learning_rate": 4.706192202704648e-06, + "loss": 1.1995, + "step": 6015 + }, + { + "epoch": 0.18, + "learning_rate": 4.706077463000734e-06, + "loss": 1.1069, + "step": 6016 + }, + { + "epoch": 0.18, + "learning_rate": 4.705962702296026e-06, + "loss": 1.2539, + "step": 6017 + }, + { + "epoch": 0.18, + "learning_rate": 4.705847920591616e-06, + "loss": 1.1365, + "step": 6018 + }, + { + "epoch": 0.18, + "learning_rate": 4.7057331178885954e-06, + "loss": 1.1929, + "step": 6019 + }, + { + "epoch": 0.18, + "learning_rate": 4.705618294188058e-06, + "loss": 1.1846, + "step": 6020 + }, + { + "epoch": 0.18, + "learning_rate": 4.705503449491096e-06, + "loss": 0.9722, + "step": 6021 + }, + { + "epoch": 0.18, + "learning_rate": 4.705388583798805e-06, + "loss": 1.2217, + "step": 6022 + }, + { + "epoch": 0.18, + "learning_rate": 4.705273697112276e-06, + "loss": 1.0921, + "step": 6023 + }, + { + "epoch": 0.18, + "learning_rate": 4.705158789432603e-06, + "loss": 1.1411, + "step": 6024 + }, + { + "epoch": 0.18, + "learning_rate": 4.705043860760881e-06, + "loss": 1.2045, + "step": 6025 + }, + { + "epoch": 0.18, + "learning_rate": 4.704928911098204e-06, + "loss": 1.0812, + "step": 6026 + }, + { + "epoch": 0.18, + "learning_rate": 4.704813940445665e-06, + "loss": 1.1293, + "step": 6027 + }, + { + "epoch": 0.18, + "learning_rate": 4.704698948804359e-06, + "loss": 1.1111, + "step": 6028 + }, + { + "epoch": 0.18, + "learning_rate": 4.704583936175381e-06, + "loss": 1.2217, + "step": 6029 + }, + { + "epoch": 0.18, + "learning_rate": 4.704468902559826e-06, + "loss": 1.1447, + "step": 6030 + }, + { + "epoch": 0.18, + "learning_rate": 4.704353847958788e-06, + "loss": 1.1746, + "step": 6031 + }, + { + "epoch": 0.18, + "learning_rate": 4.704238772373363e-06, + "loss": 1.0733, + "step": 6032 + }, + { + "epoch": 0.18, + "learning_rate": 4.704123675804647e-06, + "loss": 1.1777, + "step": 6033 + }, + { + "epoch": 0.18, + "learning_rate": 4.704008558253736e-06, + "loss": 1.1771, + "step": 6034 + }, + { + "epoch": 0.18, + "learning_rate": 4.703893419721724e-06, + "loss": 1.1836, + "step": 6035 + }, + { + "epoch": 0.18, + "learning_rate": 4.703778260209708e-06, + "loss": 1.0981, + "step": 6036 + }, + { + "epoch": 0.18, + "learning_rate": 4.7036630797187845e-06, + "loss": 1.2242, + "step": 6037 + }, + { + "epoch": 0.18, + "learning_rate": 4.703547878250049e-06, + "loss": 1.1863, + "step": 6038 + }, + { + "epoch": 0.18, + "learning_rate": 4.7034326558046e-06, + "loss": 1.2349, + "step": 6039 + }, + { + "epoch": 0.18, + "learning_rate": 4.7033174123835335e-06, + "loss": 1.1115, + "step": 6040 + }, + { + "epoch": 0.18, + "learning_rate": 4.703202147987945e-06, + "loss": 1.1264, + "step": 6041 + }, + { + "epoch": 0.18, + "learning_rate": 4.703086862618935e-06, + "loss": 1.2047, + "step": 6042 + }, + { + "epoch": 0.18, + "learning_rate": 4.7029715562775975e-06, + "loss": 1.1823, + "step": 6043 + }, + { + "epoch": 0.18, + "learning_rate": 4.7028562289650335e-06, + "loss": 1.1783, + "step": 6044 + }, + { + "epoch": 0.18, + "learning_rate": 4.7027408806823375e-06, + "loss": 1.2213, + "step": 6045 + }, + { + "epoch": 0.18, + "learning_rate": 4.70262551143061e-06, + "loss": 1.1268, + "step": 6046 + }, + { + "epoch": 0.18, + "learning_rate": 4.702510121210948e-06, + "loss": 1.1603, + "step": 6047 + }, + { + "epoch": 0.18, + "learning_rate": 4.702394710024451e-06, + "loss": 1.1233, + "step": 6048 + }, + { + "epoch": 0.18, + "learning_rate": 4.702279277872217e-06, + "loss": 1.2095, + "step": 6049 + }, + { + "epoch": 0.18, + "learning_rate": 4.702163824755345e-06, + "loss": 0.9932, + "step": 6050 + }, + { + "epoch": 0.18, + "learning_rate": 4.702048350674934e-06, + "loss": 1.0639, + "step": 6051 + }, + { + "epoch": 0.18, + "learning_rate": 4.701932855632082e-06, + "loss": 1.1107, + "step": 6052 + }, + { + "epoch": 0.18, + "learning_rate": 4.701817339627891e-06, + "loss": 1.1934, + "step": 6053 + }, + { + "epoch": 0.18, + "learning_rate": 4.701701802663459e-06, + "loss": 1.2224, + "step": 6054 + }, + { + "epoch": 0.18, + "learning_rate": 4.701586244739886e-06, + "loss": 1.1568, + "step": 6055 + }, + { + "epoch": 0.18, + "learning_rate": 4.701470665858273e-06, + "loss": 1.1664, + "step": 6056 + }, + { + "epoch": 0.18, + "learning_rate": 4.701355066019718e-06, + "loss": 1.1407, + "step": 6057 + }, + { + "epoch": 0.18, + "learning_rate": 4.701239445225324e-06, + "loss": 1.1475, + "step": 6058 + }, + { + "epoch": 0.18, + "learning_rate": 4.701123803476191e-06, + "loss": 1.155, + "step": 6059 + }, + { + "epoch": 0.18, + "learning_rate": 4.701008140773419e-06, + "loss": 1.1644, + "step": 6060 + }, + { + "epoch": 0.18, + "learning_rate": 4.70089245711811e-06, + "loss": 1.1801, + "step": 6061 + }, + { + "epoch": 0.18, + "learning_rate": 4.700776752511364e-06, + "loss": 1.1155, + "step": 6062 + }, + { + "epoch": 0.18, + "learning_rate": 4.700661026954284e-06, + "loss": 1.1768, + "step": 6063 + }, + { + "epoch": 0.18, + "learning_rate": 4.70054528044797e-06, + "loss": 1.1472, + "step": 6064 + }, + { + "epoch": 0.18, + "learning_rate": 4.700429512993526e-06, + "loss": 1.1413, + "step": 6065 + }, + { + "epoch": 0.18, + "learning_rate": 4.700313724592051e-06, + "loss": 1.1224, + "step": 6066 + }, + { + "epoch": 0.18, + "learning_rate": 4.700197915244651e-06, + "loss": 1.2635, + "step": 6067 + }, + { + "epoch": 0.18, + "learning_rate": 4.700082084952426e-06, + "loss": 1.1256, + "step": 6068 + }, + { + "epoch": 0.18, + "learning_rate": 4.699966233716479e-06, + "loss": 1.2435, + "step": 6069 + }, + { + "epoch": 0.18, + "learning_rate": 4.699850361537913e-06, + "loss": 1.0928, + "step": 6070 + }, + { + "epoch": 0.18, + "learning_rate": 4.6997344684178305e-06, + "loss": 1.254, + "step": 6071 + }, + { + "epoch": 0.18, + "learning_rate": 4.699618554357336e-06, + "loss": 1.1265, + "step": 6072 + }, + { + "epoch": 0.18, + "learning_rate": 4.699502619357532e-06, + "loss": 1.1863, + "step": 6073 + }, + { + "epoch": 0.18, + "learning_rate": 4.699386663419522e-06, + "loss": 1.0863, + "step": 6074 + }, + { + "epoch": 0.18, + "learning_rate": 4.699270686544411e-06, + "loss": 1.2307, + "step": 6075 + }, + { + "epoch": 0.18, + "learning_rate": 4.699154688733301e-06, + "loss": 1.1932, + "step": 6076 + }, + { + "epoch": 0.18, + "learning_rate": 4.699038669987298e-06, + "loss": 1.0869, + "step": 6077 + }, + { + "epoch": 0.18, + "learning_rate": 4.698922630307506e-06, + "loss": 1.0054, + "step": 6078 + }, + { + "epoch": 0.18, + "learning_rate": 4.698806569695031e-06, + "loss": 1.0997, + "step": 6079 + }, + { + "epoch": 0.18, + "learning_rate": 4.698690488150974e-06, + "loss": 1.1984, + "step": 6080 + }, + { + "epoch": 0.18, + "learning_rate": 4.698574385676445e-06, + "loss": 1.291, + "step": 6081 + }, + { + "epoch": 0.18, + "learning_rate": 4.698458262272545e-06, + "loss": 1.0887, + "step": 6082 + }, + { + "epoch": 0.18, + "learning_rate": 4.698342117940382e-06, + "loss": 1.2169, + "step": 6083 + }, + { + "epoch": 0.18, + "learning_rate": 4.69822595268106e-06, + "loss": 1.1005, + "step": 6084 + }, + { + "epoch": 0.18, + "learning_rate": 4.698109766495686e-06, + "loss": 1.0764, + "step": 6085 + }, + { + "epoch": 0.18, + "learning_rate": 4.697993559385365e-06, + "loss": 1.1885, + "step": 6086 + }, + { + "epoch": 0.18, + "learning_rate": 4.697877331351205e-06, + "loss": 1.0737, + "step": 6087 + }, + { + "epoch": 0.18, + "learning_rate": 4.697761082394311e-06, + "loss": 1.2357, + "step": 6088 + }, + { + "epoch": 0.18, + "learning_rate": 4.697644812515791e-06, + "loss": 1.022, + "step": 6089 + }, + { + "epoch": 0.18, + "learning_rate": 4.697528521716749e-06, + "loss": 1.1382, + "step": 6090 + }, + { + "epoch": 0.18, + "learning_rate": 4.697412209998294e-06, + "loss": 1.1857, + "step": 6091 + }, + { + "epoch": 0.18, + "learning_rate": 4.697295877361534e-06, + "loss": 1.1494, + "step": 6092 + }, + { + "epoch": 0.18, + "learning_rate": 4.697179523807575e-06, + "loss": 1.0682, + "step": 6093 + }, + { + "epoch": 0.18, + "learning_rate": 4.697063149337525e-06, + "loss": 1.1638, + "step": 6094 + }, + { + "epoch": 0.18, + "learning_rate": 4.696946753952492e-06, + "loss": 1.1447, + "step": 6095 + }, + { + "epoch": 0.18, + "learning_rate": 4.696830337653585e-06, + "loss": 1.136, + "step": 6096 + }, + { + "epoch": 0.18, + "learning_rate": 4.69671390044191e-06, + "loss": 1.1783, + "step": 6097 + }, + { + "epoch": 0.18, + "learning_rate": 4.6965974423185774e-06, + "loss": 1.2366, + "step": 6098 + }, + { + "epoch": 0.18, + "learning_rate": 4.696480963284695e-06, + "loss": 1.2075, + "step": 6099 + }, + { + "epoch": 0.18, + "learning_rate": 4.696364463341371e-06, + "loss": 1.1708, + "step": 6100 + }, + { + "epoch": 0.18, + "learning_rate": 4.696247942489716e-06, + "loss": 1.1642, + "step": 6101 + }, + { + "epoch": 0.18, + "learning_rate": 4.696131400730838e-06, + "loss": 1.0643, + "step": 6102 + }, + { + "epoch": 0.18, + "learning_rate": 4.696014838065847e-06, + "loss": 1.1078, + "step": 6103 + }, + { + "epoch": 0.18, + "learning_rate": 4.695898254495851e-06, + "loss": 1.1877, + "step": 6104 + }, + { + "epoch": 0.18, + "learning_rate": 4.695781650021963e-06, + "loss": 1.1584, + "step": 6105 + }, + { + "epoch": 0.18, + "learning_rate": 4.69566502464529e-06, + "loss": 1.1155, + "step": 6106 + }, + { + "epoch": 0.18, + "learning_rate": 4.695548378366944e-06, + "loss": 1.1788, + "step": 6107 + }, + { + "epoch": 0.18, + "learning_rate": 4.695431711188035e-06, + "loss": 1.1043, + "step": 6108 + }, + { + "epoch": 0.18, + "learning_rate": 4.6953150231096735e-06, + "loss": 1.0053, + "step": 6109 + }, + { + "epoch": 0.18, + "learning_rate": 4.69519831413297e-06, + "loss": 1.1325, + "step": 6110 + }, + { + "epoch": 0.18, + "learning_rate": 4.695081584259036e-06, + "loss": 1.1252, + "step": 6111 + }, + { + "epoch": 0.18, + "learning_rate": 4.694964833488982e-06, + "loss": 1.2996, + "step": 6112 + }, + { + "epoch": 0.18, + "learning_rate": 4.69484806182392e-06, + "loss": 1.0649, + "step": 6113 + }, + { + "epoch": 0.18, + "learning_rate": 4.694731269264961e-06, + "loss": 1.1658, + "step": 6114 + }, + { + "epoch": 0.18, + "learning_rate": 4.694614455813219e-06, + "loss": 1.2858, + "step": 6115 + }, + { + "epoch": 0.18, + "learning_rate": 4.694497621469803e-06, + "loss": 1.1785, + "step": 6116 + }, + { + "epoch": 0.18, + "learning_rate": 4.694380766235827e-06, + "loss": 1.2003, + "step": 6117 + }, + { + "epoch": 0.18, + "learning_rate": 4.694263890112402e-06, + "loss": 1.1086, + "step": 6118 + }, + { + "epoch": 0.18, + "learning_rate": 4.694146993100643e-06, + "loss": 1.1475, + "step": 6119 + }, + { + "epoch": 0.18, + "learning_rate": 4.694030075201661e-06, + "loss": 1.1421, + "step": 6120 + }, + { + "epoch": 0.18, + "learning_rate": 4.693913136416569e-06, + "loss": 1.1693, + "step": 6121 + }, + { + "epoch": 0.18, + "learning_rate": 4.693796176746481e-06, + "loss": 1.1555, + "step": 6122 + }, + { + "epoch": 0.18, + "learning_rate": 4.69367919619251e-06, + "loss": 1.2262, + "step": 6123 + }, + { + "epoch": 0.18, + "learning_rate": 4.6935621947557695e-06, + "loss": 1.0751, + "step": 6124 + }, + { + "epoch": 0.18, + "learning_rate": 4.693445172437373e-06, + "loss": 1.2383, + "step": 6125 + }, + { + "epoch": 0.18, + "learning_rate": 4.693328129238435e-06, + "loss": 1.1082, + "step": 6126 + }, + { + "epoch": 0.18, + "learning_rate": 4.693211065160069e-06, + "loss": 1.1544, + "step": 6127 + }, + { + "epoch": 0.18, + "learning_rate": 4.693093980203391e-06, + "loss": 1.0047, + "step": 6128 + }, + { + "epoch": 0.18, + "learning_rate": 4.6929768743695134e-06, + "loss": 1.0098, + "step": 6129 + }, + { + "epoch": 0.18, + "learning_rate": 4.692859747659553e-06, + "loss": 1.1819, + "step": 6130 + }, + { + "epoch": 0.18, + "learning_rate": 4.692742600074624e-06, + "loss": 1.1636, + "step": 6131 + }, + { + "epoch": 0.18, + "learning_rate": 4.6926254316158414e-06, + "loss": 1.2405, + "step": 6132 + }, + { + "epoch": 0.18, + "learning_rate": 4.692508242284321e-06, + "loss": 1.126, + "step": 6133 + }, + { + "epoch": 0.18, + "learning_rate": 4.692391032081177e-06, + "loss": 1.1113, + "step": 6134 + }, + { + "epoch": 0.18, + "learning_rate": 4.692273801007526e-06, + "loss": 1.1782, + "step": 6135 + }, + { + "epoch": 0.18, + "learning_rate": 4.692156549064486e-06, + "loss": 1.1912, + "step": 6136 + }, + { + "epoch": 0.18, + "learning_rate": 4.69203927625317e-06, + "loss": 1.1695, + "step": 6137 + }, + { + "epoch": 0.18, + "learning_rate": 4.691921982574697e-06, + "loss": 1.232, + "step": 6138 + }, + { + "epoch": 0.18, + "learning_rate": 4.691804668030182e-06, + "loss": 1.1476, + "step": 6139 + }, + { + "epoch": 0.18, + "learning_rate": 4.691687332620741e-06, + "loss": 1.0894, + "step": 6140 + }, + { + "epoch": 0.18, + "learning_rate": 4.691569976347493e-06, + "loss": 1.2771, + "step": 6141 + }, + { + "epoch": 0.19, + "learning_rate": 4.6914525992115545e-06, + "loss": 1.2604, + "step": 6142 + }, + { + "epoch": 0.19, + "learning_rate": 4.691335201214043e-06, + "loss": 1.2037, + "step": 6143 + }, + { + "epoch": 0.19, + "learning_rate": 4.691217782356075e-06, + "loss": 1.1414, + "step": 6144 + }, + { + "epoch": 0.19, + "learning_rate": 4.69110034263877e-06, + "loss": 1.0715, + "step": 6145 + }, + { + "epoch": 0.19, + "learning_rate": 4.690982882063244e-06, + "loss": 1.2649, + "step": 6146 + }, + { + "epoch": 0.19, + "learning_rate": 4.690865400630616e-06, + "loss": 1.1815, + "step": 6147 + }, + { + "epoch": 0.19, + "learning_rate": 4.690747898342005e-06, + "loss": 1.2058, + "step": 6148 + }, + { + "epoch": 0.19, + "learning_rate": 4.69063037519853e-06, + "loss": 1.2069, + "step": 6149 + }, + { + "epoch": 0.19, + "learning_rate": 4.690512831201308e-06, + "loss": 1.1721, + "step": 6150 + }, + { + "epoch": 0.19, + "learning_rate": 4.690395266351458e-06, + "loss": 1.1747, + "step": 6151 + }, + { + "epoch": 0.19, + "learning_rate": 4.690277680650101e-06, + "loss": 1.192, + "step": 6152 + }, + { + "epoch": 0.19, + "learning_rate": 4.690160074098356e-06, + "loss": 1.1038, + "step": 6153 + }, + { + "epoch": 0.19, + "learning_rate": 4.690042446697342e-06, + "loss": 1.1885, + "step": 6154 + }, + { + "epoch": 0.19, + "learning_rate": 4.689924798448177e-06, + "loss": 1.1699, + "step": 6155 + }, + { + "epoch": 0.19, + "learning_rate": 4.689807129351984e-06, + "loss": 1.1321, + "step": 6156 + }, + { + "epoch": 0.19, + "learning_rate": 4.689689439409881e-06, + "loss": 1.0947, + "step": 6157 + }, + { + "epoch": 0.19, + "learning_rate": 4.689571728622989e-06, + "loss": 1.0423, + "step": 6158 + }, + { + "epoch": 0.19, + "learning_rate": 4.689453996992429e-06, + "loss": 0.9735, + "step": 6159 + }, + { + "epoch": 0.19, + "learning_rate": 4.689336244519322e-06, + "loss": 1.0319, + "step": 6160 + }, + { + "epoch": 0.19, + "learning_rate": 4.689218471204787e-06, + "loss": 1.2474, + "step": 6161 + }, + { + "epoch": 0.19, + "learning_rate": 4.689100677049948e-06, + "loss": 1.1189, + "step": 6162 + }, + { + "epoch": 0.19, + "learning_rate": 4.688982862055924e-06, + "loss": 1.1134, + "step": 6163 + }, + { + "epoch": 0.19, + "learning_rate": 4.688865026223838e-06, + "loss": 1.0871, + "step": 6164 + }, + { + "epoch": 0.19, + "learning_rate": 4.68874716955481e-06, + "loss": 1.1793, + "step": 6165 + }, + { + "epoch": 0.19, + "learning_rate": 4.688629292049964e-06, + "loss": 1.1665, + "step": 6166 + }, + { + "epoch": 0.19, + "learning_rate": 4.688511393710421e-06, + "loss": 1.1242, + "step": 6167 + }, + { + "epoch": 0.19, + "learning_rate": 4.688393474537304e-06, + "loss": 1.1467, + "step": 6168 + }, + { + "epoch": 0.19, + "learning_rate": 4.688275534531735e-06, + "loss": 1.066, + "step": 6169 + }, + { + "epoch": 0.19, + "learning_rate": 4.688157573694837e-06, + "loss": 1.1446, + "step": 6170 + }, + { + "epoch": 0.19, + "learning_rate": 4.688039592027731e-06, + "loss": 1.197, + "step": 6171 + }, + { + "epoch": 0.19, + "learning_rate": 4.6879215895315436e-06, + "loss": 1.2003, + "step": 6172 + }, + { + "epoch": 0.19, + "learning_rate": 4.687803566207396e-06, + "loss": 1.2406, + "step": 6173 + }, + { + "epoch": 0.19, + "learning_rate": 4.687685522056412e-06, + "loss": 1.1993, + "step": 6174 + }, + { + "epoch": 0.19, + "learning_rate": 4.687567457079716e-06, + "loss": 1.1898, + "step": 6175 + }, + { + "epoch": 0.19, + "learning_rate": 4.687449371278431e-06, + "loss": 1.1987, + "step": 6176 + }, + { + "epoch": 0.19, + "learning_rate": 4.6873312646536815e-06, + "loss": 1.1035, + "step": 6177 + }, + { + "epoch": 0.19, + "learning_rate": 4.687213137206592e-06, + "loss": 1.1984, + "step": 6178 + }, + { + "epoch": 0.19, + "learning_rate": 4.687094988938286e-06, + "loss": 1.1273, + "step": 6179 + }, + { + "epoch": 0.19, + "learning_rate": 4.68697681984989e-06, + "loss": 1.1282, + "step": 6180 + }, + { + "epoch": 0.19, + "learning_rate": 4.686858629942527e-06, + "loss": 1.1938, + "step": 6181 + }, + { + "epoch": 0.19, + "learning_rate": 4.686740419217324e-06, + "loss": 1.1481, + "step": 6182 + }, + { + "epoch": 0.19, + "learning_rate": 4.686622187675405e-06, + "loss": 1.1643, + "step": 6183 + }, + { + "epoch": 0.19, + "learning_rate": 4.686503935317896e-06, + "loss": 1.1766, + "step": 6184 + }, + { + "epoch": 0.19, + "learning_rate": 4.686385662145922e-06, + "loss": 1.1493, + "step": 6185 + }, + { + "epoch": 0.19, + "learning_rate": 4.686267368160611e-06, + "loss": 1.1347, + "step": 6186 + }, + { + "epoch": 0.19, + "learning_rate": 4.686149053363086e-06, + "loss": 1.1126, + "step": 6187 + }, + { + "epoch": 0.19, + "learning_rate": 4.686030717754476e-06, + "loss": 1.0924, + "step": 6188 + }, + { + "epoch": 0.19, + "learning_rate": 4.685912361335906e-06, + "loss": 1.1661, + "step": 6189 + }, + { + "epoch": 0.19, + "learning_rate": 4.685793984108503e-06, + "loss": 1.0546, + "step": 6190 + }, + { + "epoch": 0.19, + "learning_rate": 4.685675586073394e-06, + "loss": 1.1114, + "step": 6191 + }, + { + "epoch": 0.19, + "learning_rate": 4.685557167231706e-06, + "loss": 1.1512, + "step": 6192 + }, + { + "epoch": 0.19, + "learning_rate": 4.685438727584566e-06, + "loss": 1.1241, + "step": 6193 + }, + { + "epoch": 0.19, + "learning_rate": 4.6853202671331025e-06, + "loss": 1.2205, + "step": 6194 + }, + { + "epoch": 0.19, + "learning_rate": 4.685201785878442e-06, + "loss": 1.1959, + "step": 6195 + }, + { + "epoch": 0.19, + "learning_rate": 4.685083283821713e-06, + "loss": 1.0831, + "step": 6196 + }, + { + "epoch": 0.19, + "learning_rate": 4.684964760964044e-06, + "loss": 1.0858, + "step": 6197 + }, + { + "epoch": 0.19, + "learning_rate": 4.684846217306563e-06, + "loss": 1.0947, + "step": 6198 + }, + { + "epoch": 0.19, + "learning_rate": 4.6847276528503975e-06, + "loss": 1.1157, + "step": 6199 + }, + { + "epoch": 0.19, + "learning_rate": 4.684609067596677e-06, + "loss": 1.1168, + "step": 6200 + }, + { + "epoch": 0.19, + "learning_rate": 4.684490461546532e-06, + "loss": 1.1225, + "step": 6201 + }, + { + "epoch": 0.19, + "learning_rate": 4.684371834701087e-06, + "loss": 1.1141, + "step": 6202 + }, + { + "epoch": 0.19, + "learning_rate": 4.684253187061476e-06, + "loss": 1.2032, + "step": 6203 + }, + { + "epoch": 0.19, + "learning_rate": 4.684134518628827e-06, + "loss": 1.1334, + "step": 6204 + }, + { + "epoch": 0.19, + "learning_rate": 4.684015829404268e-06, + "loss": 1.2772, + "step": 6205 + }, + { + "epoch": 0.19, + "learning_rate": 4.683897119388931e-06, + "loss": 1.1996, + "step": 6206 + }, + { + "epoch": 0.19, + "learning_rate": 4.683778388583945e-06, + "loss": 1.2452, + "step": 6207 + }, + { + "epoch": 0.19, + "learning_rate": 4.68365963699044e-06, + "loss": 1.1804, + "step": 6208 + }, + { + "epoch": 0.19, + "learning_rate": 4.683540864609548e-06, + "loss": 1.2017, + "step": 6209 + }, + { + "epoch": 0.19, + "learning_rate": 4.683422071442397e-06, + "loss": 1.1575, + "step": 6210 + }, + { + "epoch": 0.19, + "learning_rate": 4.683303257490121e-06, + "loss": 1.174, + "step": 6211 + }, + { + "epoch": 0.19, + "learning_rate": 4.683184422753849e-06, + "loss": 1.2759, + "step": 6212 + }, + { + "epoch": 0.19, + "learning_rate": 4.683065567234712e-06, + "loss": 1.1222, + "step": 6213 + }, + { + "epoch": 0.19, + "learning_rate": 4.682946690933844e-06, + "loss": 1.1201, + "step": 6214 + }, + { + "epoch": 0.19, + "learning_rate": 4.682827793852373e-06, + "loss": 1.2097, + "step": 6215 + }, + { + "epoch": 0.19, + "learning_rate": 4.6827088759914345e-06, + "loss": 1.1957, + "step": 6216 + }, + { + "epoch": 0.19, + "learning_rate": 4.682589937352157e-06, + "loss": 1.2517, + "step": 6217 + }, + { + "epoch": 0.19, + "learning_rate": 4.682470977935675e-06, + "loss": 1.2003, + "step": 6218 + }, + { + "epoch": 0.19, + "learning_rate": 4.682351997743121e-06, + "loss": 1.2034, + "step": 6219 + }, + { + "epoch": 0.19, + "learning_rate": 4.682232996775626e-06, + "loss": 1.0353, + "step": 6220 + }, + { + "epoch": 0.19, + "learning_rate": 4.682113975034324e-06, + "loss": 1.1487, + "step": 6221 + }, + { + "epoch": 0.19, + "learning_rate": 4.681994932520349e-06, + "loss": 1.1345, + "step": 6222 + }, + { + "epoch": 0.19, + "learning_rate": 4.681875869234833e-06, + "loss": 1.1998, + "step": 6223 + }, + { + "epoch": 0.19, + "learning_rate": 4.681756785178909e-06, + "loss": 1.3082, + "step": 6224 + }, + { + "epoch": 0.19, + "learning_rate": 4.681637680353711e-06, + "loss": 1.0995, + "step": 6225 + }, + { + "epoch": 0.19, + "learning_rate": 4.681518554760372e-06, + "loss": 1.0731, + "step": 6226 + }, + { + "epoch": 0.19, + "learning_rate": 4.681399408400029e-06, + "loss": 1.1368, + "step": 6227 + }, + { + "epoch": 0.19, + "learning_rate": 4.681280241273814e-06, + "loss": 1.1413, + "step": 6228 + }, + { + "epoch": 0.19, + "learning_rate": 4.681161053382861e-06, + "loss": 1.1925, + "step": 6229 + }, + { + "epoch": 0.19, + "learning_rate": 4.681041844728305e-06, + "loss": 1.1924, + "step": 6230 + }, + { + "epoch": 0.19, + "learning_rate": 4.680922615311281e-06, + "loss": 1.3188, + "step": 6231 + }, + { + "epoch": 0.19, + "learning_rate": 4.680803365132925e-06, + "loss": 1.0345, + "step": 6232 + }, + { + "epoch": 0.19, + "learning_rate": 4.680684094194371e-06, + "loss": 1.0759, + "step": 6233 + }, + { + "epoch": 0.19, + "learning_rate": 4.680564802496754e-06, + "loss": 1.0794, + "step": 6234 + }, + { + "epoch": 0.19, + "learning_rate": 4.680445490041211e-06, + "loss": 1.1174, + "step": 6235 + }, + { + "epoch": 0.19, + "learning_rate": 4.680326156828876e-06, + "loss": 1.1259, + "step": 6236 + }, + { + "epoch": 0.19, + "learning_rate": 4.6802068028608874e-06, + "loss": 1.2006, + "step": 6237 + }, + { + "epoch": 0.19, + "learning_rate": 4.68008742813838e-06, + "loss": 1.0464, + "step": 6238 + }, + { + "epoch": 0.19, + "learning_rate": 4.679968032662489e-06, + "loss": 1.1044, + "step": 6239 + }, + { + "epoch": 0.19, + "learning_rate": 4.679848616434353e-06, + "loss": 1.193, + "step": 6240 + }, + { + "epoch": 0.19, + "learning_rate": 4.679729179455108e-06, + "loss": 1.1121, + "step": 6241 + }, + { + "epoch": 0.19, + "learning_rate": 4.679609721725891e-06, + "loss": 1.2039, + "step": 6242 + }, + { + "epoch": 0.19, + "learning_rate": 4.679490243247839e-06, + "loss": 1.1028, + "step": 6243 + }, + { + "epoch": 0.19, + "learning_rate": 4.67937074402209e-06, + "loss": 1.0853, + "step": 6244 + }, + { + "epoch": 0.19, + "learning_rate": 4.679251224049781e-06, + "loss": 1.1216, + "step": 6245 + }, + { + "epoch": 0.19, + "learning_rate": 4.67913168333205e-06, + "loss": 1.1195, + "step": 6246 + }, + { + "epoch": 0.19, + "learning_rate": 4.679012121870035e-06, + "loss": 1.0891, + "step": 6247 + }, + { + "epoch": 0.19, + "learning_rate": 4.678892539664873e-06, + "loss": 1.0762, + "step": 6248 + }, + { + "epoch": 0.19, + "learning_rate": 4.678772936717705e-06, + "loss": 1.2192, + "step": 6249 + }, + { + "epoch": 0.19, + "learning_rate": 4.678653313029667e-06, + "loss": 1.1683, + "step": 6250 + }, + { + "epoch": 0.19, + "learning_rate": 4.678533668601899e-06, + "loss": 1.1249, + "step": 6251 + }, + { + "epoch": 0.19, + "learning_rate": 4.678414003435539e-06, + "loss": 1.1621, + "step": 6252 + }, + { + "epoch": 0.19, + "learning_rate": 4.678294317531728e-06, + "loss": 1.2095, + "step": 6253 + }, + { + "epoch": 0.19, + "learning_rate": 4.678174610891603e-06, + "loss": 1.0165, + "step": 6254 + }, + { + "epoch": 0.19, + "learning_rate": 4.678054883516306e-06, + "loss": 1.1461, + "step": 6255 + }, + { + "epoch": 0.19, + "learning_rate": 4.6779351354069746e-06, + "loss": 1.0939, + "step": 6256 + }, + { + "epoch": 0.19, + "learning_rate": 4.6778153665647494e-06, + "loss": 1.0897, + "step": 6257 + }, + { + "epoch": 0.19, + "learning_rate": 4.677695576990772e-06, + "loss": 1.1312, + "step": 6258 + }, + { + "epoch": 0.19, + "learning_rate": 4.67757576668618e-06, + "loss": 1.0255, + "step": 6259 + }, + { + "epoch": 0.19, + "learning_rate": 4.677455935652117e-06, + "loss": 1.0821, + "step": 6260 + }, + { + "epoch": 0.19, + "learning_rate": 4.677336083889721e-06, + "loss": 1.1464, + "step": 6261 + }, + { + "epoch": 0.19, + "learning_rate": 4.677216211400135e-06, + "loss": 1.2416, + "step": 6262 + }, + { + "epoch": 0.19, + "learning_rate": 4.677096318184498e-06, + "loss": 1.1683, + "step": 6263 + }, + { + "epoch": 0.19, + "learning_rate": 4.676976404243954e-06, + "loss": 1.2074, + "step": 6264 + }, + { + "epoch": 0.19, + "learning_rate": 4.676856469579643e-06, + "loss": 1.0652, + "step": 6265 + }, + { + "epoch": 0.19, + "learning_rate": 4.676736514192706e-06, + "loss": 1.1134, + "step": 6266 + }, + { + "epoch": 0.19, + "learning_rate": 4.676616538084286e-06, + "loss": 1.1063, + "step": 6267 + }, + { + "epoch": 0.19, + "learning_rate": 4.6764965412555245e-06, + "loss": 1.1873, + "step": 6268 + }, + { + "epoch": 0.19, + "learning_rate": 4.676376523707565e-06, + "loss": 1.1339, + "step": 6269 + }, + { + "epoch": 0.19, + "learning_rate": 4.676256485441548e-06, + "loss": 1.1952, + "step": 6270 + }, + { + "epoch": 0.19, + "learning_rate": 4.676136426458618e-06, + "loss": 1.1686, + "step": 6271 + }, + { + "epoch": 0.19, + "learning_rate": 4.676016346759918e-06, + "loss": 1.2288, + "step": 6272 + }, + { + "epoch": 0.19, + "learning_rate": 4.6758962463465895e-06, + "loss": 1.2402, + "step": 6273 + }, + { + "epoch": 0.19, + "learning_rate": 4.675776125219778e-06, + "loss": 1.1708, + "step": 6274 + }, + { + "epoch": 0.19, + "learning_rate": 4.675655983380624e-06, + "loss": 1.1986, + "step": 6275 + }, + { + "epoch": 0.19, + "learning_rate": 4.675535820830274e-06, + "loss": 1.1311, + "step": 6276 + }, + { + "epoch": 0.19, + "learning_rate": 4.67541563756987e-06, + "loss": 1.1041, + "step": 6277 + }, + { + "epoch": 0.19, + "learning_rate": 4.675295433600557e-06, + "loss": 1.0995, + "step": 6278 + }, + { + "epoch": 0.19, + "learning_rate": 4.675175208923479e-06, + "loss": 1.1075, + "step": 6279 + }, + { + "epoch": 0.19, + "learning_rate": 4.675054963539782e-06, + "loss": 1.1735, + "step": 6280 + }, + { + "epoch": 0.19, + "learning_rate": 4.674934697450607e-06, + "loss": 1.157, + "step": 6281 + }, + { + "epoch": 0.19, + "learning_rate": 4.674814410657103e-06, + "loss": 1.1932, + "step": 6282 + }, + { + "epoch": 0.19, + "learning_rate": 4.674694103160412e-06, + "loss": 1.041, + "step": 6283 + }, + { + "epoch": 0.19, + "learning_rate": 4.674573774961681e-06, + "loss": 1.1832, + "step": 6284 + }, + { + "epoch": 0.19, + "learning_rate": 4.674453426062055e-06, + "loss": 1.1148, + "step": 6285 + }, + { + "epoch": 0.19, + "learning_rate": 4.67433305646268e-06, + "loss": 1.1854, + "step": 6286 + }, + { + "epoch": 0.19, + "learning_rate": 4.674212666164701e-06, + "loss": 1.165, + "step": 6287 + }, + { + "epoch": 0.19, + "learning_rate": 4.6740922551692645e-06, + "loss": 1.111, + "step": 6288 + }, + { + "epoch": 0.19, + "learning_rate": 4.673971823477517e-06, + "loss": 1.1728, + "step": 6289 + }, + { + "epoch": 0.19, + "learning_rate": 4.6738513710906056e-06, + "loss": 1.1368, + "step": 6290 + }, + { + "epoch": 0.19, + "learning_rate": 4.6737308980096755e-06, + "loss": 1.1997, + "step": 6291 + }, + { + "epoch": 0.19, + "learning_rate": 4.673610404235873e-06, + "loss": 1.2446, + "step": 6292 + }, + { + "epoch": 0.19, + "learning_rate": 4.673489889770347e-06, + "loss": 1.0296, + "step": 6293 + }, + { + "epoch": 0.19, + "learning_rate": 4.673369354614244e-06, + "loss": 1.0687, + "step": 6294 + }, + { + "epoch": 0.19, + "learning_rate": 4.673248798768713e-06, + "loss": 1.133, + "step": 6295 + }, + { + "epoch": 0.19, + "learning_rate": 4.673128222234899e-06, + "loss": 1.1075, + "step": 6296 + }, + { + "epoch": 0.19, + "learning_rate": 4.67300762501395e-06, + "loss": 1.1751, + "step": 6297 + }, + { + "epoch": 0.19, + "learning_rate": 4.672887007107016e-06, + "loss": 1.3054, + "step": 6298 + }, + { + "epoch": 0.19, + "learning_rate": 4.672766368515244e-06, + "loss": 1.3577, + "step": 6299 + }, + { + "epoch": 0.19, + "learning_rate": 4.672645709239783e-06, + "loss": 1.2408, + "step": 6300 + }, + { + "epoch": 0.19, + "learning_rate": 4.6725250292817805e-06, + "loss": 1.1215, + "step": 6301 + }, + { + "epoch": 0.19, + "learning_rate": 4.672404328642386e-06, + "loss": 1.1655, + "step": 6302 + }, + { + "epoch": 0.19, + "learning_rate": 4.67228360732275e-06, + "loss": 1.1832, + "step": 6303 + }, + { + "epoch": 0.19, + "learning_rate": 4.672162865324018e-06, + "loss": 1.163, + "step": 6304 + }, + { + "epoch": 0.19, + "learning_rate": 4.672042102647343e-06, + "loss": 1.1478, + "step": 6305 + }, + { + "epoch": 0.19, + "learning_rate": 4.671921319293873e-06, + "loss": 1.1296, + "step": 6306 + }, + { + "epoch": 0.19, + "learning_rate": 4.671800515264758e-06, + "loss": 1.229, + "step": 6307 + }, + { + "epoch": 0.19, + "learning_rate": 4.671679690561149e-06, + "loss": 1.1771, + "step": 6308 + }, + { + "epoch": 0.19, + "learning_rate": 4.671558845184194e-06, + "loss": 1.1591, + "step": 6309 + }, + { + "epoch": 0.19, + "learning_rate": 4.6714379791350455e-06, + "loss": 1.1564, + "step": 6310 + }, + { + "epoch": 0.19, + "learning_rate": 4.671317092414853e-06, + "loss": 1.2029, + "step": 6311 + }, + { + "epoch": 0.19, + "learning_rate": 4.6711961850247675e-06, + "loss": 1.0497, + "step": 6312 + }, + { + "epoch": 0.19, + "learning_rate": 4.67107525696594e-06, + "loss": 1.108, + "step": 6313 + }, + { + "epoch": 0.19, + "learning_rate": 4.670954308239521e-06, + "loss": 1.1147, + "step": 6314 + }, + { + "epoch": 0.19, + "learning_rate": 4.670833338846664e-06, + "loss": 1.1793, + "step": 6315 + }, + { + "epoch": 0.19, + "learning_rate": 4.6707123487885186e-06, + "loss": 1.0615, + "step": 6316 + }, + { + "epoch": 0.19, + "learning_rate": 4.670591338066237e-06, + "loss": 1.3019, + "step": 6317 + }, + { + "epoch": 0.19, + "learning_rate": 4.6704703066809705e-06, + "loss": 1.1761, + "step": 6318 + }, + { + "epoch": 0.19, + "learning_rate": 4.670349254633872e-06, + "loss": 1.1495, + "step": 6319 + }, + { + "epoch": 0.19, + "learning_rate": 4.670228181926094e-06, + "loss": 1.121, + "step": 6320 + }, + { + "epoch": 0.19, + "learning_rate": 4.67010708855879e-06, + "loss": 1.2013, + "step": 6321 + }, + { + "epoch": 0.19, + "learning_rate": 4.669985974533111e-06, + "loss": 1.0524, + "step": 6322 + }, + { + "epoch": 0.19, + "learning_rate": 4.669864839850211e-06, + "loss": 1.1231, + "step": 6323 + }, + { + "epoch": 0.19, + "learning_rate": 4.669743684511243e-06, + "loss": 1.098, + "step": 6324 + }, + { + "epoch": 0.19, + "learning_rate": 4.6696225085173585e-06, + "loss": 1.1555, + "step": 6325 + }, + { + "epoch": 0.19, + "learning_rate": 4.669501311869714e-06, + "loss": 1.1455, + "step": 6326 + }, + { + "epoch": 0.19, + "learning_rate": 4.669380094569462e-06, + "loss": 1.1067, + "step": 6327 + }, + { + "epoch": 0.19, + "learning_rate": 4.669258856617756e-06, + "loss": 1.0129, + "step": 6328 + }, + { + "epoch": 0.19, + "learning_rate": 4.66913759801575e-06, + "loss": 1.1857, + "step": 6329 + }, + { + "epoch": 0.19, + "learning_rate": 4.6690163187645995e-06, + "loss": 1.2083, + "step": 6330 + }, + { + "epoch": 0.19, + "learning_rate": 4.668895018865457e-06, + "loss": 1.2468, + "step": 6331 + }, + { + "epoch": 0.19, + "learning_rate": 4.66877369831948e-06, + "loss": 1.1464, + "step": 6332 + }, + { + "epoch": 0.19, + "learning_rate": 4.668652357127821e-06, + "loss": 1.1322, + "step": 6333 + }, + { + "epoch": 0.19, + "learning_rate": 4.668530995291636e-06, + "loss": 1.116, + "step": 6334 + }, + { + "epoch": 0.19, + "learning_rate": 4.668409612812081e-06, + "loss": 1.2815, + "step": 6335 + }, + { + "epoch": 0.19, + "learning_rate": 4.66828820969031e-06, + "loss": 1.1312, + "step": 6336 + }, + { + "epoch": 0.19, + "learning_rate": 4.6681667859274805e-06, + "loss": 1.2634, + "step": 6337 + }, + { + "epoch": 0.19, + "learning_rate": 4.668045341524747e-06, + "loss": 1.2189, + "step": 6338 + }, + { + "epoch": 0.19, + "learning_rate": 4.667923876483266e-06, + "loss": 1.2358, + "step": 6339 + }, + { + "epoch": 0.19, + "learning_rate": 4.667802390804193e-06, + "loss": 1.1954, + "step": 6340 + }, + { + "epoch": 0.19, + "learning_rate": 4.667680884488686e-06, + "loss": 1.1887, + "step": 6341 + }, + { + "epoch": 0.19, + "learning_rate": 4.667559357537901e-06, + "loss": 1.1665, + "step": 6342 + }, + { + "epoch": 0.19, + "learning_rate": 4.667437809952995e-06, + "loss": 1.1925, + "step": 6343 + }, + { + "epoch": 0.19, + "learning_rate": 4.667316241735125e-06, + "loss": 1.2452, + "step": 6344 + }, + { + "epoch": 0.19, + "learning_rate": 4.667194652885447e-06, + "loss": 1.0715, + "step": 6345 + }, + { + "epoch": 0.19, + "learning_rate": 4.667073043405122e-06, + "loss": 1.1987, + "step": 6346 + }, + { + "epoch": 0.19, + "learning_rate": 4.666951413295303e-06, + "loss": 1.1071, + "step": 6347 + }, + { + "epoch": 0.19, + "learning_rate": 4.666829762557151e-06, + "loss": 1.1168, + "step": 6348 + }, + { + "epoch": 0.19, + "learning_rate": 4.666708091191824e-06, + "loss": 1.1008, + "step": 6349 + }, + { + "epoch": 0.19, + "learning_rate": 4.666586399200478e-06, + "loss": 1.1757, + "step": 6350 + }, + { + "epoch": 0.19, + "learning_rate": 4.666464686584274e-06, + "loss": 1.0391, + "step": 6351 + }, + { + "epoch": 0.19, + "learning_rate": 4.66634295334437e-06, + "loss": 1.0966, + "step": 6352 + }, + { + "epoch": 0.19, + "learning_rate": 4.6662211994819235e-06, + "loss": 1.1302, + "step": 6353 + }, + { + "epoch": 0.19, + "learning_rate": 4.666099424998094e-06, + "loss": 1.1306, + "step": 6354 + }, + { + "epoch": 0.19, + "learning_rate": 4.665977629894043e-06, + "loss": 1.0934, + "step": 6355 + }, + { + "epoch": 0.19, + "learning_rate": 4.665855814170927e-06, + "loss": 1.1838, + "step": 6356 + }, + { + "epoch": 0.19, + "learning_rate": 4.665733977829907e-06, + "loss": 1.1639, + "step": 6357 + }, + { + "epoch": 0.19, + "learning_rate": 4.665612120872142e-06, + "loss": 1.144, + "step": 6358 + }, + { + "epoch": 0.19, + "learning_rate": 4.665490243298793e-06, + "loss": 1.1686, + "step": 6359 + }, + { + "epoch": 0.19, + "learning_rate": 4.66536834511102e-06, + "loss": 1.0964, + "step": 6360 + }, + { + "epoch": 0.19, + "learning_rate": 4.665246426309983e-06, + "loss": 1.1398, + "step": 6361 + }, + { + "epoch": 0.19, + "learning_rate": 4.665124486896842e-06, + "loss": 1.1609, + "step": 6362 + }, + { + "epoch": 0.19, + "learning_rate": 4.66500252687276e-06, + "loss": 1.183, + "step": 6363 + }, + { + "epoch": 0.19, + "learning_rate": 4.664880546238897e-06, + "loss": 1.256, + "step": 6364 + }, + { + "epoch": 0.19, + "learning_rate": 4.6647585449964125e-06, + "loss": 1.2186, + "step": 6365 + }, + { + "epoch": 0.19, + "learning_rate": 4.6646365231464704e-06, + "loss": 1.1567, + "step": 6366 + }, + { + "epoch": 0.19, + "learning_rate": 4.66451448069023e-06, + "loss": 1.1709, + "step": 6367 + }, + { + "epoch": 0.19, + "learning_rate": 4.6643924176288556e-06, + "loss": 1.2751, + "step": 6368 + }, + { + "epoch": 0.19, + "learning_rate": 4.664270333963506e-06, + "loss": 1.1044, + "step": 6369 + }, + { + "epoch": 0.19, + "learning_rate": 4.664148229695347e-06, + "loss": 1.1501, + "step": 6370 + }, + { + "epoch": 0.19, + "learning_rate": 4.664026104825537e-06, + "loss": 1.1169, + "step": 6371 + }, + { + "epoch": 0.19, + "learning_rate": 4.663903959355242e-06, + "loss": 1.0407, + "step": 6372 + }, + { + "epoch": 0.19, + "learning_rate": 4.663781793285624e-06, + "loss": 1.0406, + "step": 6373 + }, + { + "epoch": 0.19, + "learning_rate": 4.6636596066178455e-06, + "loss": 1.3184, + "step": 6374 + }, + { + "epoch": 0.19, + "learning_rate": 4.663537399353069e-06, + "loss": 1.2096, + "step": 6375 + }, + { + "epoch": 0.19, + "learning_rate": 4.663415171492458e-06, + "loss": 1.0483, + "step": 6376 + }, + { + "epoch": 0.19, + "learning_rate": 4.663292923037177e-06, + "loss": 1.187, + "step": 6377 + }, + { + "epoch": 0.19, + "learning_rate": 4.663170653988389e-06, + "loss": 1.1412, + "step": 6378 + }, + { + "epoch": 0.19, + "learning_rate": 4.663048364347259e-06, + "loss": 1.1689, + "step": 6379 + }, + { + "epoch": 0.19, + "learning_rate": 4.662926054114949e-06, + "loss": 1.1491, + "step": 6380 + }, + { + "epoch": 0.19, + "learning_rate": 4.662803723292625e-06, + "loss": 1.3429, + "step": 6381 + }, + { + "epoch": 0.19, + "learning_rate": 4.662681371881453e-06, + "loss": 1.2332, + "step": 6382 + }, + { + "epoch": 0.19, + "learning_rate": 4.662558999882594e-06, + "loss": 1.1196, + "step": 6383 + }, + { + "epoch": 0.19, + "learning_rate": 4.662436607297215e-06, + "loss": 1.1493, + "step": 6384 + }, + { + "epoch": 0.19, + "learning_rate": 4.662314194126481e-06, + "loss": 1.1243, + "step": 6385 + }, + { + "epoch": 0.19, + "learning_rate": 4.6621917603715576e-06, + "loss": 1.0696, + "step": 6386 + }, + { + "epoch": 0.19, + "learning_rate": 4.6620693060336095e-06, + "loss": 1.1041, + "step": 6387 + }, + { + "epoch": 0.19, + "learning_rate": 4.6619468311138035e-06, + "loss": 1.2606, + "step": 6388 + }, + { + "epoch": 0.19, + "learning_rate": 4.661824335613305e-06, + "loss": 1.171, + "step": 6389 + }, + { + "epoch": 0.19, + "learning_rate": 4.66170181953328e-06, + "loss": 1.1198, + "step": 6390 + }, + { + "epoch": 0.19, + "learning_rate": 4.661579282874895e-06, + "loss": 1.1244, + "step": 6391 + }, + { + "epoch": 0.19, + "learning_rate": 4.661456725639316e-06, + "loss": 1.0927, + "step": 6392 + }, + { + "epoch": 0.19, + "learning_rate": 4.66133414782771e-06, + "loss": 1.2139, + "step": 6393 + }, + { + "epoch": 0.19, + "learning_rate": 4.661211549441243e-06, + "loss": 1.1141, + "step": 6394 + }, + { + "epoch": 0.19, + "learning_rate": 4.661088930481084e-06, + "loss": 1.1528, + "step": 6395 + }, + { + "epoch": 0.19, + "learning_rate": 4.6609662909483985e-06, + "loss": 1.1959, + "step": 6396 + }, + { + "epoch": 0.19, + "learning_rate": 4.660843630844355e-06, + "loss": 1.236, + "step": 6397 + }, + { + "epoch": 0.19, + "learning_rate": 4.66072095017012e-06, + "loss": 1.1173, + "step": 6398 + }, + { + "epoch": 0.19, + "learning_rate": 4.660598248926863e-06, + "loss": 1.2988, + "step": 6399 + }, + { + "epoch": 0.19, + "learning_rate": 4.660475527115752e-06, + "loss": 1.1335, + "step": 6400 + }, + { + "epoch": 0.19, + "learning_rate": 4.660352784737953e-06, + "loss": 1.0759, + "step": 6401 + }, + { + "epoch": 0.19, + "learning_rate": 4.6602300217946374e-06, + "loss": 1.0911, + "step": 6402 + }, + { + "epoch": 0.19, + "learning_rate": 4.660107238286971e-06, + "loss": 1.129, + "step": 6403 + }, + { + "epoch": 0.19, + "learning_rate": 4.659984434216125e-06, + "loss": 1.087, + "step": 6404 + }, + { + "epoch": 0.19, + "learning_rate": 4.659861609583267e-06, + "loss": 1.2203, + "step": 6405 + }, + { + "epoch": 0.19, + "learning_rate": 4.659738764389567e-06, + "loss": 1.199, + "step": 6406 + }, + { + "epoch": 0.19, + "learning_rate": 4.659615898636194e-06, + "loss": 1.1078, + "step": 6407 + }, + { + "epoch": 0.19, + "learning_rate": 4.6594930123243176e-06, + "loss": 1.1613, + "step": 6408 + }, + { + "epoch": 0.19, + "learning_rate": 4.6593701054551075e-06, + "loss": 1.0734, + "step": 6409 + }, + { + "epoch": 0.19, + "learning_rate": 4.659247178029735e-06, + "loss": 1.1064, + "step": 6410 + }, + { + "epoch": 0.19, + "learning_rate": 4.6591242300493685e-06, + "loss": 1.1447, + "step": 6411 + }, + { + "epoch": 0.19, + "learning_rate": 4.659001261515179e-06, + "loss": 1.2029, + "step": 6412 + }, + { + "epoch": 0.19, + "learning_rate": 4.658878272428337e-06, + "loss": 1.2205, + "step": 6413 + }, + { + "epoch": 0.19, + "learning_rate": 4.658755262790016e-06, + "loss": 1.1693, + "step": 6414 + }, + { + "epoch": 0.19, + "learning_rate": 4.658632232601382e-06, + "loss": 1.2242, + "step": 6415 + }, + { + "epoch": 0.19, + "learning_rate": 4.65850918186361e-06, + "loss": 1.0232, + "step": 6416 + }, + { + "epoch": 0.19, + "learning_rate": 4.6583861105778696e-06, + "loss": 1.1895, + "step": 6417 + }, + { + "epoch": 0.19, + "learning_rate": 4.658263018745333e-06, + "loss": 1.1328, + "step": 6418 + }, + { + "epoch": 0.19, + "learning_rate": 4.658139906367172e-06, + "loss": 1.2146, + "step": 6419 + }, + { + "epoch": 0.19, + "learning_rate": 4.658016773444559e-06, + "loss": 1.1527, + "step": 6420 + }, + { + "epoch": 0.19, + "learning_rate": 4.657893619978665e-06, + "loss": 1.036, + "step": 6421 + }, + { + "epoch": 0.19, + "learning_rate": 4.657770445970663e-06, + "loss": 1.1577, + "step": 6422 + }, + { + "epoch": 0.19, + "learning_rate": 4.657647251421726e-06, + "loss": 1.1597, + "step": 6423 + }, + { + "epoch": 0.19, + "learning_rate": 4.6575240363330265e-06, + "loss": 1.1523, + "step": 6424 + }, + { + "epoch": 0.19, + "learning_rate": 4.657400800705737e-06, + "loss": 1.1481, + "step": 6425 + }, + { + "epoch": 0.19, + "learning_rate": 4.657277544541031e-06, + "loss": 1.2001, + "step": 6426 + }, + { + "epoch": 0.19, + "learning_rate": 4.657154267840081e-06, + "loss": 1.0788, + "step": 6427 + }, + { + "epoch": 0.19, + "learning_rate": 4.6570309706040615e-06, + "loss": 1.098, + "step": 6428 + }, + { + "epoch": 0.19, + "learning_rate": 4.656907652834147e-06, + "loss": 1.179, + "step": 6429 + }, + { + "epoch": 0.19, + "learning_rate": 4.6567843145315095e-06, + "loss": 1.1599, + "step": 6430 + }, + { + "epoch": 0.19, + "learning_rate": 4.656660955697325e-06, + "loss": 1.1887, + "step": 6431 + }, + { + "epoch": 0.19, + "learning_rate": 4.6565375763327655e-06, + "loss": 1.1917, + "step": 6432 + }, + { + "epoch": 0.19, + "learning_rate": 4.6564141764390085e-06, + "loss": 1.1337, + "step": 6433 + }, + { + "epoch": 0.19, + "learning_rate": 4.656290756017226e-06, + "loss": 1.2053, + "step": 6434 + }, + { + "epoch": 0.19, + "learning_rate": 4.656167315068594e-06, + "loss": 1.1355, + "step": 6435 + }, + { + "epoch": 0.19, + "learning_rate": 4.656043853594288e-06, + "loss": 1.108, + "step": 6436 + }, + { + "epoch": 0.19, + "learning_rate": 4.655920371595483e-06, + "loss": 1.2715, + "step": 6437 + }, + { + "epoch": 0.19, + "learning_rate": 4.655796869073354e-06, + "loss": 1.1313, + "step": 6438 + }, + { + "epoch": 0.19, + "learning_rate": 4.655673346029077e-06, + "loss": 1.0955, + "step": 6439 + }, + { + "epoch": 0.19, + "learning_rate": 4.655549802463828e-06, + "loss": 1.118, + "step": 6440 + }, + { + "epoch": 0.19, + "learning_rate": 4.655426238378784e-06, + "loss": 1.2083, + "step": 6441 + }, + { + "epoch": 0.19, + "learning_rate": 4.655302653775119e-06, + "loss": 1.1293, + "step": 6442 + }, + { + "epoch": 0.19, + "learning_rate": 4.655179048654011e-06, + "loss": 1.2015, + "step": 6443 + }, + { + "epoch": 0.19, + "learning_rate": 4.655055423016638e-06, + "loss": 1.1449, + "step": 6444 + }, + { + "epoch": 0.19, + "learning_rate": 4.654931776864174e-06, + "loss": 1.2233, + "step": 6445 + }, + { + "epoch": 0.19, + "learning_rate": 4.654808110197797e-06, + "loss": 1.1429, + "step": 6446 + }, + { + "epoch": 0.19, + "learning_rate": 4.654684423018685e-06, + "loss": 1.1337, + "step": 6447 + }, + { + "epoch": 0.19, + "learning_rate": 4.6545607153280146e-06, + "loss": 1.218, + "step": 6448 + }, + { + "epoch": 0.19, + "learning_rate": 4.654436987126965e-06, + "loss": 1.1779, + "step": 6449 + }, + { + "epoch": 0.19, + "learning_rate": 4.654313238416712e-06, + "loss": 1.0595, + "step": 6450 + }, + { + "epoch": 0.19, + "learning_rate": 4.6541894691984345e-06, + "loss": 1.0853, + "step": 6451 + }, + { + "epoch": 0.19, + "learning_rate": 4.654065679473311e-06, + "loss": 1.1646, + "step": 6452 + }, + { + "epoch": 0.19, + "learning_rate": 4.653941869242519e-06, + "loss": 1.1299, + "step": 6453 + }, + { + "epoch": 0.19, + "learning_rate": 4.653818038507239e-06, + "loss": 0.9478, + "step": 6454 + }, + { + "epoch": 0.19, + "learning_rate": 4.653694187268648e-06, + "loss": 1.2415, + "step": 6455 + }, + { + "epoch": 0.19, + "learning_rate": 4.653570315527925e-06, + "loss": 1.2132, + "step": 6456 + }, + { + "epoch": 0.19, + "learning_rate": 4.65344642328625e-06, + "loss": 1.1462, + "step": 6457 + }, + { + "epoch": 0.19, + "learning_rate": 4.653322510544803e-06, + "loss": 1.1907, + "step": 6458 + }, + { + "epoch": 0.19, + "learning_rate": 4.6531985773047625e-06, + "loss": 1.009, + "step": 6459 + }, + { + "epoch": 0.19, + "learning_rate": 4.653074623567308e-06, + "loss": 1.2145, + "step": 6460 + }, + { + "epoch": 0.19, + "learning_rate": 4.652950649333621e-06, + "loss": 1.2587, + "step": 6461 + }, + { + "epoch": 0.19, + "learning_rate": 4.65282665460488e-06, + "loss": 1.1519, + "step": 6462 + }, + { + "epoch": 0.19, + "learning_rate": 4.652702639382265e-06, + "loss": 1.0361, + "step": 6463 + }, + { + "epoch": 0.19, + "learning_rate": 4.652578603666959e-06, + "loss": 1.0625, + "step": 6464 + }, + { + "epoch": 0.19, + "learning_rate": 4.652454547460142e-06, + "loss": 1.0466, + "step": 6465 + }, + { + "epoch": 0.19, + "learning_rate": 4.652330470762994e-06, + "loss": 1.0929, + "step": 6466 + }, + { + "epoch": 0.19, + "learning_rate": 4.652206373576695e-06, + "loss": 1.1005, + "step": 6467 + }, + { + "epoch": 0.19, + "learning_rate": 4.652082255902429e-06, + "loss": 1.2032, + "step": 6468 + }, + { + "epoch": 0.19, + "learning_rate": 4.651958117741377e-06, + "loss": 1.0323, + "step": 6469 + }, + { + "epoch": 0.19, + "learning_rate": 4.65183395909472e-06, + "loss": 1.1655, + "step": 6470 + }, + { + "epoch": 0.19, + "learning_rate": 4.651709779963639e-06, + "loss": 1.1345, + "step": 6471 + }, + { + "epoch": 0.19, + "learning_rate": 4.6515855803493175e-06, + "loss": 1.2031, + "step": 6472 + }, + { + "epoch": 0.19, + "learning_rate": 4.651461360252938e-06, + "loss": 1.2526, + "step": 6473 + }, + { + "epoch": 0.2, + "learning_rate": 4.651337119675683e-06, + "loss": 1.1569, + "step": 6474 + }, + { + "epoch": 0.2, + "learning_rate": 4.651212858618733e-06, + "loss": 1.1479, + "step": 6475 + }, + { + "epoch": 0.2, + "learning_rate": 4.651088577083273e-06, + "loss": 1.1428, + "step": 6476 + }, + { + "epoch": 0.2, + "learning_rate": 4.650964275070488e-06, + "loss": 1.1967, + "step": 6477 + }, + { + "epoch": 0.2, + "learning_rate": 4.650839952581556e-06, + "loss": 1.0869, + "step": 6478 + }, + { + "epoch": 0.2, + "learning_rate": 4.650715609617666e-06, + "loss": 1.2408, + "step": 6479 + }, + { + "epoch": 0.2, + "learning_rate": 4.6505912461799985e-06, + "loss": 1.0402, + "step": 6480 + }, + { + "epoch": 0.2, + "learning_rate": 4.650466862269738e-06, + "loss": 1.2397, + "step": 6481 + }, + { + "epoch": 0.2, + "learning_rate": 4.650342457888068e-06, + "loss": 1.1207, + "step": 6482 + }, + { + "epoch": 0.2, + "learning_rate": 4.650218033036174e-06, + "loss": 1.0825, + "step": 6483 + }, + { + "epoch": 0.2, + "learning_rate": 4.65009358771524e-06, + "loss": 1.136, + "step": 6484 + }, + { + "epoch": 0.2, + "learning_rate": 4.64996912192645e-06, + "loss": 1.0883, + "step": 6485 + }, + { + "epoch": 0.2, + "learning_rate": 4.64984463567099e-06, + "loss": 1.0546, + "step": 6486 + }, + { + "epoch": 0.2, + "learning_rate": 4.649720128950045e-06, + "loss": 1.3011, + "step": 6487 + }, + { + "epoch": 0.2, + "learning_rate": 4.649595601764799e-06, + "loss": 1.1349, + "step": 6488 + }, + { + "epoch": 0.2, + "learning_rate": 4.649471054116438e-06, + "loss": 1.1378, + "step": 6489 + }, + { + "epoch": 0.2, + "learning_rate": 4.649346486006148e-06, + "loss": 1.1547, + "step": 6490 + }, + { + "epoch": 0.2, + "learning_rate": 4.6492218974351145e-06, + "loss": 1.1117, + "step": 6491 + }, + { + "epoch": 0.2, + "learning_rate": 4.649097288404523e-06, + "loss": 1.1149, + "step": 6492 + }, + { + "epoch": 0.2, + "learning_rate": 4.648972658915562e-06, + "loss": 1.1061, + "step": 6493 + }, + { + "epoch": 0.2, + "learning_rate": 4.648848008969415e-06, + "loss": 1.2819, + "step": 6494 + }, + { + "epoch": 0.2, + "learning_rate": 4.6487233385672705e-06, + "loss": 1.1508, + "step": 6495 + }, + { + "epoch": 0.2, + "learning_rate": 4.648598647710314e-06, + "loss": 1.1783, + "step": 6496 + }, + { + "epoch": 0.2, + "learning_rate": 4.6484739363997334e-06, + "loss": 1.0952, + "step": 6497 + }, + { + "epoch": 0.2, + "learning_rate": 4.648349204636717e-06, + "loss": 1.1713, + "step": 6498 + }, + { + "epoch": 0.2, + "learning_rate": 4.648224452422448e-06, + "loss": 1.1146, + "step": 6499 + }, + { + "epoch": 0.2, + "learning_rate": 4.648099679758119e-06, + "loss": 1.1114, + "step": 6500 + }, + { + "epoch": 0.2, + "learning_rate": 4.647974886644916e-06, + "loss": 1.1121, + "step": 6501 + }, + { + "epoch": 0.2, + "learning_rate": 4.6478500730840244e-06, + "loss": 1.1425, + "step": 6502 + }, + { + "epoch": 0.2, + "learning_rate": 4.647725239076636e-06, + "loss": 1.0457, + "step": 6503 + }, + { + "epoch": 0.2, + "learning_rate": 4.647600384623938e-06, + "loss": 1.1294, + "step": 6504 + }, + { + "epoch": 0.2, + "learning_rate": 4.6474755097271185e-06, + "loss": 1.1575, + "step": 6505 + }, + { + "epoch": 0.2, + "learning_rate": 4.6473506143873655e-06, + "loss": 1.109, + "step": 6506 + }, + { + "epoch": 0.2, + "learning_rate": 4.647225698605869e-06, + "loss": 1.1056, + "step": 6507 + }, + { + "epoch": 0.2, + "learning_rate": 4.647100762383819e-06, + "loss": 1.122, + "step": 6508 + }, + { + "epoch": 0.2, + "learning_rate": 4.646975805722404e-06, + "loss": 1.1921, + "step": 6509 + }, + { + "epoch": 0.2, + "learning_rate": 4.646850828622812e-06, + "loss": 1.1771, + "step": 6510 + }, + { + "epoch": 0.2, + "learning_rate": 4.646725831086235e-06, + "loss": 1.1516, + "step": 6511 + }, + { + "epoch": 0.2, + "learning_rate": 4.6466008131138616e-06, + "loss": 1.2342, + "step": 6512 + }, + { + "epoch": 0.2, + "learning_rate": 4.646475774706882e-06, + "loss": 1.1928, + "step": 6513 + }, + { + "epoch": 0.2, + "learning_rate": 4.646350715866488e-06, + "loss": 1.1842, + "step": 6514 + }, + { + "epoch": 0.2, + "learning_rate": 4.646225636593867e-06, + "loss": 1.2189, + "step": 6515 + }, + { + "epoch": 0.2, + "learning_rate": 4.6461005368902135e-06, + "loss": 1.0963, + "step": 6516 + }, + { + "epoch": 0.2, + "learning_rate": 4.645975416756715e-06, + "loss": 1.2164, + "step": 6517 + }, + { + "epoch": 0.2, + "learning_rate": 4.6458502761945655e-06, + "loss": 1.1509, + "step": 6518 + }, + { + "epoch": 0.2, + "learning_rate": 4.645725115204954e-06, + "loss": 1.222, + "step": 6519 + }, + { + "epoch": 0.2, + "learning_rate": 4.645599933789072e-06, + "loss": 1.1953, + "step": 6520 + }, + { + "epoch": 0.2, + "learning_rate": 4.645474731948113e-06, + "loss": 1.0972, + "step": 6521 + }, + { + "epoch": 0.2, + "learning_rate": 4.645349509683268e-06, + "loss": 1.1224, + "step": 6522 + }, + { + "epoch": 0.2, + "learning_rate": 4.645224266995729e-06, + "loss": 1.1941, + "step": 6523 + }, + { + "epoch": 0.2, + "learning_rate": 4.645099003886688e-06, + "loss": 1.2103, + "step": 6524 + }, + { + "epoch": 0.2, + "learning_rate": 4.644973720357338e-06, + "loss": 1.208, + "step": 6525 + }, + { + "epoch": 0.2, + "learning_rate": 4.64484841640887e-06, + "loss": 1.1377, + "step": 6526 + }, + { + "epoch": 0.2, + "learning_rate": 4.644723092042479e-06, + "loss": 1.1297, + "step": 6527 + }, + { + "epoch": 0.2, + "learning_rate": 4.644597747259356e-06, + "loss": 1.0501, + "step": 6528 + }, + { + "epoch": 0.2, + "learning_rate": 4.644472382060696e-06, + "loss": 1.1139, + "step": 6529 + }, + { + "epoch": 0.2, + "learning_rate": 4.644346996447692e-06, + "loss": 1.1168, + "step": 6530 + }, + { + "epoch": 0.2, + "learning_rate": 4.644221590421537e-06, + "loss": 1.1234, + "step": 6531 + }, + { + "epoch": 0.2, + "learning_rate": 4.644096163983426e-06, + "loss": 1.147, + "step": 6532 + }, + { + "epoch": 0.2, + "learning_rate": 4.6439707171345515e-06, + "loss": 1.1333, + "step": 6533 + }, + { + "epoch": 0.2, + "learning_rate": 4.643845249876109e-06, + "loss": 1.0096, + "step": 6534 + }, + { + "epoch": 0.2, + "learning_rate": 4.643719762209291e-06, + "loss": 1.1662, + "step": 6535 + }, + { + "epoch": 0.2, + "learning_rate": 4.6435942541352945e-06, + "loss": 1.1241, + "step": 6536 + }, + { + "epoch": 0.2, + "learning_rate": 4.643468725655312e-06, + "loss": 1.2147, + "step": 6537 + }, + { + "epoch": 0.2, + "learning_rate": 4.643343176770539e-06, + "loss": 1.1275, + "step": 6538 + }, + { + "epoch": 0.2, + "learning_rate": 4.643217607482173e-06, + "loss": 1.2446, + "step": 6539 + }, + { + "epoch": 0.2, + "learning_rate": 4.643092017791407e-06, + "loss": 1.0646, + "step": 6540 + }, + { + "epoch": 0.2, + "learning_rate": 4.6429664076994375e-06, + "loss": 1.1403, + "step": 6541 + }, + { + "epoch": 0.2, + "learning_rate": 4.642840777207459e-06, + "loss": 1.1469, + "step": 6542 + }, + { + "epoch": 0.2, + "learning_rate": 4.642715126316669e-06, + "loss": 1.1619, + "step": 6543 + }, + { + "epoch": 0.2, + "learning_rate": 4.642589455028263e-06, + "loss": 1.1624, + "step": 6544 + }, + { + "epoch": 0.2, + "learning_rate": 4.642463763343436e-06, + "loss": 1.132, + "step": 6545 + }, + { + "epoch": 0.2, + "learning_rate": 4.642338051263387e-06, + "loss": 1.0916, + "step": 6546 + }, + { + "epoch": 0.2, + "learning_rate": 4.642212318789311e-06, + "loss": 1.1855, + "step": 6547 + }, + { + "epoch": 0.2, + "learning_rate": 4.6420865659224065e-06, + "loss": 1.1411, + "step": 6548 + }, + { + "epoch": 0.2, + "learning_rate": 4.641960792663869e-06, + "loss": 1.0718, + "step": 6549 + }, + { + "epoch": 0.2, + "learning_rate": 4.641834999014896e-06, + "loss": 1.0993, + "step": 6550 + }, + { + "epoch": 0.2, + "learning_rate": 4.641709184976685e-06, + "loss": 1.2005, + "step": 6551 + }, + { + "epoch": 0.2, + "learning_rate": 4.641583350550435e-06, + "loss": 1.1191, + "step": 6552 + }, + { + "epoch": 0.2, + "learning_rate": 4.641457495737342e-06, + "loss": 1.0878, + "step": 6553 + }, + { + "epoch": 0.2, + "learning_rate": 4.641331620538606e-06, + "loss": 1.0281, + "step": 6554 + }, + { + "epoch": 0.2, + "learning_rate": 4.641205724955424e-06, + "loss": 1.1522, + "step": 6555 + }, + { + "epoch": 0.2, + "learning_rate": 4.641079808988994e-06, + "loss": 1.2603, + "step": 6556 + }, + { + "epoch": 0.2, + "learning_rate": 4.640953872640516e-06, + "loss": 1.1884, + "step": 6557 + }, + { + "epoch": 0.2, + "learning_rate": 4.640827915911188e-06, + "loss": 1.0817, + "step": 6558 + }, + { + "epoch": 0.2, + "learning_rate": 4.64070193880221e-06, + "loss": 1.2012, + "step": 6559 + }, + { + "epoch": 0.2, + "learning_rate": 4.64057594131478e-06, + "loss": 1.1287, + "step": 6560 + }, + { + "epoch": 0.2, + "learning_rate": 4.640449923450098e-06, + "loss": 1.1721, + "step": 6561 + }, + { + "epoch": 0.2, + "learning_rate": 4.640323885209363e-06, + "loss": 1.0233, + "step": 6562 + }, + { + "epoch": 0.2, + "learning_rate": 4.6401978265937765e-06, + "loss": 1.149, + "step": 6563 + }, + { + "epoch": 0.2, + "learning_rate": 4.640071747604537e-06, + "loss": 1.1736, + "step": 6564 + }, + { + "epoch": 0.2, + "learning_rate": 4.639945648242845e-06, + "loss": 1.1611, + "step": 6565 + }, + { + "epoch": 0.2, + "learning_rate": 4.639819528509901e-06, + "loss": 1.1732, + "step": 6566 + }, + { + "epoch": 0.2, + "learning_rate": 4.639693388406906e-06, + "loss": 1.1744, + "step": 6567 + }, + { + "epoch": 0.2, + "learning_rate": 4.63956722793506e-06, + "loss": 1.0314, + "step": 6568 + }, + { + "epoch": 0.2, + "learning_rate": 4.639441047095565e-06, + "loss": 1.0974, + "step": 6569 + }, + { + "epoch": 0.2, + "learning_rate": 4.639314845889622e-06, + "loss": 1.0571, + "step": 6570 + }, + { + "epoch": 0.2, + "learning_rate": 4.639188624318431e-06, + "loss": 1.1373, + "step": 6571 + }, + { + "epoch": 0.2, + "learning_rate": 4.639062382383195e-06, + "loss": 1.3024, + "step": 6572 + }, + { + "epoch": 0.2, + "learning_rate": 4.638936120085115e-06, + "loss": 1.205, + "step": 6573 + }, + { + "epoch": 0.2, + "learning_rate": 4.638809837425394e-06, + "loss": 1.188, + "step": 6574 + }, + { + "epoch": 0.2, + "learning_rate": 4.638683534405233e-06, + "loss": 1.2054, + "step": 6575 + }, + { + "epoch": 0.2, + "learning_rate": 4.638557211025835e-06, + "loss": 1.1296, + "step": 6576 + }, + { + "epoch": 0.2, + "learning_rate": 4.638430867288402e-06, + "loss": 1.1488, + "step": 6577 + }, + { + "epoch": 0.2, + "learning_rate": 4.638304503194137e-06, + "loss": 1.1835, + "step": 6578 + }, + { + "epoch": 0.2, + "learning_rate": 4.6381781187442425e-06, + "loss": 1.2279, + "step": 6579 + }, + { + "epoch": 0.2, + "learning_rate": 4.638051713939923e-06, + "loss": 1.1982, + "step": 6580 + }, + { + "epoch": 0.2, + "learning_rate": 4.637925288782381e-06, + "loss": 1.0681, + "step": 6581 + }, + { + "epoch": 0.2, + "learning_rate": 4.637798843272819e-06, + "loss": 1.1772, + "step": 6582 + }, + { + "epoch": 0.2, + "learning_rate": 4.637672377412442e-06, + "loss": 1.0604, + "step": 6583 + }, + { + "epoch": 0.2, + "learning_rate": 4.637545891202454e-06, + "loss": 1.1252, + "step": 6584 + }, + { + "epoch": 0.2, + "learning_rate": 4.637419384644058e-06, + "loss": 1.2355, + "step": 6585 + }, + { + "epoch": 0.2, + "learning_rate": 4.637292857738459e-06, + "loss": 1.1322, + "step": 6586 + }, + { + "epoch": 0.2, + "learning_rate": 4.637166310486861e-06, + "loss": 1.3287, + "step": 6587 + }, + { + "epoch": 0.2, + "learning_rate": 4.63703974289047e-06, + "loss": 1.1775, + "step": 6588 + }, + { + "epoch": 0.2, + "learning_rate": 4.636913154950489e-06, + "loss": 1.1455, + "step": 6589 + }, + { + "epoch": 0.2, + "learning_rate": 4.636786546668125e-06, + "loss": 1.1683, + "step": 6590 + }, + { + "epoch": 0.2, + "learning_rate": 4.636659918044581e-06, + "loss": 1.0551, + "step": 6591 + }, + { + "epoch": 0.2, + "learning_rate": 4.6365332690810635e-06, + "loss": 1.1669, + "step": 6592 + }, + { + "epoch": 0.2, + "learning_rate": 4.636406599778779e-06, + "loss": 1.1301, + "step": 6593 + }, + { + "epoch": 0.2, + "learning_rate": 4.636279910138933e-06, + "loss": 1.1796, + "step": 6594 + }, + { + "epoch": 0.2, + "learning_rate": 4.6361532001627305e-06, + "loss": 1.2083, + "step": 6595 + }, + { + "epoch": 0.2, + "learning_rate": 4.636026469851379e-06, + "loss": 1.1459, + "step": 6596 + }, + { + "epoch": 0.2, + "learning_rate": 4.6358997192060826e-06, + "loss": 1.07, + "step": 6597 + }, + { + "epoch": 0.2, + "learning_rate": 4.635772948228051e-06, + "loss": 1.1901, + "step": 6598 + }, + { + "epoch": 0.2, + "learning_rate": 4.63564615691849e-06, + "loss": 1.0654, + "step": 6599 + }, + { + "epoch": 0.2, + "learning_rate": 4.6355193452786045e-06, + "loss": 1.1463, + "step": 6600 + }, + { + "epoch": 0.2, + "learning_rate": 4.635392513309605e-06, + "loss": 1.0695, + "step": 6601 + }, + { + "epoch": 0.2, + "learning_rate": 4.6352656610126955e-06, + "loss": 1.2184, + "step": 6602 + }, + { + "epoch": 0.2, + "learning_rate": 4.635138788389087e-06, + "loss": 1.2266, + "step": 6603 + }, + { + "epoch": 0.2, + "learning_rate": 4.635011895439984e-06, + "loss": 1.1367, + "step": 6604 + }, + { + "epoch": 0.2, + "learning_rate": 4.634884982166596e-06, + "loss": 1.2079, + "step": 6605 + }, + { + "epoch": 0.2, + "learning_rate": 4.634758048570132e-06, + "loss": 1.21, + "step": 6606 + }, + { + "epoch": 0.2, + "learning_rate": 4.6346310946518e-06, + "loss": 1.2242, + "step": 6607 + }, + { + "epoch": 0.2, + "learning_rate": 4.634504120412807e-06, + "loss": 1.1139, + "step": 6608 + }, + { + "epoch": 0.2, + "learning_rate": 4.634377125854363e-06, + "loss": 1.2144, + "step": 6609 + }, + { + "epoch": 0.2, + "learning_rate": 4.634250110977678e-06, + "loss": 1.2016, + "step": 6610 + }, + { + "epoch": 0.2, + "learning_rate": 4.634123075783958e-06, + "loss": 1.3132, + "step": 6611 + }, + { + "epoch": 0.2, + "learning_rate": 4.633996020274415e-06, + "loss": 1.2676, + "step": 6612 + }, + { + "epoch": 0.2, + "learning_rate": 4.633868944450258e-06, + "loss": 1.1647, + "step": 6613 + }, + { + "epoch": 0.2, + "learning_rate": 4.633741848312696e-06, + "loss": 1.0416, + "step": 6614 + }, + { + "epoch": 0.2, + "learning_rate": 4.6336147318629395e-06, + "loss": 1.1407, + "step": 6615 + }, + { + "epoch": 0.2, + "learning_rate": 4.633487595102198e-06, + "loss": 1.1558, + "step": 6616 + }, + { + "epoch": 0.2, + "learning_rate": 4.633360438031682e-06, + "loss": 1.1115, + "step": 6617 + }, + { + "epoch": 0.2, + "learning_rate": 4.633233260652602e-06, + "loss": 1.1548, + "step": 6618 + }, + { + "epoch": 0.2, + "learning_rate": 4.63310606296617e-06, + "loss": 1.1301, + "step": 6619 + }, + { + "epoch": 0.2, + "learning_rate": 4.6329788449735935e-06, + "loss": 1.0604, + "step": 6620 + }, + { + "epoch": 0.2, + "learning_rate": 4.6328516066760874e-06, + "loss": 1.1842, + "step": 6621 + }, + { + "epoch": 0.2, + "learning_rate": 4.632724348074861e-06, + "loss": 1.2369, + "step": 6622 + }, + { + "epoch": 0.2, + "learning_rate": 4.632597069171125e-06, + "loss": 1.251, + "step": 6623 + }, + { + "epoch": 0.2, + "learning_rate": 4.632469769966093e-06, + "loss": 1.2104, + "step": 6624 + }, + { + "epoch": 0.2, + "learning_rate": 4.632342450460975e-06, + "loss": 1.0437, + "step": 6625 + }, + { + "epoch": 0.2, + "learning_rate": 4.6322151106569844e-06, + "loss": 1.1103, + "step": 6626 + }, + { + "epoch": 0.2, + "learning_rate": 4.6320877505553325e-06, + "loss": 1.1885, + "step": 6627 + }, + { + "epoch": 0.2, + "learning_rate": 4.631960370157232e-06, + "loss": 1.1204, + "step": 6628 + }, + { + "epoch": 0.2, + "learning_rate": 4.631832969463896e-06, + "loss": 1.1393, + "step": 6629 + }, + { + "epoch": 0.2, + "learning_rate": 4.631705548476537e-06, + "loss": 1.1769, + "step": 6630 + }, + { + "epoch": 0.2, + "learning_rate": 4.631578107196367e-06, + "loss": 1.2633, + "step": 6631 + }, + { + "epoch": 0.2, + "learning_rate": 4.631450645624601e-06, + "loss": 1.2109, + "step": 6632 + }, + { + "epoch": 0.2, + "learning_rate": 4.631323163762451e-06, + "loss": 1.1412, + "step": 6633 + }, + { + "epoch": 0.2, + "learning_rate": 4.631195661611131e-06, + "loss": 1.1655, + "step": 6634 + }, + { + "epoch": 0.2, + "learning_rate": 4.631068139171855e-06, + "loss": 1.1516, + "step": 6635 + }, + { + "epoch": 0.2, + "learning_rate": 4.630940596445835e-06, + "loss": 1.1187, + "step": 6636 + }, + { + "epoch": 0.2, + "learning_rate": 4.630813033434289e-06, + "loss": 1.1961, + "step": 6637 + }, + { + "epoch": 0.2, + "learning_rate": 4.630685450138428e-06, + "loss": 1.0699, + "step": 6638 + }, + { + "epoch": 0.2, + "learning_rate": 4.630557846559468e-06, + "loss": 1.1594, + "step": 6639 + }, + { + "epoch": 0.2, + "learning_rate": 4.630430222698623e-06, + "loss": 0.9834, + "step": 6640 + }, + { + "epoch": 0.2, + "learning_rate": 4.630302578557109e-06, + "loss": 1.0652, + "step": 6641 + }, + { + "epoch": 0.2, + "learning_rate": 4.63017491413614e-06, + "loss": 1.1716, + "step": 6642 + }, + { + "epoch": 0.2, + "learning_rate": 4.6300472294369325e-06, + "loss": 1.269, + "step": 6643 + }, + { + "epoch": 0.2, + "learning_rate": 4.6299195244607e-06, + "loss": 1.2179, + "step": 6644 + }, + { + "epoch": 0.2, + "learning_rate": 4.62979179920866e-06, + "loss": 1.1152, + "step": 6645 + }, + { + "epoch": 0.2, + "learning_rate": 4.629664053682028e-06, + "loss": 1.0372, + "step": 6646 + }, + { + "epoch": 0.2, + "learning_rate": 4.62953628788202e-06, + "loss": 1.1129, + "step": 6647 + }, + { + "epoch": 0.2, + "learning_rate": 4.629408501809852e-06, + "loss": 1.1233, + "step": 6648 + }, + { + "epoch": 0.2, + "learning_rate": 4.62928069546674e-06, + "loss": 1.2961, + "step": 6649 + }, + { + "epoch": 0.2, + "learning_rate": 4.629152868853903e-06, + "loss": 1.2009, + "step": 6650 + }, + { + "epoch": 0.2, + "learning_rate": 4.629025021972554e-06, + "loss": 1.3302, + "step": 6651 + }, + { + "epoch": 0.2, + "learning_rate": 4.6288971548239135e-06, + "loss": 1.2111, + "step": 6652 + }, + { + "epoch": 0.2, + "learning_rate": 4.628769267409197e-06, + "loss": 1.2129, + "step": 6653 + }, + { + "epoch": 0.2, + "learning_rate": 4.628641359729622e-06, + "loss": 1.1762, + "step": 6654 + }, + { + "epoch": 0.2, + "learning_rate": 4.6285134317864065e-06, + "loss": 1.1668, + "step": 6655 + }, + { + "epoch": 0.2, + "learning_rate": 4.628385483580769e-06, + "loss": 1.1376, + "step": 6656 + }, + { + "epoch": 0.2, + "learning_rate": 4.628257515113926e-06, + "loss": 1.1445, + "step": 6657 + }, + { + "epoch": 0.2, + "learning_rate": 4.628129526387097e-06, + "loss": 1.1908, + "step": 6658 + }, + { + "epoch": 0.2, + "learning_rate": 4.6280015174015e-06, + "loss": 1.2559, + "step": 6659 + }, + { + "epoch": 0.2, + "learning_rate": 4.627873488158353e-06, + "loss": 1.117, + "step": 6660 + }, + { + "epoch": 0.2, + "learning_rate": 4.627745438658875e-06, + "loss": 1.0901, + "step": 6661 + }, + { + "epoch": 0.2, + "learning_rate": 4.6276173689042855e-06, + "loss": 1.3143, + "step": 6662 + }, + { + "epoch": 0.2, + "learning_rate": 4.627489278895804e-06, + "loss": 1.1906, + "step": 6663 + }, + { + "epoch": 0.2, + "learning_rate": 4.627361168634648e-06, + "loss": 1.1654, + "step": 6664 + }, + { + "epoch": 0.2, + "learning_rate": 4.627233038122039e-06, + "loss": 1.1711, + "step": 6665 + }, + { + "epoch": 0.2, + "learning_rate": 4.627104887359195e-06, + "loss": 1.069, + "step": 6666 + }, + { + "epoch": 0.2, + "learning_rate": 4.6269767163473375e-06, + "loss": 1.1069, + "step": 6667 + }, + { + "epoch": 0.2, + "learning_rate": 4.626848525087687e-06, + "loss": 1.0264, + "step": 6668 + }, + { + "epoch": 0.2, + "learning_rate": 4.626720313581462e-06, + "loss": 1.0717, + "step": 6669 + }, + { + "epoch": 0.2, + "learning_rate": 4.626592081829883e-06, + "loss": 1.1658, + "step": 6670 + }, + { + "epoch": 0.2, + "learning_rate": 4.626463829834174e-06, + "loss": 1.1357, + "step": 6671 + }, + { + "epoch": 0.2, + "learning_rate": 4.626335557595552e-06, + "loss": 1.141, + "step": 6672 + }, + { + "epoch": 0.2, + "learning_rate": 4.626207265115239e-06, + "loss": 1.1829, + "step": 6673 + }, + { + "epoch": 0.2, + "learning_rate": 4.626078952394457e-06, + "loss": 1.1937, + "step": 6674 + }, + { + "epoch": 0.2, + "learning_rate": 4.625950619434428e-06, + "loss": 1.1081, + "step": 6675 + }, + { + "epoch": 0.2, + "learning_rate": 4.625822266236373e-06, + "loss": 1.2022, + "step": 6676 + }, + { + "epoch": 0.2, + "learning_rate": 4.625693892801513e-06, + "loss": 1.1769, + "step": 6677 + }, + { + "epoch": 0.2, + "learning_rate": 4.625565499131071e-06, + "loss": 1.1104, + "step": 6678 + }, + { + "epoch": 0.2, + "learning_rate": 4.62543708522627e-06, + "loss": 1.1611, + "step": 6679 + }, + { + "epoch": 0.2, + "learning_rate": 4.625308651088332e-06, + "loss": 1.2627, + "step": 6680 + }, + { + "epoch": 0.2, + "learning_rate": 4.625180196718479e-06, + "loss": 1.2377, + "step": 6681 + }, + { + "epoch": 0.2, + "learning_rate": 4.625051722117932e-06, + "loss": 1.1228, + "step": 6682 + }, + { + "epoch": 0.2, + "learning_rate": 4.624923227287918e-06, + "loss": 1.0963, + "step": 6683 + }, + { + "epoch": 0.2, + "learning_rate": 4.624794712229657e-06, + "loss": 1.0663, + "step": 6684 + }, + { + "epoch": 0.2, + "learning_rate": 4.624666176944376e-06, + "loss": 1.0696, + "step": 6685 + }, + { + "epoch": 0.2, + "learning_rate": 4.624537621433295e-06, + "loss": 1.1214, + "step": 6686 + }, + { + "epoch": 0.2, + "learning_rate": 4.624409045697639e-06, + "loss": 1.0966, + "step": 6687 + }, + { + "epoch": 0.2, + "learning_rate": 4.624280449738631e-06, + "loss": 1.1366, + "step": 6688 + }, + { + "epoch": 0.2, + "learning_rate": 4.624151833557497e-06, + "loss": 1.0776, + "step": 6689 + }, + { + "epoch": 0.2, + "learning_rate": 4.624023197155461e-06, + "loss": 1.1625, + "step": 6690 + }, + { + "epoch": 0.2, + "learning_rate": 4.623894540533747e-06, + "loss": 1.1073, + "step": 6691 + }, + { + "epoch": 0.2, + "learning_rate": 4.623765863693579e-06, + "loss": 1.1711, + "step": 6692 + }, + { + "epoch": 0.2, + "learning_rate": 4.623637166636184e-06, + "loss": 1.1414, + "step": 6693 + }, + { + "epoch": 0.2, + "learning_rate": 4.623508449362785e-06, + "loss": 1.0314, + "step": 6694 + }, + { + "epoch": 0.2, + "learning_rate": 4.623379711874609e-06, + "loss": 1.1408, + "step": 6695 + }, + { + "epoch": 0.2, + "learning_rate": 4.623250954172881e-06, + "loss": 1.1073, + "step": 6696 + }, + { + "epoch": 0.2, + "learning_rate": 4.623122176258826e-06, + "loss": 1.1188, + "step": 6697 + }, + { + "epoch": 0.2, + "learning_rate": 4.62299337813367e-06, + "loss": 1.3013, + "step": 6698 + }, + { + "epoch": 0.2, + "learning_rate": 4.62286455979864e-06, + "loss": 1.2894, + "step": 6699 + }, + { + "epoch": 0.2, + "learning_rate": 4.622735721254962e-06, + "loss": 1.1348, + "step": 6700 + }, + { + "epoch": 0.2, + "learning_rate": 4.622606862503862e-06, + "loss": 1.1472, + "step": 6701 + }, + { + "epoch": 0.2, + "learning_rate": 4.622477983546567e-06, + "loss": 1.1879, + "step": 6702 + }, + { + "epoch": 0.2, + "learning_rate": 4.622349084384304e-06, + "loss": 1.1716, + "step": 6703 + }, + { + "epoch": 0.2, + "learning_rate": 4.6222201650183e-06, + "loss": 1.112, + "step": 6704 + }, + { + "epoch": 0.2, + "learning_rate": 4.622091225449781e-06, + "loss": 1.1744, + "step": 6705 + }, + { + "epoch": 0.2, + "learning_rate": 4.621962265679977e-06, + "loss": 1.203, + "step": 6706 + }, + { + "epoch": 0.2, + "learning_rate": 4.621833285710113e-06, + "loss": 1.1868, + "step": 6707 + }, + { + "epoch": 0.2, + "learning_rate": 4.621704285541419e-06, + "loss": 1.1667, + "step": 6708 + }, + { + "epoch": 0.2, + "learning_rate": 4.621575265175122e-06, + "loss": 1.0308, + "step": 6709 + }, + { + "epoch": 0.2, + "learning_rate": 4.62144622461245e-06, + "loss": 1.1331, + "step": 6710 + }, + { + "epoch": 0.2, + "learning_rate": 4.6213171638546315e-06, + "loss": 1.2186, + "step": 6711 + }, + { + "epoch": 0.2, + "learning_rate": 4.621188082902895e-06, + "loss": 1.1266, + "step": 6712 + }, + { + "epoch": 0.2, + "learning_rate": 4.6210589817584704e-06, + "loss": 1.0571, + "step": 6713 + }, + { + "epoch": 0.2, + "learning_rate": 4.620929860422585e-06, + "loss": 1.1523, + "step": 6714 + }, + { + "epoch": 0.2, + "learning_rate": 4.6208007188964685e-06, + "loss": 1.1729, + "step": 6715 + }, + { + "epoch": 0.2, + "learning_rate": 4.620671557181352e-06, + "loss": 1.0538, + "step": 6716 + }, + { + "epoch": 0.2, + "learning_rate": 4.620542375278463e-06, + "loss": 1.1679, + "step": 6717 + }, + { + "epoch": 0.2, + "learning_rate": 4.620413173189031e-06, + "loss": 1.0429, + "step": 6718 + }, + { + "epoch": 0.2, + "learning_rate": 4.620283950914287e-06, + "loss": 1.1013, + "step": 6719 + }, + { + "epoch": 0.2, + "learning_rate": 4.620154708455462e-06, + "loss": 1.1149, + "step": 6720 + }, + { + "epoch": 0.2, + "learning_rate": 4.620025445813785e-06, + "loss": 1.1693, + "step": 6721 + }, + { + "epoch": 0.2, + "learning_rate": 4.619896162990487e-06, + "loss": 1.1819, + "step": 6722 + }, + { + "epoch": 0.2, + "learning_rate": 4.619766859986797e-06, + "loss": 1.0968, + "step": 6723 + }, + { + "epoch": 0.2, + "learning_rate": 4.619637536803949e-06, + "loss": 1.1539, + "step": 6724 + }, + { + "epoch": 0.2, + "learning_rate": 4.619508193443172e-06, + "loss": 1.1703, + "step": 6725 + }, + { + "epoch": 0.2, + "learning_rate": 4.619378829905698e-06, + "loss": 1.1324, + "step": 6726 + }, + { + "epoch": 0.2, + "learning_rate": 4.619249446192758e-06, + "loss": 1.2416, + "step": 6727 + }, + { + "epoch": 0.2, + "learning_rate": 4.619120042305584e-06, + "loss": 1.1166, + "step": 6728 + }, + { + "epoch": 0.2, + "learning_rate": 4.618990618245407e-06, + "loss": 1.1979, + "step": 6729 + }, + { + "epoch": 0.2, + "learning_rate": 4.618861174013462e-06, + "loss": 1.2772, + "step": 6730 + }, + { + "epoch": 0.2, + "learning_rate": 4.618731709610977e-06, + "loss": 1.3169, + "step": 6731 + }, + { + "epoch": 0.2, + "learning_rate": 4.618602225039187e-06, + "loss": 1.1354, + "step": 6732 + }, + { + "epoch": 0.2, + "learning_rate": 4.6184727202993246e-06, + "loss": 1.1248, + "step": 6733 + }, + { + "epoch": 0.2, + "learning_rate": 4.618343195392621e-06, + "loss": 1.2361, + "step": 6734 + }, + { + "epoch": 0.2, + "learning_rate": 4.6182136503203126e-06, + "loss": 1.2935, + "step": 6735 + }, + { + "epoch": 0.2, + "learning_rate": 4.618084085083629e-06, + "loss": 1.2274, + "step": 6736 + }, + { + "epoch": 0.2, + "learning_rate": 4.617954499683805e-06, + "loss": 1.267, + "step": 6737 + }, + { + "epoch": 0.2, + "learning_rate": 4.617824894122075e-06, + "loss": 1.183, + "step": 6738 + }, + { + "epoch": 0.2, + "learning_rate": 4.617695268399671e-06, + "loss": 1.1749, + "step": 6739 + }, + { + "epoch": 0.2, + "learning_rate": 4.617565622517829e-06, + "loss": 1.1033, + "step": 6740 + }, + { + "epoch": 0.2, + "learning_rate": 4.617435956477781e-06, + "loss": 1.1224, + "step": 6741 + }, + { + "epoch": 0.2, + "learning_rate": 4.617306270280763e-06, + "loss": 1.1791, + "step": 6742 + }, + { + "epoch": 0.2, + "learning_rate": 4.6171765639280095e-06, + "loss": 1.1437, + "step": 6743 + }, + { + "epoch": 0.2, + "learning_rate": 4.617046837420755e-06, + "loss": 1.1282, + "step": 6744 + }, + { + "epoch": 0.2, + "learning_rate": 4.616917090760232e-06, + "loss": 1.1745, + "step": 6745 + }, + { + "epoch": 0.2, + "learning_rate": 4.61678732394768e-06, + "loss": 1.1023, + "step": 6746 + }, + { + "epoch": 0.2, + "learning_rate": 4.616657536984331e-06, + "loss": 1.1193, + "step": 6747 + }, + { + "epoch": 0.2, + "learning_rate": 4.616527729871423e-06, + "loss": 1.3279, + "step": 6748 + }, + { + "epoch": 0.2, + "learning_rate": 4.61639790261019e-06, + "loss": 1.2006, + "step": 6749 + }, + { + "epoch": 0.2, + "learning_rate": 4.6162680552018674e-06, + "loss": 1.2841, + "step": 6750 + }, + { + "epoch": 0.2, + "learning_rate": 4.6161381876476925e-06, + "loss": 1.0848, + "step": 6751 + }, + { + "epoch": 0.2, + "learning_rate": 4.6160082999489014e-06, + "loss": 1.1678, + "step": 6752 + }, + { + "epoch": 0.2, + "learning_rate": 4.61587839210673e-06, + "loss": 1.1088, + "step": 6753 + }, + { + "epoch": 0.2, + "learning_rate": 4.615748464122416e-06, + "loss": 1.1514, + "step": 6754 + }, + { + "epoch": 0.2, + "learning_rate": 4.615618515997196e-06, + "loss": 1.1161, + "step": 6755 + }, + { + "epoch": 0.2, + "learning_rate": 4.615488547732305e-06, + "loss": 1.2732, + "step": 6756 + }, + { + "epoch": 0.2, + "learning_rate": 4.6153585593289825e-06, + "loss": 1.0648, + "step": 6757 + }, + { + "epoch": 0.2, + "learning_rate": 4.615228550788466e-06, + "loss": 1.2557, + "step": 6758 + }, + { + "epoch": 0.2, + "learning_rate": 4.615098522111992e-06, + "loss": 1.167, + "step": 6759 + }, + { + "epoch": 0.2, + "learning_rate": 4.6149684733007985e-06, + "loss": 1.1243, + "step": 6760 + }, + { + "epoch": 0.2, + "learning_rate": 4.614838404356124e-06, + "loss": 1.0861, + "step": 6761 + }, + { + "epoch": 0.2, + "learning_rate": 4.6147083152792064e-06, + "loss": 1.1375, + "step": 6762 + }, + { + "epoch": 0.2, + "learning_rate": 4.614578206071284e-06, + "loss": 1.1458, + "step": 6763 + }, + { + "epoch": 0.2, + "learning_rate": 4.6144480767335955e-06, + "loss": 1.1053, + "step": 6764 + }, + { + "epoch": 0.2, + "learning_rate": 4.61431792726738e-06, + "loss": 1.0768, + "step": 6765 + }, + { + "epoch": 0.2, + "learning_rate": 4.614187757673876e-06, + "loss": 1.2261, + "step": 6766 + }, + { + "epoch": 0.2, + "learning_rate": 4.614057567954323e-06, + "loss": 1.1862, + "step": 6767 + }, + { + "epoch": 0.2, + "learning_rate": 4.61392735810996e-06, + "loss": 1.1287, + "step": 6768 + }, + { + "epoch": 0.2, + "learning_rate": 4.613797128142026e-06, + "loss": 1.2103, + "step": 6769 + }, + { + "epoch": 0.2, + "learning_rate": 4.613666878051762e-06, + "loss": 1.1317, + "step": 6770 + }, + { + "epoch": 0.2, + "learning_rate": 4.613536607840406e-06, + "loss": 1.0903, + "step": 6771 + }, + { + "epoch": 0.2, + "learning_rate": 4.613406317509201e-06, + "loss": 1.0356, + "step": 6772 + }, + { + "epoch": 0.2, + "learning_rate": 4.613276007059386e-06, + "loss": 1.1151, + "step": 6773 + }, + { + "epoch": 0.2, + "learning_rate": 4.6131456764922e-06, + "loss": 1.139, + "step": 6774 + }, + { + "epoch": 0.2, + "learning_rate": 4.613015325808885e-06, + "loss": 1.1478, + "step": 6775 + }, + { + "epoch": 0.2, + "learning_rate": 4.612884955010683e-06, + "loss": 1.0902, + "step": 6776 + }, + { + "epoch": 0.2, + "learning_rate": 4.612754564098833e-06, + "loss": 1.0364, + "step": 6777 + }, + { + "epoch": 0.2, + "learning_rate": 4.6126241530745765e-06, + "loss": 1.1536, + "step": 6778 + }, + { + "epoch": 0.2, + "learning_rate": 4.612493721939156e-06, + "loss": 1.1719, + "step": 6779 + }, + { + "epoch": 0.2, + "learning_rate": 4.612363270693812e-06, + "loss": 1.1097, + "step": 6780 + }, + { + "epoch": 0.2, + "learning_rate": 4.612232799339789e-06, + "loss": 1.1168, + "step": 6781 + }, + { + "epoch": 0.2, + "learning_rate": 4.612102307878325e-06, + "loss": 1.1505, + "step": 6782 + }, + { + "epoch": 0.2, + "learning_rate": 4.611971796310665e-06, + "loss": 1.1444, + "step": 6783 + }, + { + "epoch": 0.2, + "learning_rate": 4.6118412646380515e-06, + "loss": 1.0792, + "step": 6784 + }, + { + "epoch": 0.2, + "learning_rate": 4.611710712861725e-06, + "loss": 1.1011, + "step": 6785 + }, + { + "epoch": 0.2, + "learning_rate": 4.61158014098293e-06, + "loss": 1.1512, + "step": 6786 + }, + { + "epoch": 0.2, + "learning_rate": 4.611449549002908e-06, + "loss": 1.1867, + "step": 6787 + }, + { + "epoch": 0.2, + "learning_rate": 4.611318936922905e-06, + "loss": 1.0588, + "step": 6788 + }, + { + "epoch": 0.2, + "learning_rate": 4.6111883047441616e-06, + "loss": 1.1316, + "step": 6789 + }, + { + "epoch": 0.2, + "learning_rate": 4.611057652467923e-06, + "loss": 1.1146, + "step": 6790 + }, + { + "epoch": 0.2, + "learning_rate": 4.610926980095431e-06, + "loss": 1.1134, + "step": 6791 + }, + { + "epoch": 0.2, + "learning_rate": 4.610796287627932e-06, + "loss": 1.1244, + "step": 6792 + }, + { + "epoch": 0.2, + "learning_rate": 4.610665575066668e-06, + "loss": 1.1281, + "step": 6793 + }, + { + "epoch": 0.2, + "learning_rate": 4.610534842412886e-06, + "loss": 1.0919, + "step": 6794 + }, + { + "epoch": 0.2, + "learning_rate": 4.610404089667827e-06, + "loss": 1.1606, + "step": 6795 + }, + { + "epoch": 0.2, + "learning_rate": 4.610273316832738e-06, + "loss": 1.185, + "step": 6796 + }, + { + "epoch": 0.2, + "learning_rate": 4.610142523908864e-06, + "loss": 1.0132, + "step": 6797 + }, + { + "epoch": 0.2, + "learning_rate": 4.610011710897449e-06, + "loss": 1.1917, + "step": 6798 + }, + { + "epoch": 0.2, + "learning_rate": 4.609880877799738e-06, + "loss": 1.2404, + "step": 6799 + }, + { + "epoch": 0.2, + "learning_rate": 4.609750024616978e-06, + "loss": 1.1797, + "step": 6800 + }, + { + "epoch": 0.2, + "learning_rate": 4.609619151350414e-06, + "loss": 1.1564, + "step": 6801 + }, + { + "epoch": 0.2, + "learning_rate": 4.609488258001291e-06, + "loss": 1.1041, + "step": 6802 + }, + { + "epoch": 0.2, + "learning_rate": 4.609357344570856e-06, + "loss": 1.1194, + "step": 6803 + }, + { + "epoch": 0.2, + "learning_rate": 4.6092264110603545e-06, + "loss": 1.2216, + "step": 6804 + }, + { + "epoch": 0.21, + "learning_rate": 4.609095457471035e-06, + "loss": 1.2285, + "step": 6805 + }, + { + "epoch": 0.21, + "learning_rate": 4.608964483804141e-06, + "loss": 1.2234, + "step": 6806 + }, + { + "epoch": 0.21, + "learning_rate": 4.608833490060921e-06, + "loss": 1.18, + "step": 6807 + }, + { + "epoch": 0.21, + "learning_rate": 4.608702476242622e-06, + "loss": 1.1864, + "step": 6808 + }, + { + "epoch": 0.21, + "learning_rate": 4.608571442350491e-06, + "loss": 1.1804, + "step": 6809 + }, + { + "epoch": 0.21, + "learning_rate": 4.608440388385776e-06, + "loss": 1.1716, + "step": 6810 + }, + { + "epoch": 0.21, + "learning_rate": 4.608309314349724e-06, + "loss": 1.1943, + "step": 6811 + }, + { + "epoch": 0.21, + "learning_rate": 4.608178220243582e-06, + "loss": 1.2548, + "step": 6812 + }, + { + "epoch": 0.21, + "learning_rate": 4.608047106068598e-06, + "loss": 1.1497, + "step": 6813 + }, + { + "epoch": 0.21, + "learning_rate": 4.607915971826022e-06, + "loss": 1.1098, + "step": 6814 + }, + { + "epoch": 0.21, + "learning_rate": 4.607784817517101e-06, + "loss": 1.1636, + "step": 6815 + }, + { + "epoch": 0.21, + "learning_rate": 4.607653643143084e-06, + "loss": 1.1234, + "step": 6816 + }, + { + "epoch": 0.21, + "learning_rate": 4.607522448705218e-06, + "loss": 1.1091, + "step": 6817 + }, + { + "epoch": 0.21, + "learning_rate": 4.607391234204755e-06, + "loss": 0.9704, + "step": 6818 + }, + { + "epoch": 0.21, + "learning_rate": 4.607259999642941e-06, + "loss": 1.2643, + "step": 6819 + }, + { + "epoch": 0.21, + "learning_rate": 4.6071287450210275e-06, + "loss": 1.1595, + "step": 6820 + }, + { + "epoch": 0.21, + "learning_rate": 4.606997470340263e-06, + "loss": 1.1411, + "step": 6821 + }, + { + "epoch": 0.21, + "learning_rate": 4.606866175601898e-06, + "loss": 1.223, + "step": 6822 + }, + { + "epoch": 0.21, + "learning_rate": 4.606734860807181e-06, + "loss": 1.0151, + "step": 6823 + }, + { + "epoch": 0.21, + "learning_rate": 4.6066035259573624e-06, + "loss": 1.0328, + "step": 6824 + }, + { + "epoch": 0.21, + "learning_rate": 4.606472171053693e-06, + "loss": 1.2269, + "step": 6825 + }, + { + "epoch": 0.21, + "learning_rate": 4.606340796097424e-06, + "loss": 1.1561, + "step": 6826 + }, + { + "epoch": 0.21, + "learning_rate": 4.606209401089804e-06, + "loss": 1.1523, + "step": 6827 + }, + { + "epoch": 0.21, + "learning_rate": 4.606077986032086e-06, + "loss": 1.0871, + "step": 6828 + }, + { + "epoch": 0.21, + "learning_rate": 4.605946550925519e-06, + "loss": 1.1359, + "step": 6829 + }, + { + "epoch": 0.21, + "learning_rate": 4.605815095771355e-06, + "loss": 1.249, + "step": 6830 + }, + { + "epoch": 0.21, + "learning_rate": 4.605683620570845e-06, + "loss": 1.1151, + "step": 6831 + }, + { + "epoch": 0.21, + "learning_rate": 4.605552125325242e-06, + "loss": 1.2499, + "step": 6832 + }, + { + "epoch": 0.21, + "learning_rate": 4.605420610035797e-06, + "loss": 1.0777, + "step": 6833 + }, + { + "epoch": 0.21, + "learning_rate": 4.605289074703761e-06, + "loss": 1.181, + "step": 6834 + }, + { + "epoch": 0.21, + "learning_rate": 4.605157519330388e-06, + "loss": 1.1635, + "step": 6835 + }, + { + "epoch": 0.21, + "learning_rate": 4.605025943916929e-06, + "loss": 1.1056, + "step": 6836 + }, + { + "epoch": 0.21, + "learning_rate": 4.6048943484646365e-06, + "loss": 1.0613, + "step": 6837 + }, + { + "epoch": 0.21, + "learning_rate": 4.604762732974763e-06, + "loss": 1.0573, + "step": 6838 + }, + { + "epoch": 0.21, + "learning_rate": 4.604631097448563e-06, + "loss": 1.1557, + "step": 6839 + }, + { + "epoch": 0.21, + "learning_rate": 4.604499441887288e-06, + "loss": 1.2069, + "step": 6840 + }, + { + "epoch": 0.21, + "learning_rate": 4.604367766292191e-06, + "loss": 1.1516, + "step": 6841 + }, + { + "epoch": 0.21, + "learning_rate": 4.604236070664528e-06, + "loss": 1.1467, + "step": 6842 + }, + { + "epoch": 0.21, + "learning_rate": 4.604104355005551e-06, + "loss": 1.2083, + "step": 6843 + }, + { + "epoch": 0.21, + "learning_rate": 4.603972619316513e-06, + "loss": 1.3035, + "step": 6844 + }, + { + "epoch": 0.21, + "learning_rate": 4.603840863598669e-06, + "loss": 1.1316, + "step": 6845 + }, + { + "epoch": 0.21, + "learning_rate": 4.603709087853274e-06, + "loss": 1.1932, + "step": 6846 + }, + { + "epoch": 0.21, + "learning_rate": 4.603577292081582e-06, + "loss": 1.0573, + "step": 6847 + }, + { + "epoch": 0.21, + "learning_rate": 4.603445476284845e-06, + "loss": 1.1103, + "step": 6848 + }, + { + "epoch": 0.21, + "learning_rate": 4.603313640464322e-06, + "loss": 1.0559, + "step": 6849 + }, + { + "epoch": 0.21, + "learning_rate": 4.603181784621266e-06, + "loss": 1.1301, + "step": 6850 + }, + { + "epoch": 0.21, + "learning_rate": 4.6030499087569315e-06, + "loss": 1.1162, + "step": 6851 + }, + { + "epoch": 0.21, + "learning_rate": 4.602918012872576e-06, + "loss": 1.1002, + "step": 6852 + }, + { + "epoch": 0.21, + "learning_rate": 4.602786096969453e-06, + "loss": 1.1799, + "step": 6853 + }, + { + "epoch": 0.21, + "learning_rate": 4.602654161048819e-06, + "loss": 1.1111, + "step": 6854 + }, + { + "epoch": 0.21, + "learning_rate": 4.60252220511193e-06, + "loss": 1.2352, + "step": 6855 + }, + { + "epoch": 0.21, + "learning_rate": 4.602390229160043e-06, + "loss": 1.0691, + "step": 6856 + }, + { + "epoch": 0.21, + "learning_rate": 4.602258233194413e-06, + "loss": 1.1884, + "step": 6857 + }, + { + "epoch": 0.21, + "learning_rate": 4.602126217216297e-06, + "loss": 1.1576, + "step": 6858 + }, + { + "epoch": 0.21, + "learning_rate": 4.601994181226952e-06, + "loss": 1.1134, + "step": 6859 + }, + { + "epoch": 0.21, + "learning_rate": 4.601862125227634e-06, + "loss": 1.153, + "step": 6860 + }, + { + "epoch": 0.21, + "learning_rate": 4.601730049219602e-06, + "loss": 1.1226, + "step": 6861 + }, + { + "epoch": 0.21, + "learning_rate": 4.601597953204112e-06, + "loss": 1.0668, + "step": 6862 + }, + { + "epoch": 0.21, + "learning_rate": 4.601465837182421e-06, + "loss": 1.2543, + "step": 6863 + }, + { + "epoch": 0.21, + "learning_rate": 4.601333701155788e-06, + "loss": 1.1852, + "step": 6864 + }, + { + "epoch": 0.21, + "learning_rate": 4.60120154512547e-06, + "loss": 1.0687, + "step": 6865 + }, + { + "epoch": 0.21, + "learning_rate": 4.601069369092725e-06, + "loss": 1.3774, + "step": 6866 + }, + { + "epoch": 0.21, + "learning_rate": 4.6009371730588115e-06, + "loss": 1.202, + "step": 6867 + }, + { + "epoch": 0.21, + "learning_rate": 4.600804957024988e-06, + "loss": 1.155, + "step": 6868 + }, + { + "epoch": 0.21, + "learning_rate": 4.600672720992514e-06, + "loss": 1.1752, + "step": 6869 + }, + { + "epoch": 0.21, + "learning_rate": 4.600540464962646e-06, + "loss": 1.1562, + "step": 6870 + }, + { + "epoch": 0.21, + "learning_rate": 4.600408188936645e-06, + "loss": 1.0698, + "step": 6871 + }, + { + "epoch": 0.21, + "learning_rate": 4.60027589291577e-06, + "loss": 1.172, + "step": 6872 + }, + { + "epoch": 0.21, + "learning_rate": 4.600143576901279e-06, + "loss": 1.2339, + "step": 6873 + }, + { + "epoch": 0.21, + "learning_rate": 4.600011240894434e-06, + "loss": 1.1828, + "step": 6874 + }, + { + "epoch": 0.21, + "learning_rate": 4.599878884896493e-06, + "loss": 1.1772, + "step": 6875 + }, + { + "epoch": 0.21, + "learning_rate": 4.5997465089087155e-06, + "loss": 1.1632, + "step": 6876 + }, + { + "epoch": 0.21, + "learning_rate": 4.599614112932363e-06, + "loss": 0.9822, + "step": 6877 + }, + { + "epoch": 0.21, + "learning_rate": 4.599481696968696e-06, + "loss": 1.0499, + "step": 6878 + }, + { + "epoch": 0.21, + "learning_rate": 4.5993492610189736e-06, + "loss": 1.1164, + "step": 6879 + }, + { + "epoch": 0.21, + "learning_rate": 4.5992168050844575e-06, + "loss": 1.0394, + "step": 6880 + }, + { + "epoch": 0.21, + "learning_rate": 4.599084329166409e-06, + "loss": 1.0126, + "step": 6881 + }, + { + "epoch": 0.21, + "learning_rate": 4.598951833266087e-06, + "loss": 1.1019, + "step": 6882 + }, + { + "epoch": 0.21, + "learning_rate": 4.598819317384757e-06, + "loss": 1.0317, + "step": 6883 + }, + { + "epoch": 0.21, + "learning_rate": 4.5986867815236755e-06, + "loss": 1.1071, + "step": 6884 + }, + { + "epoch": 0.21, + "learning_rate": 4.5985542256841085e-06, + "loss": 1.1033, + "step": 6885 + }, + { + "epoch": 0.21, + "learning_rate": 4.598421649867315e-06, + "loss": 1.2506, + "step": 6886 + }, + { + "epoch": 0.21, + "learning_rate": 4.5982890540745575e-06, + "loss": 1.1734, + "step": 6887 + }, + { + "epoch": 0.21, + "learning_rate": 4.5981564383070994e-06, + "loss": 1.1413, + "step": 6888 + }, + { + "epoch": 0.21, + "learning_rate": 4.598023802566203e-06, + "loss": 1.2546, + "step": 6889 + }, + { + "epoch": 0.21, + "learning_rate": 4.597891146853129e-06, + "loss": 1.1342, + "step": 6890 + }, + { + "epoch": 0.21, + "learning_rate": 4.597758471169143e-06, + "loss": 1.1249, + "step": 6891 + }, + { + "epoch": 0.21, + "learning_rate": 4.597625775515507e-06, + "loss": 1.0865, + "step": 6892 + }, + { + "epoch": 0.21, + "learning_rate": 4.597493059893483e-06, + "loss": 1.1318, + "step": 6893 + }, + { + "epoch": 0.21, + "learning_rate": 4.5973603243043354e-06, + "loss": 1.0582, + "step": 6894 + }, + { + "epoch": 0.21, + "learning_rate": 4.5972275687493275e-06, + "loss": 1.1522, + "step": 6895 + }, + { + "epoch": 0.21, + "learning_rate": 4.5970947932297234e-06, + "loss": 1.0773, + "step": 6896 + }, + { + "epoch": 0.21, + "learning_rate": 4.596961997746787e-06, + "loss": 1.098, + "step": 6897 + }, + { + "epoch": 0.21, + "learning_rate": 4.596829182301782e-06, + "loss": 1.2234, + "step": 6898 + }, + { + "epoch": 0.21, + "learning_rate": 4.596696346895973e-06, + "loss": 1.2892, + "step": 6899 + }, + { + "epoch": 0.21, + "learning_rate": 4.596563491530625e-06, + "loss": 1.1631, + "step": 6900 + }, + { + "epoch": 0.21, + "learning_rate": 4.596430616207002e-06, + "loss": 1.1129, + "step": 6901 + }, + { + "epoch": 0.21, + "learning_rate": 4.596297720926369e-06, + "loss": 1.1336, + "step": 6902 + }, + { + "epoch": 0.21, + "learning_rate": 4.596164805689992e-06, + "loss": 1.1698, + "step": 6903 + }, + { + "epoch": 0.21, + "learning_rate": 4.596031870499135e-06, + "loss": 1.0833, + "step": 6904 + }, + { + "epoch": 0.21, + "learning_rate": 4.595898915355063e-06, + "loss": 1.2063, + "step": 6905 + }, + { + "epoch": 0.21, + "learning_rate": 4.5957659402590445e-06, + "loss": 1.1445, + "step": 6906 + }, + { + "epoch": 0.21, + "learning_rate": 4.595632945212344e-06, + "loss": 1.1257, + "step": 6907 + }, + { + "epoch": 0.21, + "learning_rate": 4.595499930216225e-06, + "loss": 1.0881, + "step": 6908 + }, + { + "epoch": 0.21, + "learning_rate": 4.595366895271958e-06, + "loss": 1.1647, + "step": 6909 + }, + { + "epoch": 0.21, + "learning_rate": 4.595233840380806e-06, + "loss": 1.2117, + "step": 6910 + }, + { + "epoch": 0.21, + "learning_rate": 4.595100765544038e-06, + "loss": 1.1699, + "step": 6911 + }, + { + "epoch": 0.21, + "learning_rate": 4.594967670762919e-06, + "loss": 1.0435, + "step": 6912 + }, + { + "epoch": 0.21, + "learning_rate": 4.594834556038717e-06, + "loss": 1.2332, + "step": 6913 + }, + { + "epoch": 0.21, + "learning_rate": 4.594701421372699e-06, + "loss": 1.1821, + "step": 6914 + }, + { + "epoch": 0.21, + "learning_rate": 4.594568266766132e-06, + "loss": 1.219, + "step": 6915 + }, + { + "epoch": 0.21, + "learning_rate": 4.594435092220284e-06, + "loss": 1.1984, + "step": 6916 + }, + { + "epoch": 0.21, + "learning_rate": 4.594301897736422e-06, + "loss": 1.1536, + "step": 6917 + }, + { + "epoch": 0.21, + "learning_rate": 4.594168683315815e-06, + "loss": 1.2084, + "step": 6918 + }, + { + "epoch": 0.21, + "learning_rate": 4.594035448959732e-06, + "loss": 1.1611, + "step": 6919 + }, + { + "epoch": 0.21, + "learning_rate": 4.593902194669438e-06, + "loss": 1.0168, + "step": 6920 + }, + { + "epoch": 0.21, + "learning_rate": 4.593768920446205e-06, + "loss": 1.1395, + "step": 6921 + }, + { + "epoch": 0.21, + "learning_rate": 4.5936356262912995e-06, + "loss": 1.2681, + "step": 6922 + }, + { + "epoch": 0.21, + "learning_rate": 4.593502312205992e-06, + "loss": 1.079, + "step": 6923 + }, + { + "epoch": 0.21, + "learning_rate": 4.59336897819155e-06, + "loss": 1.1248, + "step": 6924 + }, + { + "epoch": 0.21, + "learning_rate": 4.593235624249244e-06, + "loss": 1.0909, + "step": 6925 + }, + { + "epoch": 0.21, + "learning_rate": 4.593102250380343e-06, + "loss": 1.2071, + "step": 6926 + }, + { + "epoch": 0.21, + "learning_rate": 4.592968856586117e-06, + "loss": 1.1368, + "step": 6927 + }, + { + "epoch": 0.21, + "learning_rate": 4.592835442867834e-06, + "loss": 1.1932, + "step": 6928 + }, + { + "epoch": 0.21, + "learning_rate": 4.592702009226767e-06, + "loss": 1.108, + "step": 6929 + }, + { + "epoch": 0.21, + "learning_rate": 4.592568555664183e-06, + "loss": 1.1785, + "step": 6930 + }, + { + "epoch": 0.21, + "learning_rate": 4.592435082181356e-06, + "loss": 1.1804, + "step": 6931 + }, + { + "epoch": 0.21, + "learning_rate": 4.592301588779554e-06, + "loss": 1.1296, + "step": 6932 + }, + { + "epoch": 0.21, + "learning_rate": 4.592168075460049e-06, + "loss": 1.1477, + "step": 6933 + }, + { + "epoch": 0.21, + "learning_rate": 4.592034542224112e-06, + "loss": 1.0563, + "step": 6934 + }, + { + "epoch": 0.21, + "learning_rate": 4.591900989073012e-06, + "loss": 1.3455, + "step": 6935 + }, + { + "epoch": 0.21, + "learning_rate": 4.5917674160080224e-06, + "loss": 1.286, + "step": 6936 + }, + { + "epoch": 0.21, + "learning_rate": 4.591633823030416e-06, + "loss": 1.2726, + "step": 6937 + }, + { + "epoch": 0.21, + "learning_rate": 4.591500210141462e-06, + "loss": 1.2103, + "step": 6938 + }, + { + "epoch": 0.21, + "learning_rate": 4.591366577342433e-06, + "loss": 1.1364, + "step": 6939 + }, + { + "epoch": 0.21, + "learning_rate": 4.591232924634602e-06, + "loss": 1.1345, + "step": 6940 + }, + { + "epoch": 0.21, + "learning_rate": 4.5910992520192406e-06, + "loss": 1.187, + "step": 6941 + }, + { + "epoch": 0.21, + "learning_rate": 4.590965559497621e-06, + "loss": 1.1286, + "step": 6942 + }, + { + "epoch": 0.21, + "learning_rate": 4.590831847071017e-06, + "loss": 1.1589, + "step": 6943 + }, + { + "epoch": 0.21, + "learning_rate": 4.5906981147407e-06, + "loss": 1.2111, + "step": 6944 + }, + { + "epoch": 0.21, + "learning_rate": 4.590564362507944e-06, + "loss": 1.0958, + "step": 6945 + }, + { + "epoch": 0.21, + "learning_rate": 4.590430590374023e-06, + "loss": 1.1509, + "step": 6946 + }, + { + "epoch": 0.21, + "learning_rate": 4.5902967983402095e-06, + "loss": 1.0274, + "step": 6947 + }, + { + "epoch": 0.21, + "learning_rate": 4.590162986407776e-06, + "loss": 1.2146, + "step": 6948 + }, + { + "epoch": 0.21, + "learning_rate": 4.590029154577998e-06, + "loss": 1.1598, + "step": 6949 + }, + { + "epoch": 0.21, + "learning_rate": 4.58989530285215e-06, + "loss": 1.1733, + "step": 6950 + }, + { + "epoch": 0.21, + "learning_rate": 4.589761431231504e-06, + "loss": 1.08, + "step": 6951 + }, + { + "epoch": 0.21, + "learning_rate": 4.589627539717336e-06, + "loss": 1.1011, + "step": 6952 + }, + { + "epoch": 0.21, + "learning_rate": 4.58949362831092e-06, + "loss": 1.0713, + "step": 6953 + }, + { + "epoch": 0.21, + "learning_rate": 4.589359697013532e-06, + "loss": 1.1114, + "step": 6954 + }, + { + "epoch": 0.21, + "learning_rate": 4.589225745826445e-06, + "loss": 1.1815, + "step": 6955 + }, + { + "epoch": 0.21, + "learning_rate": 4.589091774750935e-06, + "loss": 1.1456, + "step": 6956 + }, + { + "epoch": 0.21, + "learning_rate": 4.588957783788278e-06, + "loss": 1.2479, + "step": 6957 + }, + { + "epoch": 0.21, + "learning_rate": 4.588823772939749e-06, + "loss": 1.1597, + "step": 6958 + }, + { + "epoch": 0.21, + "learning_rate": 4.588689742206624e-06, + "loss": 1.0959, + "step": 6959 + }, + { + "epoch": 0.21, + "learning_rate": 4.588555691590178e-06, + "loss": 1.1526, + "step": 6960 + }, + { + "epoch": 0.21, + "learning_rate": 4.5884216210916875e-06, + "loss": 1.1982, + "step": 6961 + }, + { + "epoch": 0.21, + "learning_rate": 4.588287530712429e-06, + "loss": 1.0609, + "step": 6962 + }, + { + "epoch": 0.21, + "learning_rate": 4.588153420453679e-06, + "loss": 1.1369, + "step": 6963 + }, + { + "epoch": 0.21, + "learning_rate": 4.588019290316715e-06, + "loss": 1.1987, + "step": 6964 + }, + { + "epoch": 0.21, + "learning_rate": 4.587885140302812e-06, + "loss": 0.9916, + "step": 6965 + }, + { + "epoch": 0.21, + "learning_rate": 4.587750970413249e-06, + "loss": 1.0257, + "step": 6966 + }, + { + "epoch": 0.21, + "learning_rate": 4.587616780649302e-06, + "loss": 1.1688, + "step": 6967 + }, + { + "epoch": 0.21, + "learning_rate": 4.587482571012248e-06, + "loss": 1.2108, + "step": 6968 + }, + { + "epoch": 0.21, + "learning_rate": 4.5873483415033654e-06, + "loss": 1.0898, + "step": 6969 + }, + { + "epoch": 0.21, + "learning_rate": 4.587214092123932e-06, + "loss": 1.0698, + "step": 6970 + }, + { + "epoch": 0.21, + "learning_rate": 4.587079822875226e-06, + "loss": 1.0752, + "step": 6971 + }, + { + "epoch": 0.21, + "learning_rate": 4.586945533758525e-06, + "loss": 1.2004, + "step": 6972 + }, + { + "epoch": 0.21, + "learning_rate": 4.586811224775107e-06, + "loss": 1.2524, + "step": 6973 + }, + { + "epoch": 0.21, + "learning_rate": 4.586676895926253e-06, + "loss": 1.2266, + "step": 6974 + }, + { + "epoch": 0.21, + "learning_rate": 4.586542547213238e-06, + "loss": 1.1, + "step": 6975 + }, + { + "epoch": 0.21, + "learning_rate": 4.586408178637344e-06, + "loss": 1.1616, + "step": 6976 + }, + { + "epoch": 0.21, + "learning_rate": 4.5862737901998486e-06, + "loss": 1.1777, + "step": 6977 + }, + { + "epoch": 0.21, + "learning_rate": 4.586139381902031e-06, + "loss": 1.1569, + "step": 6978 + }, + { + "epoch": 0.21, + "learning_rate": 4.5860049537451724e-06, + "loss": 1.0767, + "step": 6979 + }, + { + "epoch": 0.21, + "learning_rate": 4.585870505730551e-06, + "loss": 1.1969, + "step": 6980 + }, + { + "epoch": 0.21, + "learning_rate": 4.585736037859446e-06, + "loss": 1.0548, + "step": 6981 + }, + { + "epoch": 0.21, + "learning_rate": 4.585601550133139e-06, + "loss": 1.2145, + "step": 6982 + }, + { + "epoch": 0.21, + "learning_rate": 4.585467042552909e-06, + "loss": 1.1945, + "step": 6983 + }, + { + "epoch": 0.21, + "learning_rate": 4.585332515120039e-06, + "loss": 1.0917, + "step": 6984 + }, + { + "epoch": 0.21, + "learning_rate": 4.585197967835806e-06, + "loss": 1.0983, + "step": 6985 + }, + { + "epoch": 0.21, + "learning_rate": 4.585063400701494e-06, + "loss": 1.0893, + "step": 6986 + }, + { + "epoch": 0.21, + "learning_rate": 4.5849288137183815e-06, + "loss": 1.2091, + "step": 6987 + }, + { + "epoch": 0.21, + "learning_rate": 4.584794206887752e-06, + "loss": 1.1747, + "step": 6988 + }, + { + "epoch": 0.21, + "learning_rate": 4.584659580210884e-06, + "loss": 1.0798, + "step": 6989 + }, + { + "epoch": 0.21, + "learning_rate": 4.584524933689062e-06, + "loss": 1.0912, + "step": 6990 + }, + { + "epoch": 0.21, + "learning_rate": 4.584390267323567e-06, + "loss": 1.0226, + "step": 6991 + }, + { + "epoch": 0.21, + "learning_rate": 4.584255581115679e-06, + "loss": 1.0294, + "step": 6992 + }, + { + "epoch": 0.21, + "learning_rate": 4.584120875066683e-06, + "loss": 1.2596, + "step": 6993 + }, + { + "epoch": 0.21, + "learning_rate": 4.58398614917786e-06, + "loss": 1.1785, + "step": 6994 + }, + { + "epoch": 0.21, + "learning_rate": 4.583851403450492e-06, + "loss": 1.1519, + "step": 6995 + }, + { + "epoch": 0.21, + "learning_rate": 4.5837166378858626e-06, + "loss": 1.1972, + "step": 6996 + }, + { + "epoch": 0.21, + "learning_rate": 4.583581852485254e-06, + "loss": 1.2296, + "step": 6997 + }, + { + "epoch": 0.21, + "learning_rate": 4.583447047249949e-06, + "loss": 1.2289, + "step": 6998 + }, + { + "epoch": 0.21, + "learning_rate": 4.583312222181233e-06, + "loss": 1.1908, + "step": 6999 + }, + { + "epoch": 0.21, + "learning_rate": 4.583177377280387e-06, + "loss": 1.2566, + "step": 7000 + }, + { + "epoch": 0.21, + "learning_rate": 4.583042512548697e-06, + "loss": 1.0394, + "step": 7001 + }, + { + "epoch": 0.21, + "learning_rate": 4.582907627987444e-06, + "loss": 1.1917, + "step": 7002 + }, + { + "epoch": 0.21, + "learning_rate": 4.582772723597914e-06, + "loss": 1.0591, + "step": 7003 + }, + { + "epoch": 0.21, + "learning_rate": 4.5826377993813905e-06, + "loss": 1.1523, + "step": 7004 + }, + { + "epoch": 0.21, + "learning_rate": 4.582502855339158e-06, + "loss": 1.157, + "step": 7005 + }, + { + "epoch": 0.21, + "learning_rate": 4.582367891472502e-06, + "loss": 1.1429, + "step": 7006 + }, + { + "epoch": 0.21, + "learning_rate": 4.582232907782707e-06, + "loss": 1.1132, + "step": 7007 + }, + { + "epoch": 0.21, + "learning_rate": 4.582097904271057e-06, + "loss": 1.2357, + "step": 7008 + }, + { + "epoch": 0.21, + "learning_rate": 4.581962880938837e-06, + "loss": 1.148, + "step": 7009 + }, + { + "epoch": 0.21, + "learning_rate": 4.581827837787334e-06, + "loss": 1.174, + "step": 7010 + }, + { + "epoch": 0.21, + "learning_rate": 4.581692774817832e-06, + "loss": 1.1299, + "step": 7011 + }, + { + "epoch": 0.21, + "learning_rate": 4.581557692031618e-06, + "loss": 1.1422, + "step": 7012 + }, + { + "epoch": 0.21, + "learning_rate": 4.581422589429977e-06, + "loss": 1.1245, + "step": 7013 + }, + { + "epoch": 0.21, + "learning_rate": 4.5812874670141955e-06, + "loss": 1.1161, + "step": 7014 + }, + { + "epoch": 0.21, + "learning_rate": 4.581152324785559e-06, + "loss": 1.1815, + "step": 7015 + }, + { + "epoch": 0.21, + "learning_rate": 4.581017162745356e-06, + "loss": 1.1634, + "step": 7016 + }, + { + "epoch": 0.21, + "learning_rate": 4.580881980894872e-06, + "loss": 1.1254, + "step": 7017 + }, + { + "epoch": 0.21, + "learning_rate": 4.580746779235392e-06, + "loss": 1.2823, + "step": 7018 + }, + { + "epoch": 0.21, + "learning_rate": 4.580611557768206e-06, + "loss": 1.1447, + "step": 7019 + }, + { + "epoch": 0.21, + "learning_rate": 4.580476316494599e-06, + "loss": 1.0311, + "step": 7020 + }, + { + "epoch": 0.21, + "learning_rate": 4.58034105541586e-06, + "loss": 1.2114, + "step": 7021 + }, + { + "epoch": 0.21, + "learning_rate": 4.5802057745332765e-06, + "loss": 1.1229, + "step": 7022 + }, + { + "epoch": 0.21, + "learning_rate": 4.580070473848135e-06, + "loss": 1.1299, + "step": 7023 + }, + { + "epoch": 0.21, + "learning_rate": 4.579935153361725e-06, + "loss": 1.1317, + "step": 7024 + }, + { + "epoch": 0.21, + "learning_rate": 4.579799813075335e-06, + "loss": 1.1465, + "step": 7025 + }, + { + "epoch": 0.21, + "learning_rate": 4.579664452990252e-06, + "loss": 1.1667, + "step": 7026 + }, + { + "epoch": 0.21, + "learning_rate": 4.579529073107764e-06, + "loss": 1.1727, + "step": 7027 + }, + { + "epoch": 0.21, + "learning_rate": 4.579393673429161e-06, + "loss": 1.1462, + "step": 7028 + }, + { + "epoch": 0.21, + "learning_rate": 4.579258253955731e-06, + "loss": 1.0958, + "step": 7029 + }, + { + "epoch": 0.21, + "learning_rate": 4.5791228146887656e-06, + "loss": 1.12, + "step": 7030 + }, + { + "epoch": 0.21, + "learning_rate": 4.578987355629552e-06, + "loss": 1.2008, + "step": 7031 + }, + { + "epoch": 0.21, + "learning_rate": 4.5788518767793786e-06, + "loss": 1.0227, + "step": 7032 + }, + { + "epoch": 0.21, + "learning_rate": 4.578716378139538e-06, + "loss": 1.1498, + "step": 7033 + }, + { + "epoch": 0.21, + "learning_rate": 4.578580859711318e-06, + "loss": 0.985, + "step": 7034 + }, + { + "epoch": 0.21, + "learning_rate": 4.57844532149601e-06, + "loss": 1.1329, + "step": 7035 + }, + { + "epoch": 0.21, + "learning_rate": 4.5783097634949025e-06, + "loss": 1.1768, + "step": 7036 + }, + { + "epoch": 0.21, + "learning_rate": 4.578174185709288e-06, + "loss": 1.2235, + "step": 7037 + }, + { + "epoch": 0.21, + "learning_rate": 4.578038588140456e-06, + "loss": 1.1591, + "step": 7038 + }, + { + "epoch": 0.21, + "learning_rate": 4.577902970789696e-06, + "loss": 1.2642, + "step": 7039 + }, + { + "epoch": 0.21, + "learning_rate": 4.577767333658302e-06, + "loss": 1.0752, + "step": 7040 + }, + { + "epoch": 0.21, + "learning_rate": 4.5776316767475635e-06, + "loss": 1.1949, + "step": 7041 + }, + { + "epoch": 0.21, + "learning_rate": 4.577496000058771e-06, + "loss": 1.2086, + "step": 7042 + }, + { + "epoch": 0.21, + "learning_rate": 4.577360303593219e-06, + "loss": 1.0393, + "step": 7043 + }, + { + "epoch": 0.21, + "learning_rate": 4.577224587352196e-06, + "loss": 1.0892, + "step": 7044 + }, + { + "epoch": 0.21, + "learning_rate": 4.5770888513369955e-06, + "loss": 1.149, + "step": 7045 + }, + { + "epoch": 0.21, + "learning_rate": 4.57695309554891e-06, + "loss": 1.2264, + "step": 7046 + }, + { + "epoch": 0.21, + "learning_rate": 4.576817319989231e-06, + "loss": 1.1279, + "step": 7047 + }, + { + "epoch": 0.21, + "learning_rate": 4.576681524659251e-06, + "loss": 1.0409, + "step": 7048 + }, + { + "epoch": 0.21, + "learning_rate": 4.576545709560264e-06, + "loss": 1.1503, + "step": 7049 + }, + { + "epoch": 0.21, + "learning_rate": 4.576409874693561e-06, + "loss": 1.1589, + "step": 7050 + }, + { + "epoch": 0.21, + "learning_rate": 4.576274020060436e-06, + "loss": 1.1164, + "step": 7051 + }, + { + "epoch": 0.21, + "learning_rate": 4.576138145662183e-06, + "loss": 1.1345, + "step": 7052 + }, + { + "epoch": 0.21, + "learning_rate": 4.576002251500095e-06, + "loss": 1.1198, + "step": 7053 + }, + { + "epoch": 0.21, + "learning_rate": 4.575866337575464e-06, + "loss": 1.066, + "step": 7054 + }, + { + "epoch": 0.21, + "learning_rate": 4.575730403889586e-06, + "loss": 1.0543, + "step": 7055 + }, + { + "epoch": 0.21, + "learning_rate": 4.5755944504437545e-06, + "loss": 1.1301, + "step": 7056 + }, + { + "epoch": 0.21, + "learning_rate": 4.575458477239263e-06, + "loss": 1.0657, + "step": 7057 + }, + { + "epoch": 0.21, + "learning_rate": 4.5753224842774066e-06, + "loss": 1.1651, + "step": 7058 + }, + { + "epoch": 0.21, + "learning_rate": 4.57518647155948e-06, + "loss": 1.1147, + "step": 7059 + }, + { + "epoch": 0.21, + "learning_rate": 4.575050439086778e-06, + "loss": 1.1327, + "step": 7060 + }, + { + "epoch": 0.21, + "learning_rate": 4.574914386860594e-06, + "loss": 1.1474, + "step": 7061 + }, + { + "epoch": 0.21, + "learning_rate": 4.574778314882225e-06, + "loss": 1.1183, + "step": 7062 + }, + { + "epoch": 0.21, + "learning_rate": 4.5746422231529654e-06, + "loss": 1.2057, + "step": 7063 + }, + { + "epoch": 0.21, + "learning_rate": 4.574506111674111e-06, + "loss": 1.1055, + "step": 7064 + }, + { + "epoch": 0.21, + "learning_rate": 4.574369980446958e-06, + "loss": 0.9849, + "step": 7065 + }, + { + "epoch": 0.21, + "learning_rate": 4.574233829472802e-06, + "loss": 1.156, + "step": 7066 + }, + { + "epoch": 0.21, + "learning_rate": 4.574097658752938e-06, + "loss": 1.078, + "step": 7067 + }, + { + "epoch": 0.21, + "learning_rate": 4.573961468288664e-06, + "loss": 1.1691, + "step": 7068 + }, + { + "epoch": 0.21, + "learning_rate": 4.5738252580812754e-06, + "loss": 1.197, + "step": 7069 + }, + { + "epoch": 0.21, + "learning_rate": 4.573689028132069e-06, + "loss": 1.1755, + "step": 7070 + }, + { + "epoch": 0.21, + "learning_rate": 4.573552778442342e-06, + "loss": 1.1833, + "step": 7071 + }, + { + "epoch": 0.21, + "learning_rate": 4.5734165090133905e-06, + "loss": 0.9973, + "step": 7072 + }, + { + "epoch": 0.21, + "learning_rate": 4.573280219846514e-06, + "loss": 1.1624, + "step": 7073 + }, + { + "epoch": 0.21, + "learning_rate": 4.5731439109430074e-06, + "loss": 1.2397, + "step": 7074 + }, + { + "epoch": 0.21, + "learning_rate": 4.5730075823041685e-06, + "loss": 1.0654, + "step": 7075 + }, + { + "epoch": 0.21, + "learning_rate": 4.572871233931297e-06, + "loss": 1.1193, + "step": 7076 + }, + { + "epoch": 0.21, + "learning_rate": 4.572734865825689e-06, + "loss": 1.202, + "step": 7077 + }, + { + "epoch": 0.21, + "learning_rate": 4.572598477988644e-06, + "loss": 1.0618, + "step": 7078 + }, + { + "epoch": 0.21, + "learning_rate": 4.572462070421459e-06, + "loss": 1.1824, + "step": 7079 + }, + { + "epoch": 0.21, + "learning_rate": 4.572325643125433e-06, + "loss": 1.2244, + "step": 7080 + }, + { + "epoch": 0.21, + "learning_rate": 4.572189196101865e-06, + "loss": 1.0788, + "step": 7081 + }, + { + "epoch": 0.21, + "learning_rate": 4.572052729352055e-06, + "loss": 1.1685, + "step": 7082 + }, + { + "epoch": 0.21, + "learning_rate": 4.5719162428773005e-06, + "loss": 1.175, + "step": 7083 + }, + { + "epoch": 0.21, + "learning_rate": 4.5717797366789005e-06, + "loss": 1.112, + "step": 7084 + }, + { + "epoch": 0.21, + "learning_rate": 4.571643210758156e-06, + "loss": 1.1193, + "step": 7085 + }, + { + "epoch": 0.21, + "learning_rate": 4.5715066651163655e-06, + "loss": 1.0555, + "step": 7086 + }, + { + "epoch": 0.21, + "learning_rate": 4.571370099754829e-06, + "loss": 1.1805, + "step": 7087 + }, + { + "epoch": 0.21, + "learning_rate": 4.571233514674846e-06, + "loss": 1.147, + "step": 7088 + }, + { + "epoch": 0.21, + "learning_rate": 4.571096909877719e-06, + "loss": 1.0204, + "step": 7089 + }, + { + "epoch": 0.21, + "learning_rate": 4.5709602853647466e-06, + "loss": 1.1893, + "step": 7090 + }, + { + "epoch": 0.21, + "learning_rate": 4.5708236411372295e-06, + "loss": 1.0517, + "step": 7091 + }, + { + "epoch": 0.21, + "learning_rate": 4.570686977196468e-06, + "loss": 1.1141, + "step": 7092 + }, + { + "epoch": 0.21, + "learning_rate": 4.570550293543765e-06, + "loss": 1.209, + "step": 7093 + }, + { + "epoch": 0.21, + "learning_rate": 4.5704135901804196e-06, + "loss": 1.1737, + "step": 7094 + }, + { + "epoch": 0.21, + "learning_rate": 4.570276867107734e-06, + "loss": 1.2625, + "step": 7095 + }, + { + "epoch": 0.21, + "learning_rate": 4.5701401243270106e-06, + "loss": 1.0331, + "step": 7096 + }, + { + "epoch": 0.21, + "learning_rate": 4.570003361839549e-06, + "loss": 1.2637, + "step": 7097 + }, + { + "epoch": 0.21, + "learning_rate": 4.569866579646654e-06, + "loss": 1.1418, + "step": 7098 + }, + { + "epoch": 0.21, + "learning_rate": 4.569729777749624e-06, + "loss": 1.2286, + "step": 7099 + }, + { + "epoch": 0.21, + "learning_rate": 4.5695929561497644e-06, + "loss": 1.1063, + "step": 7100 + }, + { + "epoch": 0.21, + "learning_rate": 4.569456114848376e-06, + "loss": 1.1829, + "step": 7101 + }, + { + "epoch": 0.21, + "learning_rate": 4.569319253846763e-06, + "loss": 1.1119, + "step": 7102 + }, + { + "epoch": 0.21, + "learning_rate": 4.569182373146226e-06, + "loss": 1.0613, + "step": 7103 + }, + { + "epoch": 0.21, + "learning_rate": 4.56904547274807e-06, + "loss": 1.3307, + "step": 7104 + }, + { + "epoch": 0.21, + "learning_rate": 4.568908552653598e-06, + "loss": 1.2074, + "step": 7105 + }, + { + "epoch": 0.21, + "learning_rate": 4.5687716128641135e-06, + "loss": 1.2242, + "step": 7106 + }, + { + "epoch": 0.21, + "learning_rate": 4.568634653380919e-06, + "loss": 1.1298, + "step": 7107 + }, + { + "epoch": 0.21, + "learning_rate": 4.5684976742053185e-06, + "loss": 1.1349, + "step": 7108 + }, + { + "epoch": 0.21, + "learning_rate": 4.568360675338617e-06, + "loss": 1.0401, + "step": 7109 + }, + { + "epoch": 0.21, + "learning_rate": 4.568223656782117e-06, + "loss": 1.1708, + "step": 7110 + }, + { + "epoch": 0.21, + "learning_rate": 4.568086618537125e-06, + "loss": 1.1875, + "step": 7111 + }, + { + "epoch": 0.21, + "learning_rate": 4.567949560604944e-06, + "loss": 1.0665, + "step": 7112 + }, + { + "epoch": 0.21, + "learning_rate": 4.567812482986879e-06, + "loss": 1.0731, + "step": 7113 + }, + { + "epoch": 0.21, + "learning_rate": 4.567675385684235e-06, + "loss": 1.2393, + "step": 7114 + }, + { + "epoch": 0.21, + "learning_rate": 4.567538268698317e-06, + "loss": 1.1445, + "step": 7115 + }, + { + "epoch": 0.21, + "learning_rate": 4.567401132030431e-06, + "loss": 1.2617, + "step": 7116 + }, + { + "epoch": 0.21, + "learning_rate": 4.567263975681882e-06, + "loss": 1.2302, + "step": 7117 + }, + { + "epoch": 0.21, + "learning_rate": 4.567126799653975e-06, + "loss": 1.2515, + "step": 7118 + }, + { + "epoch": 0.21, + "learning_rate": 4.566989603948016e-06, + "loss": 1.2134, + "step": 7119 + }, + { + "epoch": 0.21, + "learning_rate": 4.566852388565312e-06, + "loss": 1.1607, + "step": 7120 + }, + { + "epoch": 0.21, + "learning_rate": 4.5667151535071695e-06, + "loss": 1.1301, + "step": 7121 + }, + { + "epoch": 0.21, + "learning_rate": 4.566577898774893e-06, + "loss": 1.1207, + "step": 7122 + }, + { + "epoch": 0.21, + "learning_rate": 4.566440624369791e-06, + "loss": 1.1646, + "step": 7123 + }, + { + "epoch": 0.21, + "learning_rate": 4.566303330293169e-06, + "loss": 1.1885, + "step": 7124 + }, + { + "epoch": 0.21, + "learning_rate": 4.566166016546335e-06, + "loss": 1.049, + "step": 7125 + }, + { + "epoch": 0.21, + "learning_rate": 4.566028683130595e-06, + "loss": 1.2237, + "step": 7126 + }, + { + "epoch": 0.21, + "learning_rate": 4.565891330047257e-06, + "loss": 1.0841, + "step": 7127 + }, + { + "epoch": 0.21, + "learning_rate": 4.565753957297628e-06, + "loss": 1.1285, + "step": 7128 + }, + { + "epoch": 0.21, + "learning_rate": 4.565616564883018e-06, + "loss": 1.2174, + "step": 7129 + }, + { + "epoch": 0.21, + "learning_rate": 4.565479152804732e-06, + "loss": 1.1568, + "step": 7130 + }, + { + "epoch": 0.21, + "learning_rate": 4.565341721064079e-06, + "loss": 1.1951, + "step": 7131 + }, + { + "epoch": 0.21, + "learning_rate": 4.565204269662368e-06, + "loss": 1.101, + "step": 7132 + }, + { + "epoch": 0.21, + "learning_rate": 4.565066798600907e-06, + "loss": 1.2166, + "step": 7133 + }, + { + "epoch": 0.21, + "learning_rate": 4.564929307881004e-06, + "loss": 1.0893, + "step": 7134 + }, + { + "epoch": 0.21, + "learning_rate": 4.564791797503969e-06, + "loss": 1.1962, + "step": 7135 + }, + { + "epoch": 0.21, + "learning_rate": 4.56465426747111e-06, + "loss": 1.2383, + "step": 7136 + }, + { + "epoch": 0.22, + "learning_rate": 4.564516717783738e-06, + "loss": 1.1902, + "step": 7137 + }, + { + "epoch": 0.22, + "learning_rate": 4.56437914844316e-06, + "loss": 1.1916, + "step": 7138 + }, + { + "epoch": 0.22, + "learning_rate": 4.5642415594506875e-06, + "loss": 1.1262, + "step": 7139 + }, + { + "epoch": 0.22, + "learning_rate": 4.564103950807628e-06, + "loss": 0.9864, + "step": 7140 + }, + { + "epoch": 0.22, + "learning_rate": 4.5639663225152945e-06, + "loss": 1.1564, + "step": 7141 + }, + { + "epoch": 0.22, + "learning_rate": 4.5638286745749955e-06, + "loss": 1.1643, + "step": 7142 + }, + { + "epoch": 0.22, + "learning_rate": 4.563691006988042e-06, + "loss": 1.3605, + "step": 7143 + }, + { + "epoch": 0.22, + "learning_rate": 4.563553319755743e-06, + "loss": 1.2145, + "step": 7144 + }, + { + "epoch": 0.22, + "learning_rate": 4.56341561287941e-06, + "loss": 1.1264, + "step": 7145 + }, + { + "epoch": 0.22, + "learning_rate": 4.5632778863603545e-06, + "loss": 1.0044, + "step": 7146 + }, + { + "epoch": 0.22, + "learning_rate": 4.563140140199888e-06, + "loss": 1.153, + "step": 7147 + }, + { + "epoch": 0.22, + "learning_rate": 4.56300237439932e-06, + "loss": 1.1601, + "step": 7148 + }, + { + "epoch": 0.22, + "learning_rate": 4.5628645889599635e-06, + "loss": 1.1686, + "step": 7149 + }, + { + "epoch": 0.22, + "learning_rate": 4.562726783883129e-06, + "loss": 1.2634, + "step": 7150 + }, + { + "epoch": 0.22, + "learning_rate": 4.56258895917013e-06, + "loss": 1.1641, + "step": 7151 + }, + { + "epoch": 0.22, + "learning_rate": 4.562451114822277e-06, + "loss": 1.1035, + "step": 7152 + }, + { + "epoch": 0.22, + "learning_rate": 4.5623132508408826e-06, + "loss": 1.1152, + "step": 7153 + }, + { + "epoch": 0.22, + "learning_rate": 4.562175367227259e-06, + "loss": 1.2822, + "step": 7154 + }, + { + "epoch": 0.22, + "learning_rate": 4.562037463982719e-06, + "loss": 1.2496, + "step": 7155 + }, + { + "epoch": 0.22, + "learning_rate": 4.561899541108576e-06, + "loss": 1.2036, + "step": 7156 + }, + { + "epoch": 0.22, + "learning_rate": 4.561761598606143e-06, + "loss": 1.1077, + "step": 7157 + }, + { + "epoch": 0.22, + "learning_rate": 4.561623636476732e-06, + "loss": 1.2079, + "step": 7158 + }, + { + "epoch": 0.22, + "learning_rate": 4.561485654721656e-06, + "loss": 1.1909, + "step": 7159 + }, + { + "epoch": 0.22, + "learning_rate": 4.561347653342231e-06, + "loss": 1.1213, + "step": 7160 + }, + { + "epoch": 0.22, + "learning_rate": 4.561209632339768e-06, + "loss": 1.2359, + "step": 7161 + }, + { + "epoch": 0.22, + "learning_rate": 4.561071591715582e-06, + "loss": 1.184, + "step": 7162 + }, + { + "epoch": 0.22, + "learning_rate": 4.560933531470987e-06, + "loss": 1.2416, + "step": 7163 + }, + { + "epoch": 0.22, + "learning_rate": 4.560795451607298e-06, + "loss": 1.1219, + "step": 7164 + }, + { + "epoch": 0.22, + "learning_rate": 4.560657352125828e-06, + "loss": 1.23, + "step": 7165 + }, + { + "epoch": 0.22, + "learning_rate": 4.560519233027893e-06, + "loss": 1.1633, + "step": 7166 + }, + { + "epoch": 0.22, + "learning_rate": 4.560381094314807e-06, + "loss": 1.2129, + "step": 7167 + }, + { + "epoch": 0.22, + "learning_rate": 4.5602429359878865e-06, + "loss": 1.1394, + "step": 7168 + }, + { + "epoch": 0.22, + "learning_rate": 4.560104758048444e-06, + "loss": 1.2101, + "step": 7169 + }, + { + "epoch": 0.22, + "learning_rate": 4.559966560497797e-06, + "loss": 1.1985, + "step": 7170 + }, + { + "epoch": 0.22, + "learning_rate": 4.5598283433372605e-06, + "loss": 1.1494, + "step": 7171 + }, + { + "epoch": 0.22, + "learning_rate": 4.559690106568151e-06, + "loss": 1.1707, + "step": 7172 + }, + { + "epoch": 0.22, + "learning_rate": 4.559551850191783e-06, + "loss": 1.1063, + "step": 7173 + }, + { + "epoch": 0.22, + "learning_rate": 4.559413574209472e-06, + "loss": 1.2478, + "step": 7174 + }, + { + "epoch": 0.22, + "learning_rate": 4.559275278622537e-06, + "loss": 1.0784, + "step": 7175 + }, + { + "epoch": 0.22, + "learning_rate": 4.559136963432292e-06, + "loss": 1.1321, + "step": 7176 + }, + { + "epoch": 0.22, + "learning_rate": 4.558998628640057e-06, + "loss": 1.1165, + "step": 7177 + }, + { + "epoch": 0.22, + "learning_rate": 4.558860274247145e-06, + "loss": 1.107, + "step": 7178 + }, + { + "epoch": 0.22, + "learning_rate": 4.558721900254875e-06, + "loss": 1.051, + "step": 7179 + }, + { + "epoch": 0.22, + "learning_rate": 4.558583506664564e-06, + "loss": 1.205, + "step": 7180 + }, + { + "epoch": 0.22, + "learning_rate": 4.5584450934775295e-06, + "loss": 1.0922, + "step": 7181 + }, + { + "epoch": 0.22, + "learning_rate": 4.55830666069509e-06, + "loss": 1.2334, + "step": 7182 + }, + { + "epoch": 0.22, + "learning_rate": 4.558168208318561e-06, + "loss": 1.0901, + "step": 7183 + }, + { + "epoch": 0.22, + "learning_rate": 4.558029736349263e-06, + "loss": 1.0823, + "step": 7184 + }, + { + "epoch": 0.22, + "learning_rate": 4.557891244788512e-06, + "loss": 1.1379, + "step": 7185 + }, + { + "epoch": 0.22, + "learning_rate": 4.557752733637628e-06, + "loss": 1.26, + "step": 7186 + }, + { + "epoch": 0.22, + "learning_rate": 4.55761420289793e-06, + "loss": 1.1077, + "step": 7187 + }, + { + "epoch": 0.22, + "learning_rate": 4.557475652570734e-06, + "loss": 1.0761, + "step": 7188 + }, + { + "epoch": 0.22, + "learning_rate": 4.557337082657361e-06, + "loss": 1.1455, + "step": 7189 + }, + { + "epoch": 0.22, + "learning_rate": 4.557198493159132e-06, + "loss": 1.0837, + "step": 7190 + }, + { + "epoch": 0.22, + "learning_rate": 4.557059884077362e-06, + "loss": 1.2288, + "step": 7191 + }, + { + "epoch": 0.22, + "learning_rate": 4.556921255413373e-06, + "loss": 1.2021, + "step": 7192 + }, + { + "epoch": 0.22, + "learning_rate": 4.5567826071684844e-06, + "loss": 1.1152, + "step": 7193 + }, + { + "epoch": 0.22, + "learning_rate": 4.556643939344016e-06, + "loss": 1.2323, + "step": 7194 + }, + { + "epoch": 0.22, + "learning_rate": 4.556505251941287e-06, + "loss": 1.1535, + "step": 7195 + }, + { + "epoch": 0.22, + "learning_rate": 4.55636654496162e-06, + "loss": 1.1361, + "step": 7196 + }, + { + "epoch": 0.22, + "learning_rate": 4.556227818406333e-06, + "loss": 1.1457, + "step": 7197 + }, + { + "epoch": 0.22, + "learning_rate": 4.556089072276748e-06, + "loss": 1.1626, + "step": 7198 + }, + { + "epoch": 0.22, + "learning_rate": 4.555950306574185e-06, + "loss": 1.2203, + "step": 7199 + }, + { + "epoch": 0.22, + "learning_rate": 4.555811521299965e-06, + "loss": 1.2722, + "step": 7200 + }, + { + "epoch": 0.22, + "learning_rate": 4.555672716455409e-06, + "loss": 1.1461, + "step": 7201 + }, + { + "epoch": 0.22, + "learning_rate": 4.55553389204184e-06, + "loss": 1.0963, + "step": 7202 + }, + { + "epoch": 0.22, + "learning_rate": 4.555395048060578e-06, + "loss": 1.0645, + "step": 7203 + }, + { + "epoch": 0.22, + "learning_rate": 4.555256184512944e-06, + "loss": 1.1747, + "step": 7204 + }, + { + "epoch": 0.22, + "learning_rate": 4.555117301400262e-06, + "loss": 1.1062, + "step": 7205 + }, + { + "epoch": 0.22, + "learning_rate": 4.5549783987238525e-06, + "loss": 1.1953, + "step": 7206 + }, + { + "epoch": 0.22, + "learning_rate": 4.554839476485039e-06, + "loss": 1.1086, + "step": 7207 + }, + { + "epoch": 0.22, + "learning_rate": 4.554700534685143e-06, + "loss": 1.0746, + "step": 7208 + }, + { + "epoch": 0.22, + "learning_rate": 4.5545615733254875e-06, + "loss": 1.11, + "step": 7209 + }, + { + "epoch": 0.22, + "learning_rate": 4.554422592407395e-06, + "loss": 1.0872, + "step": 7210 + }, + { + "epoch": 0.22, + "learning_rate": 4.5542835919321894e-06, + "loss": 1.2233, + "step": 7211 + }, + { + "epoch": 0.22, + "learning_rate": 4.554144571901193e-06, + "loss": 1.2457, + "step": 7212 + }, + { + "epoch": 0.22, + "learning_rate": 4.554005532315729e-06, + "loss": 1.0643, + "step": 7213 + }, + { + "epoch": 0.22, + "learning_rate": 4.5538664731771234e-06, + "loss": 1.0759, + "step": 7214 + }, + { + "epoch": 0.22, + "learning_rate": 4.553727394486697e-06, + "loss": 1.2444, + "step": 7215 + }, + { + "epoch": 0.22, + "learning_rate": 4.553588296245775e-06, + "loss": 1.2189, + "step": 7216 + }, + { + "epoch": 0.22, + "learning_rate": 4.5534491784556815e-06, + "loss": 1.201, + "step": 7217 + }, + { + "epoch": 0.22, + "learning_rate": 4.5533100411177405e-06, + "loss": 1.0563, + "step": 7218 + }, + { + "epoch": 0.22, + "learning_rate": 4.553170884233277e-06, + "loss": 1.1754, + "step": 7219 + }, + { + "epoch": 0.22, + "learning_rate": 4.553031707803616e-06, + "loss": 1.1019, + "step": 7220 + }, + { + "epoch": 0.22, + "learning_rate": 4.552892511830081e-06, + "loss": 1.1072, + "step": 7221 + }, + { + "epoch": 0.22, + "learning_rate": 4.552753296313998e-06, + "loss": 1.1859, + "step": 7222 + }, + { + "epoch": 0.22, + "learning_rate": 4.552614061256693e-06, + "loss": 1.1624, + "step": 7223 + }, + { + "epoch": 0.22, + "learning_rate": 4.55247480665949e-06, + "loss": 1.1705, + "step": 7224 + }, + { + "epoch": 0.22, + "learning_rate": 4.552335532523716e-06, + "loss": 1.0805, + "step": 7225 + }, + { + "epoch": 0.22, + "learning_rate": 4.552196238850696e-06, + "loss": 1.1627, + "step": 7226 + }, + { + "epoch": 0.22, + "learning_rate": 4.5520569256417566e-06, + "loss": 1.2104, + "step": 7227 + }, + { + "epoch": 0.22, + "learning_rate": 4.551917592898223e-06, + "loss": 1.1777, + "step": 7228 + }, + { + "epoch": 0.22, + "learning_rate": 4.551778240621422e-06, + "loss": 1.1783, + "step": 7229 + }, + { + "epoch": 0.22, + "learning_rate": 4.551638868812681e-06, + "loss": 1.1509, + "step": 7230 + }, + { + "epoch": 0.22, + "learning_rate": 4.5514994774733255e-06, + "loss": 1.3157, + "step": 7231 + }, + { + "epoch": 0.22, + "learning_rate": 4.551360066604683e-06, + "loss": 1.1525, + "step": 7232 + }, + { + "epoch": 0.22, + "learning_rate": 4.551220636208081e-06, + "loss": 1.0916, + "step": 7233 + }, + { + "epoch": 0.22, + "learning_rate": 4.551081186284847e-06, + "loss": 1.1195, + "step": 7234 + }, + { + "epoch": 0.22, + "learning_rate": 4.550941716836306e-06, + "loss": 1.2406, + "step": 7235 + }, + { + "epoch": 0.22, + "learning_rate": 4.550802227863788e-06, + "loss": 1.2299, + "step": 7236 + }, + { + "epoch": 0.22, + "learning_rate": 4.550662719368622e-06, + "loss": 1.0419, + "step": 7237 + }, + { + "epoch": 0.22, + "learning_rate": 4.550523191352134e-06, + "loss": 1.0684, + "step": 7238 + }, + { + "epoch": 0.22, + "learning_rate": 4.550383643815653e-06, + "loss": 1.1151, + "step": 7239 + }, + { + "epoch": 0.22, + "learning_rate": 4.550244076760507e-06, + "loss": 1.0557, + "step": 7240 + }, + { + "epoch": 0.22, + "learning_rate": 4.550104490188024e-06, + "loss": 1.1562, + "step": 7241 + }, + { + "epoch": 0.22, + "learning_rate": 4.5499648840995346e-06, + "loss": 1.2594, + "step": 7242 + }, + { + "epoch": 0.22, + "learning_rate": 4.549825258496366e-06, + "loss": 1.1762, + "step": 7243 + }, + { + "epoch": 0.22, + "learning_rate": 4.5496856133798494e-06, + "loss": 1.2548, + "step": 7244 + }, + { + "epoch": 0.22, + "learning_rate": 4.549545948751312e-06, + "loss": 1.1442, + "step": 7245 + }, + { + "epoch": 0.22, + "learning_rate": 4.5494062646120845e-06, + "loss": 1.2076, + "step": 7246 + }, + { + "epoch": 0.22, + "learning_rate": 4.549266560963497e-06, + "loss": 1.0754, + "step": 7247 + }, + { + "epoch": 0.22, + "learning_rate": 4.549126837806878e-06, + "loss": 1.1815, + "step": 7248 + }, + { + "epoch": 0.22, + "learning_rate": 4.548987095143558e-06, + "loss": 1.1144, + "step": 7249 + }, + { + "epoch": 0.22, + "learning_rate": 4.5488473329748686e-06, + "loss": 1.1133, + "step": 7250 + }, + { + "epoch": 0.22, + "learning_rate": 4.5487075513021385e-06, + "loss": 1.0976, + "step": 7251 + }, + { + "epoch": 0.22, + "learning_rate": 4.548567750126699e-06, + "loss": 1.0555, + "step": 7252 + }, + { + "epoch": 0.22, + "learning_rate": 4.548427929449882e-06, + "loss": 1.0805, + "step": 7253 + }, + { + "epoch": 0.22, + "learning_rate": 4.548288089273018e-06, + "loss": 1.158, + "step": 7254 + }, + { + "epoch": 0.22, + "learning_rate": 4.548148229597437e-06, + "loss": 1.2196, + "step": 7255 + }, + { + "epoch": 0.22, + "learning_rate": 4.548008350424472e-06, + "loss": 1.2257, + "step": 7256 + }, + { + "epoch": 0.22, + "learning_rate": 4.5478684517554536e-06, + "loss": 1.0798, + "step": 7257 + }, + { + "epoch": 0.22, + "learning_rate": 4.547728533591713e-06, + "loss": 1.0659, + "step": 7258 + }, + { + "epoch": 0.22, + "learning_rate": 4.5475885959345845e-06, + "loss": 1.1605, + "step": 7259 + }, + { + "epoch": 0.22, + "learning_rate": 4.547448638785398e-06, + "loss": 1.1611, + "step": 7260 + }, + { + "epoch": 0.22, + "learning_rate": 4.547308662145486e-06, + "loss": 1.2012, + "step": 7261 + }, + { + "epoch": 0.22, + "learning_rate": 4.547168666016182e-06, + "loss": 1.3, + "step": 7262 + }, + { + "epoch": 0.22, + "learning_rate": 4.547028650398818e-06, + "loss": 1.1627, + "step": 7263 + }, + { + "epoch": 0.22, + "learning_rate": 4.546888615294728e-06, + "loss": 1.1221, + "step": 7264 + }, + { + "epoch": 0.22, + "learning_rate": 4.546748560705243e-06, + "loss": 1.0696, + "step": 7265 + }, + { + "epoch": 0.22, + "learning_rate": 4.546608486631698e-06, + "loss": 1.0871, + "step": 7266 + }, + { + "epoch": 0.22, + "learning_rate": 4.546468393075426e-06, + "loss": 1.1196, + "step": 7267 + }, + { + "epoch": 0.22, + "learning_rate": 4.546328280037761e-06, + "loss": 1.1524, + "step": 7268 + }, + { + "epoch": 0.22, + "learning_rate": 4.546188147520035e-06, + "loss": 1.166, + "step": 7269 + }, + { + "epoch": 0.22, + "learning_rate": 4.546047995523584e-06, + "loss": 1.0015, + "step": 7270 + }, + { + "epoch": 0.22, + "learning_rate": 4.5459078240497416e-06, + "loss": 1.1092, + "step": 7271 + }, + { + "epoch": 0.22, + "learning_rate": 4.545767633099843e-06, + "loss": 1.1268, + "step": 7272 + }, + { + "epoch": 0.22, + "learning_rate": 4.54562742267522e-06, + "loss": 1.1426, + "step": 7273 + }, + { + "epoch": 0.22, + "learning_rate": 4.54548719277721e-06, + "loss": 1.2057, + "step": 7274 + }, + { + "epoch": 0.22, + "learning_rate": 4.545346943407148e-06, + "loss": 1.1622, + "step": 7275 + }, + { + "epoch": 0.22, + "learning_rate": 4.545206674566366e-06, + "loss": 1.1655, + "step": 7276 + }, + { + "epoch": 0.22, + "learning_rate": 4.545066386256203e-06, + "loss": 1.1622, + "step": 7277 + }, + { + "epoch": 0.22, + "learning_rate": 4.544926078477993e-06, + "loss": 1.1016, + "step": 7278 + }, + { + "epoch": 0.22, + "learning_rate": 4.544785751233071e-06, + "loss": 1.276, + "step": 7279 + }, + { + "epoch": 0.22, + "learning_rate": 4.544645404522773e-06, + "loss": 1.2865, + "step": 7280 + }, + { + "epoch": 0.22, + "learning_rate": 4.5445050383484365e-06, + "loss": 1.2736, + "step": 7281 + }, + { + "epoch": 0.22, + "learning_rate": 4.544364652711396e-06, + "loss": 1.1566, + "step": 7282 + }, + { + "epoch": 0.22, + "learning_rate": 4.544224247612989e-06, + "loss": 1.1534, + "step": 7283 + }, + { + "epoch": 0.22, + "learning_rate": 4.544083823054552e-06, + "loss": 1.2037, + "step": 7284 + }, + { + "epoch": 0.22, + "learning_rate": 4.543943379037421e-06, + "loss": 1.1824, + "step": 7285 + }, + { + "epoch": 0.22, + "learning_rate": 4.543802915562934e-06, + "loss": 1.1625, + "step": 7286 + }, + { + "epoch": 0.22, + "learning_rate": 4.5436624326324265e-06, + "loss": 1.2208, + "step": 7287 + }, + { + "epoch": 0.22, + "learning_rate": 4.543521930247237e-06, + "loss": 1.0106, + "step": 7288 + }, + { + "epoch": 0.22, + "learning_rate": 4.543381408408704e-06, + "loss": 1.1486, + "step": 7289 + }, + { + "epoch": 0.22, + "learning_rate": 4.543240867118164e-06, + "loss": 1.0827, + "step": 7290 + }, + { + "epoch": 0.22, + "learning_rate": 4.543100306376954e-06, + "loss": 1.1819, + "step": 7291 + }, + { + "epoch": 0.22, + "learning_rate": 4.5429597261864135e-06, + "loss": 1.2017, + "step": 7292 + }, + { + "epoch": 0.22, + "learning_rate": 4.5428191265478805e-06, + "loss": 1.3162, + "step": 7293 + }, + { + "epoch": 0.22, + "learning_rate": 4.542678507462693e-06, + "loss": 1.1752, + "step": 7294 + }, + { + "epoch": 0.22, + "learning_rate": 4.542537868932191e-06, + "loss": 1.186, + "step": 7295 + }, + { + "epoch": 0.22, + "learning_rate": 4.542397210957711e-06, + "loss": 1.1982, + "step": 7296 + }, + { + "epoch": 0.22, + "learning_rate": 4.542256533540594e-06, + "loss": 1.0609, + "step": 7297 + }, + { + "epoch": 0.22, + "learning_rate": 4.542115836682177e-06, + "loss": 1.2584, + "step": 7298 + }, + { + "epoch": 0.22, + "learning_rate": 4.541975120383803e-06, + "loss": 1.3094, + "step": 7299 + }, + { + "epoch": 0.22, + "learning_rate": 4.5418343846468076e-06, + "loss": 1.146, + "step": 7300 + }, + { + "epoch": 0.22, + "learning_rate": 4.541693629472532e-06, + "loss": 1.0342, + "step": 7301 + }, + { + "epoch": 0.22, + "learning_rate": 4.541552854862317e-06, + "loss": 1.0256, + "step": 7302 + }, + { + "epoch": 0.22, + "learning_rate": 4.541412060817502e-06, + "loss": 1.175, + "step": 7303 + }, + { + "epoch": 0.22, + "learning_rate": 4.541271247339428e-06, + "loss": 1.1192, + "step": 7304 + }, + { + "epoch": 0.22, + "learning_rate": 4.541130414429434e-06, + "loss": 1.1479, + "step": 7305 + }, + { + "epoch": 0.22, + "learning_rate": 4.540989562088861e-06, + "loss": 1.2076, + "step": 7306 + }, + { + "epoch": 0.22, + "learning_rate": 4.540848690319052e-06, + "loss": 1.0611, + "step": 7307 + }, + { + "epoch": 0.22, + "learning_rate": 4.5407077991213455e-06, + "loss": 1.0609, + "step": 7308 + }, + { + "epoch": 0.22, + "learning_rate": 4.540566888497083e-06, + "loss": 1.1371, + "step": 7309 + }, + { + "epoch": 0.22, + "learning_rate": 4.540425958447607e-06, + "loss": 1.1115, + "step": 7310 + }, + { + "epoch": 0.22, + "learning_rate": 4.540285008974259e-06, + "loss": 1.1973, + "step": 7311 + }, + { + "epoch": 0.22, + "learning_rate": 4.54014404007838e-06, + "loss": 1.1588, + "step": 7312 + }, + { + "epoch": 0.22, + "learning_rate": 4.540003051761312e-06, + "loss": 1.2568, + "step": 7313 + }, + { + "epoch": 0.22, + "learning_rate": 4.539862044024398e-06, + "loss": 1.1546, + "step": 7314 + }, + { + "epoch": 0.22, + "learning_rate": 4.5397210168689795e-06, + "loss": 1.1782, + "step": 7315 + }, + { + "epoch": 0.22, + "learning_rate": 4.539579970296399e-06, + "loss": 1.1844, + "step": 7316 + }, + { + "epoch": 0.22, + "learning_rate": 4.5394389043080004e-06, + "loss": 1.22, + "step": 7317 + }, + { + "epoch": 0.22, + "learning_rate": 4.539297818905124e-06, + "loss": 1.2021, + "step": 7318 + }, + { + "epoch": 0.22, + "learning_rate": 4.5391567140891155e-06, + "loss": 1.1196, + "step": 7319 + }, + { + "epoch": 0.22, + "learning_rate": 4.539015589861318e-06, + "loss": 1.1156, + "step": 7320 + }, + { + "epoch": 0.22, + "learning_rate": 4.538874446223073e-06, + "loss": 1.1896, + "step": 7321 + }, + { + "epoch": 0.22, + "learning_rate": 4.5387332831757254e-06, + "loss": 1.1238, + "step": 7322 + }, + { + "epoch": 0.22, + "learning_rate": 4.538592100720619e-06, + "loss": 1.1065, + "step": 7323 + }, + { + "epoch": 0.22, + "learning_rate": 4.5384508988590975e-06, + "loss": 1.1287, + "step": 7324 + }, + { + "epoch": 0.22, + "learning_rate": 4.538309677592505e-06, + "loss": 1.1084, + "step": 7325 + }, + { + "epoch": 0.22, + "learning_rate": 4.538168436922187e-06, + "loss": 0.9809, + "step": 7326 + }, + { + "epoch": 0.22, + "learning_rate": 4.538027176849487e-06, + "loss": 1.108, + "step": 7327 + }, + { + "epoch": 0.22, + "learning_rate": 4.537885897375749e-06, + "loss": 1.1664, + "step": 7328 + }, + { + "epoch": 0.22, + "learning_rate": 4.5377445985023185e-06, + "loss": 1.1522, + "step": 7329 + }, + { + "epoch": 0.22, + "learning_rate": 4.537603280230542e-06, + "loss": 1.272, + "step": 7330 + }, + { + "epoch": 0.22, + "learning_rate": 4.537461942561762e-06, + "loss": 1.12, + "step": 7331 + }, + { + "epoch": 0.22, + "learning_rate": 4.537320585497327e-06, + "loss": 1.0946, + "step": 7332 + }, + { + "epoch": 0.22, + "learning_rate": 4.5371792090385805e-06, + "loss": 1.1329, + "step": 7333 + }, + { + "epoch": 0.22, + "learning_rate": 4.53703781318687e-06, + "loss": 1.1012, + "step": 7334 + }, + { + "epoch": 0.22, + "learning_rate": 4.53689639794354e-06, + "loss": 1.1056, + "step": 7335 + }, + { + "epoch": 0.22, + "learning_rate": 4.536754963309937e-06, + "loss": 1.0726, + "step": 7336 + }, + { + "epoch": 0.22, + "learning_rate": 4.536613509287407e-06, + "loss": 1.2129, + "step": 7337 + }, + { + "epoch": 0.22, + "learning_rate": 4.536472035877298e-06, + "loss": 1.1987, + "step": 7338 + }, + { + "epoch": 0.22, + "learning_rate": 4.5363305430809565e-06, + "loss": 1.1017, + "step": 7339 + }, + { + "epoch": 0.22, + "learning_rate": 4.5361890308997295e-06, + "loss": 1.182, + "step": 7340 + }, + { + "epoch": 0.22, + "learning_rate": 4.5360474993349625e-06, + "loss": 1.1692, + "step": 7341 + }, + { + "epoch": 0.22, + "learning_rate": 4.535905948388004e-06, + "loss": 1.0915, + "step": 7342 + }, + { + "epoch": 0.22, + "learning_rate": 4.535764378060201e-06, + "loss": 1.2443, + "step": 7343 + }, + { + "epoch": 0.22, + "learning_rate": 4.535622788352902e-06, + "loss": 1.0411, + "step": 7344 + }, + { + "epoch": 0.22, + "learning_rate": 4.5354811792674545e-06, + "loss": 1.1406, + "step": 7345 + }, + { + "epoch": 0.22, + "learning_rate": 4.535339550805207e-06, + "loss": 1.1108, + "step": 7346 + }, + { + "epoch": 0.22, + "learning_rate": 4.535197902967506e-06, + "loss": 1.0869, + "step": 7347 + }, + { + "epoch": 0.22, + "learning_rate": 4.535056235755703e-06, + "loss": 1.0566, + "step": 7348 + }, + { + "epoch": 0.22, + "learning_rate": 4.5349145491711436e-06, + "loss": 1.1481, + "step": 7349 + }, + { + "epoch": 0.22, + "learning_rate": 4.534772843215178e-06, + "loss": 1.1918, + "step": 7350 + }, + { + "epoch": 0.22, + "learning_rate": 4.534631117889154e-06, + "loss": 1.1287, + "step": 7351 + }, + { + "epoch": 0.22, + "learning_rate": 4.534489373194423e-06, + "loss": 1.0646, + "step": 7352 + }, + { + "epoch": 0.22, + "learning_rate": 4.534347609132332e-06, + "loss": 1.1409, + "step": 7353 + }, + { + "epoch": 0.22, + "learning_rate": 4.534205825704232e-06, + "loss": 1.1708, + "step": 7354 + }, + { + "epoch": 0.22, + "learning_rate": 4.5340640229114715e-06, + "loss": 1.2567, + "step": 7355 + }, + { + "epoch": 0.22, + "learning_rate": 4.533922200755403e-06, + "loss": 1.1818, + "step": 7356 + }, + { + "epoch": 0.22, + "learning_rate": 4.533780359237373e-06, + "loss": 1.0815, + "step": 7357 + }, + { + "epoch": 0.22, + "learning_rate": 4.533638498358734e-06, + "loss": 1.147, + "step": 7358 + }, + { + "epoch": 0.22, + "learning_rate": 4.533496618120836e-06, + "loss": 1.1263, + "step": 7359 + }, + { + "epoch": 0.22, + "learning_rate": 4.533354718525029e-06, + "loss": 1.1705, + "step": 7360 + }, + { + "epoch": 0.22, + "learning_rate": 4.533212799572666e-06, + "loss": 1.2018, + "step": 7361 + }, + { + "epoch": 0.22, + "learning_rate": 4.533070861265095e-06, + "loss": 1.1476, + "step": 7362 + }, + { + "epoch": 0.22, + "learning_rate": 4.532928903603668e-06, + "loss": 1.1458, + "step": 7363 + }, + { + "epoch": 0.22, + "learning_rate": 4.5327869265897385e-06, + "loss": 1.2256, + "step": 7364 + }, + { + "epoch": 0.22, + "learning_rate": 4.532644930224656e-06, + "loss": 1.105, + "step": 7365 + }, + { + "epoch": 0.22, + "learning_rate": 4.532502914509772e-06, + "loss": 1.053, + "step": 7366 + }, + { + "epoch": 0.22, + "learning_rate": 4.53236087944644e-06, + "loss": 1.2971, + "step": 7367 + }, + { + "epoch": 0.22, + "learning_rate": 4.53221882503601e-06, + "loss": 1.3905, + "step": 7368 + }, + { + "epoch": 0.22, + "learning_rate": 4.532076751279837e-06, + "loss": 1.1563, + "step": 7369 + }, + { + "epoch": 0.22, + "learning_rate": 4.531934658179271e-06, + "loss": 1.1879, + "step": 7370 + }, + { + "epoch": 0.22, + "learning_rate": 4.531792545735667e-06, + "loss": 1.0984, + "step": 7371 + }, + { + "epoch": 0.22, + "learning_rate": 4.531650413950375e-06, + "loss": 1.1737, + "step": 7372 + }, + { + "epoch": 0.22, + "learning_rate": 4.5315082628247495e-06, + "loss": 1.2487, + "step": 7373 + }, + { + "epoch": 0.22, + "learning_rate": 4.531366092360145e-06, + "loss": 1.1202, + "step": 7374 + }, + { + "epoch": 0.22, + "learning_rate": 4.531223902557913e-06, + "loss": 1.136, + "step": 7375 + }, + { + "epoch": 0.22, + "learning_rate": 4.531081693419408e-06, + "loss": 1.1937, + "step": 7376 + }, + { + "epoch": 0.22, + "learning_rate": 4.530939464945983e-06, + "loss": 1.0874, + "step": 7377 + }, + { + "epoch": 0.22, + "learning_rate": 4.5307972171389925e-06, + "loss": 1.1557, + "step": 7378 + }, + { + "epoch": 0.22, + "learning_rate": 4.530654949999791e-06, + "loss": 1.0769, + "step": 7379 + }, + { + "epoch": 0.22, + "learning_rate": 4.530512663529732e-06, + "loss": 1.1334, + "step": 7380 + }, + { + "epoch": 0.22, + "learning_rate": 4.53037035773017e-06, + "loss": 1.1017, + "step": 7381 + }, + { + "epoch": 0.22, + "learning_rate": 4.530228032602461e-06, + "loss": 1.2406, + "step": 7382 + }, + { + "epoch": 0.22, + "learning_rate": 4.530085688147958e-06, + "loss": 1.1112, + "step": 7383 + }, + { + "epoch": 0.22, + "learning_rate": 4.529943324368018e-06, + "loss": 1.0766, + "step": 7384 + }, + { + "epoch": 0.22, + "learning_rate": 4.529800941263994e-06, + "loss": 1.1319, + "step": 7385 + }, + { + "epoch": 0.22, + "learning_rate": 4.529658538837243e-06, + "loss": 1.0692, + "step": 7386 + }, + { + "epoch": 0.22, + "learning_rate": 4.529516117089121e-06, + "loss": 1.2361, + "step": 7387 + }, + { + "epoch": 0.22, + "learning_rate": 4.529373676020982e-06, + "loss": 1.1062, + "step": 7388 + }, + { + "epoch": 0.22, + "learning_rate": 4.529231215634183e-06, + "loss": 1.2086, + "step": 7389 + }, + { + "epoch": 0.22, + "learning_rate": 4.529088735930081e-06, + "loss": 1.0651, + "step": 7390 + }, + { + "epoch": 0.22, + "learning_rate": 4.528946236910031e-06, + "loss": 1.1638, + "step": 7391 + }, + { + "epoch": 0.22, + "learning_rate": 4.52880371857539e-06, + "loss": 1.2653, + "step": 7392 + }, + { + "epoch": 0.22, + "learning_rate": 4.528661180927515e-06, + "loss": 0.9892, + "step": 7393 + }, + { + "epoch": 0.22, + "learning_rate": 4.5285186239677625e-06, + "loss": 1.0499, + "step": 7394 + }, + { + "epoch": 0.22, + "learning_rate": 4.528376047697489e-06, + "loss": 1.1569, + "step": 7395 + }, + { + "epoch": 0.22, + "learning_rate": 4.5282334521180534e-06, + "loss": 1.099, + "step": 7396 + }, + { + "epoch": 0.22, + "learning_rate": 4.528090837230812e-06, + "loss": 1.1897, + "step": 7397 + }, + { + "epoch": 0.22, + "learning_rate": 4.527948203037122e-06, + "loss": 1.1088, + "step": 7398 + }, + { + "epoch": 0.22, + "learning_rate": 4.527805549538343e-06, + "loss": 1.1896, + "step": 7399 + }, + { + "epoch": 0.22, + "learning_rate": 4.52766287673583e-06, + "loss": 1.2898, + "step": 7400 + }, + { + "epoch": 0.22, + "learning_rate": 4.527520184630944e-06, + "loss": 1.111, + "step": 7401 + }, + { + "epoch": 0.22, + "learning_rate": 4.527377473225042e-06, + "loss": 0.9574, + "step": 7402 + }, + { + "epoch": 0.22, + "learning_rate": 4.527234742519483e-06, + "loss": 1.2298, + "step": 7403 + }, + { + "epoch": 0.22, + "learning_rate": 4.527091992515625e-06, + "loss": 1.2787, + "step": 7404 + }, + { + "epoch": 0.22, + "learning_rate": 4.526949223214829e-06, + "loss": 1.1545, + "step": 7405 + }, + { + "epoch": 0.22, + "learning_rate": 4.526806434618452e-06, + "loss": 1.2998, + "step": 7406 + }, + { + "epoch": 0.22, + "learning_rate": 4.526663626727853e-06, + "loss": 1.127, + "step": 7407 + }, + { + "epoch": 0.22, + "learning_rate": 4.5265207995443935e-06, + "loss": 1.0761, + "step": 7408 + }, + { + "epoch": 0.22, + "learning_rate": 4.526377953069432e-06, + "loss": 1.1735, + "step": 7409 + }, + { + "epoch": 0.22, + "learning_rate": 4.526235087304327e-06, + "loss": 1.068, + "step": 7410 + }, + { + "epoch": 0.22, + "learning_rate": 4.526092202250441e-06, + "loss": 1.0234, + "step": 7411 + }, + { + "epoch": 0.22, + "learning_rate": 4.525949297909132e-06, + "loss": 1.2395, + "step": 7412 + }, + { + "epoch": 0.22, + "learning_rate": 4.5258063742817625e-06, + "loss": 1.07, + "step": 7413 + }, + { + "epoch": 0.22, + "learning_rate": 4.5256634313696915e-06, + "loss": 1.147, + "step": 7414 + }, + { + "epoch": 0.22, + "learning_rate": 4.52552046917428e-06, + "loss": 1.1031, + "step": 7415 + }, + { + "epoch": 0.22, + "learning_rate": 4.5253774876968905e-06, + "loss": 1.132, + "step": 7416 + }, + { + "epoch": 0.22, + "learning_rate": 4.525234486938881e-06, + "loss": 1.2599, + "step": 7417 + }, + { + "epoch": 0.22, + "learning_rate": 4.525091466901615e-06, + "loss": 1.2117, + "step": 7418 + }, + { + "epoch": 0.22, + "learning_rate": 4.524948427586454e-06, + "loss": 1.0938, + "step": 7419 + }, + { + "epoch": 0.22, + "learning_rate": 4.52480536899476e-06, + "loss": 1.1113, + "step": 7420 + }, + { + "epoch": 0.22, + "learning_rate": 4.524662291127892e-06, + "loss": 1.098, + "step": 7421 + }, + { + "epoch": 0.22, + "learning_rate": 4.524519193987215e-06, + "loss": 1.0061, + "step": 7422 + }, + { + "epoch": 0.22, + "learning_rate": 4.524376077574092e-06, + "loss": 1.1456, + "step": 7423 + }, + { + "epoch": 0.22, + "learning_rate": 4.5242329418898816e-06, + "loss": 1.1642, + "step": 7424 + }, + { + "epoch": 0.22, + "learning_rate": 4.52408978693595e-06, + "loss": 1.2206, + "step": 7425 + }, + { + "epoch": 0.22, + "learning_rate": 4.5239466127136576e-06, + "loss": 1.0943, + "step": 7426 + }, + { + "epoch": 0.22, + "learning_rate": 4.523803419224368e-06, + "loss": 1.2423, + "step": 7427 + }, + { + "epoch": 0.22, + "learning_rate": 4.5236602064694446e-06, + "loss": 1.1542, + "step": 7428 + }, + { + "epoch": 0.22, + "learning_rate": 4.5235169744502505e-06, + "loss": 1.225, + "step": 7429 + }, + { + "epoch": 0.22, + "learning_rate": 4.52337372316815e-06, + "loss": 1.2388, + "step": 7430 + }, + { + "epoch": 0.22, + "learning_rate": 4.5232304526245065e-06, + "loss": 1.041, + "step": 7431 + }, + { + "epoch": 0.22, + "learning_rate": 4.523087162820682e-06, + "loss": 1.0942, + "step": 7432 + }, + { + "epoch": 0.22, + "learning_rate": 4.522943853758044e-06, + "loss": 1.1461, + "step": 7433 + }, + { + "epoch": 0.22, + "learning_rate": 4.522800525437953e-06, + "loss": 1.1868, + "step": 7434 + }, + { + "epoch": 0.22, + "learning_rate": 4.5226571778617755e-06, + "loss": 1.2327, + "step": 7435 + }, + { + "epoch": 0.22, + "learning_rate": 4.522513811030877e-06, + "loss": 1.1857, + "step": 7436 + }, + { + "epoch": 0.22, + "learning_rate": 4.522370424946621e-06, + "loss": 1.1082, + "step": 7437 + }, + { + "epoch": 0.22, + "learning_rate": 4.5222270196103715e-06, + "loss": 1.0386, + "step": 7438 + }, + { + "epoch": 0.22, + "learning_rate": 4.522083595023495e-06, + "loss": 1.1154, + "step": 7439 + }, + { + "epoch": 0.22, + "learning_rate": 4.521940151187356e-06, + "loss": 1.0502, + "step": 7440 + }, + { + "epoch": 0.22, + "learning_rate": 4.521796688103321e-06, + "loss": 1.2194, + "step": 7441 + }, + { + "epoch": 0.22, + "learning_rate": 4.5216532057727564e-06, + "loss": 1.0879, + "step": 7442 + }, + { + "epoch": 0.22, + "learning_rate": 4.521509704197026e-06, + "loss": 1.0914, + "step": 7443 + }, + { + "epoch": 0.22, + "learning_rate": 4.521366183377497e-06, + "loss": 1.1417, + "step": 7444 + }, + { + "epoch": 0.22, + "learning_rate": 4.521222643315535e-06, + "loss": 1.1689, + "step": 7445 + }, + { + "epoch": 0.22, + "learning_rate": 4.521079084012507e-06, + "loss": 1.1313, + "step": 7446 + }, + { + "epoch": 0.22, + "learning_rate": 4.52093550546978e-06, + "loss": 1.0848, + "step": 7447 + }, + { + "epoch": 0.22, + "learning_rate": 4.5207919076887195e-06, + "loss": 1.1973, + "step": 7448 + }, + { + "epoch": 0.22, + "learning_rate": 4.520648290670694e-06, + "loss": 1.3463, + "step": 7449 + }, + { + "epoch": 0.22, + "learning_rate": 4.52050465441707e-06, + "loss": 1.0508, + "step": 7450 + }, + { + "epoch": 0.22, + "learning_rate": 4.520360998929215e-06, + "loss": 1.0932, + "step": 7451 + }, + { + "epoch": 0.22, + "learning_rate": 4.5202173242084956e-06, + "loss": 1.1338, + "step": 7452 + }, + { + "epoch": 0.22, + "learning_rate": 4.520073630256281e-06, + "loss": 1.0635, + "step": 7453 + }, + { + "epoch": 0.22, + "learning_rate": 4.519929917073937e-06, + "loss": 1.1199, + "step": 7454 + }, + { + "epoch": 0.22, + "learning_rate": 4.519786184662834e-06, + "loss": 1.2295, + "step": 7455 + }, + { + "epoch": 0.22, + "learning_rate": 4.5196424330243395e-06, + "loss": 1.0961, + "step": 7456 + }, + { + "epoch": 0.22, + "learning_rate": 4.519498662159822e-06, + "loss": 1.1172, + "step": 7457 + }, + { + "epoch": 0.22, + "learning_rate": 4.5193548720706486e-06, + "loss": 1.1494, + "step": 7458 + }, + { + "epoch": 0.22, + "learning_rate": 4.51921106275819e-06, + "loss": 1.0649, + "step": 7459 + }, + { + "epoch": 0.22, + "learning_rate": 4.519067234223815e-06, + "loss": 1.1188, + "step": 7460 + }, + { + "epoch": 0.22, + "learning_rate": 4.518923386468891e-06, + "loss": 1.1302, + "step": 7461 + }, + { + "epoch": 0.22, + "learning_rate": 4.518779519494791e-06, + "loss": 1.1596, + "step": 7462 + }, + { + "epoch": 0.22, + "learning_rate": 4.5186356333028806e-06, + "loss": 1.1259, + "step": 7463 + }, + { + "epoch": 0.22, + "learning_rate": 4.5184917278945305e-06, + "loss": 1.151, + "step": 7464 + }, + { + "epoch": 0.22, + "learning_rate": 4.518347803271113e-06, + "loss": 1.0501, + "step": 7465 + }, + { + "epoch": 0.22, + "learning_rate": 4.518203859433996e-06, + "loss": 1.1553, + "step": 7466 + }, + { + "epoch": 0.22, + "learning_rate": 4.51805989638455e-06, + "loss": 1.1721, + "step": 7467 + }, + { + "epoch": 0.22, + "learning_rate": 4.517915914124145e-06, + "loss": 1.1813, + "step": 7468 + }, + { + "epoch": 0.23, + "learning_rate": 4.517771912654153e-06, + "loss": 1.1461, + "step": 7469 + }, + { + "epoch": 0.23, + "learning_rate": 4.517627891975945e-06, + "loss": 1.1256, + "step": 7470 + }, + { + "epoch": 0.23, + "learning_rate": 4.517483852090891e-06, + "loss": 1.1556, + "step": 7471 + }, + { + "epoch": 0.23, + "learning_rate": 4.517339793000361e-06, + "loss": 1.131, + "step": 7472 + }, + { + "epoch": 0.23, + "learning_rate": 4.517195714705728e-06, + "loss": 1.2159, + "step": 7473 + }, + { + "epoch": 0.23, + "learning_rate": 4.517051617208365e-06, + "loss": 1.2264, + "step": 7474 + }, + { + "epoch": 0.23, + "learning_rate": 4.516907500509641e-06, + "loss": 1.3211, + "step": 7475 + }, + { + "epoch": 0.23, + "learning_rate": 4.516763364610929e-06, + "loss": 1.1399, + "step": 7476 + }, + { + "epoch": 0.23, + "learning_rate": 4.5166192095136e-06, + "loss": 1.1653, + "step": 7477 + }, + { + "epoch": 0.23, + "learning_rate": 4.516475035219029e-06, + "loss": 1.0685, + "step": 7478 + }, + { + "epoch": 0.23, + "learning_rate": 4.516330841728585e-06, + "loss": 1.1016, + "step": 7479 + }, + { + "epoch": 0.23, + "learning_rate": 4.516186629043645e-06, + "loss": 1.1709, + "step": 7480 + }, + { + "epoch": 0.23, + "learning_rate": 4.516042397165577e-06, + "loss": 1.2007, + "step": 7481 + }, + { + "epoch": 0.23, + "learning_rate": 4.515898146095758e-06, + "loss": 1.2156, + "step": 7482 + }, + { + "epoch": 0.23, + "learning_rate": 4.515753875835559e-06, + "loss": 1.1807, + "step": 7483 + }, + { + "epoch": 0.23, + "learning_rate": 4.515609586386354e-06, + "loss": 1.1263, + "step": 7484 + }, + { + "epoch": 0.23, + "learning_rate": 4.515465277749516e-06, + "loss": 1.1174, + "step": 7485 + }, + { + "epoch": 0.23, + "learning_rate": 4.51532094992642e-06, + "loss": 1.2465, + "step": 7486 + }, + { + "epoch": 0.23, + "learning_rate": 4.515176602918439e-06, + "loss": 1.0689, + "step": 7487 + }, + { + "epoch": 0.23, + "learning_rate": 4.515032236726946e-06, + "loss": 1.1005, + "step": 7488 + }, + { + "epoch": 0.23, + "learning_rate": 4.514887851353318e-06, + "loss": 1.1141, + "step": 7489 + }, + { + "epoch": 0.23, + "learning_rate": 4.514743446798927e-06, + "loss": 1.1354, + "step": 7490 + }, + { + "epoch": 0.23, + "learning_rate": 4.51459902306515e-06, + "loss": 1.0775, + "step": 7491 + }, + { + "epoch": 0.23, + "learning_rate": 4.51445458015336e-06, + "loss": 1.0758, + "step": 7492 + }, + { + "epoch": 0.23, + "learning_rate": 4.5143101180649325e-06, + "loss": 1.1146, + "step": 7493 + }, + { + "epoch": 0.23, + "learning_rate": 4.5141656368012425e-06, + "loss": 1.1943, + "step": 7494 + }, + { + "epoch": 0.23, + "learning_rate": 4.514021136363667e-06, + "loss": 1.1109, + "step": 7495 + }, + { + "epoch": 0.23, + "learning_rate": 4.513876616753579e-06, + "loss": 1.1692, + "step": 7496 + }, + { + "epoch": 0.23, + "learning_rate": 4.513732077972355e-06, + "loss": 1.1118, + "step": 7497 + }, + { + "epoch": 0.23, + "learning_rate": 4.513587520021372e-06, + "loss": 1.0252, + "step": 7498 + }, + { + "epoch": 0.23, + "learning_rate": 4.513442942902006e-06, + "loss": 1.3154, + "step": 7499 + }, + { + "epoch": 0.23, + "learning_rate": 4.513298346615633e-06, + "loss": 1.0869, + "step": 7500 + }, + { + "epoch": 0.23, + "learning_rate": 4.513153731163628e-06, + "loss": 1.1031, + "step": 7501 + }, + { + "epoch": 0.23, + "learning_rate": 4.513009096547372e-06, + "loss": 1.072, + "step": 7502 + }, + { + "epoch": 0.23, + "learning_rate": 4.512864442768236e-06, + "loss": 1.1451, + "step": 7503 + }, + { + "epoch": 0.23, + "learning_rate": 4.512719769827601e-06, + "loss": 1.1941, + "step": 7504 + }, + { + "epoch": 0.23, + "learning_rate": 4.512575077726843e-06, + "loss": 1.2285, + "step": 7505 + }, + { + "epoch": 0.23, + "learning_rate": 4.51243036646734e-06, + "loss": 1.0479, + "step": 7506 + }, + { + "epoch": 0.23, + "learning_rate": 4.512285636050469e-06, + "loss": 1.1229, + "step": 7507 + }, + { + "epoch": 0.23, + "learning_rate": 4.512140886477608e-06, + "loss": 1.1266, + "step": 7508 + }, + { + "epoch": 0.23, + "learning_rate": 4.5119961177501344e-06, + "loss": 1.0493, + "step": 7509 + }, + { + "epoch": 0.23, + "learning_rate": 4.511851329869427e-06, + "loss": 1.1524, + "step": 7510 + }, + { + "epoch": 0.23, + "learning_rate": 4.5117065228368636e-06, + "loss": 1.2069, + "step": 7511 + }, + { + "epoch": 0.23, + "learning_rate": 4.511561696653823e-06, + "loss": 1.1716, + "step": 7512 + }, + { + "epoch": 0.23, + "learning_rate": 4.511416851321684e-06, + "loss": 1.0744, + "step": 7513 + }, + { + "epoch": 0.23, + "learning_rate": 4.5112719868418255e-06, + "loss": 1.1403, + "step": 7514 + }, + { + "epoch": 0.23, + "learning_rate": 4.511127103215626e-06, + "loss": 1.1344, + "step": 7515 + }, + { + "epoch": 0.23, + "learning_rate": 4.510982200444466e-06, + "loss": 1.0173, + "step": 7516 + }, + { + "epoch": 0.23, + "learning_rate": 4.5108372785297225e-06, + "loss": 1.2362, + "step": 7517 + }, + { + "epoch": 0.23, + "learning_rate": 4.510692337472778e-06, + "loss": 1.2161, + "step": 7518 + }, + { + "epoch": 0.23, + "learning_rate": 4.51054737727501e-06, + "loss": 1.077, + "step": 7519 + }, + { + "epoch": 0.23, + "learning_rate": 4.510402397937799e-06, + "loss": 1.2349, + "step": 7520 + }, + { + "epoch": 0.23, + "learning_rate": 4.510257399462526e-06, + "loss": 1.1344, + "step": 7521 + }, + { + "epoch": 0.23, + "learning_rate": 4.51011238185057e-06, + "loss": 1.1289, + "step": 7522 + }, + { + "epoch": 0.23, + "learning_rate": 4.509967345103313e-06, + "loss": 1.127, + "step": 7523 + }, + { + "epoch": 0.23, + "learning_rate": 4.509822289222135e-06, + "loss": 1.1956, + "step": 7524 + }, + { + "epoch": 0.23, + "learning_rate": 4.509677214208417e-06, + "loss": 1.1406, + "step": 7525 + }, + { + "epoch": 0.23, + "learning_rate": 4.509532120063539e-06, + "loss": 1.1014, + "step": 7526 + }, + { + "epoch": 0.23, + "learning_rate": 4.5093870067888825e-06, + "loss": 1.1449, + "step": 7527 + }, + { + "epoch": 0.23, + "learning_rate": 4.50924187438583e-06, + "loss": 0.9839, + "step": 7528 + }, + { + "epoch": 0.23, + "learning_rate": 4.509096722855764e-06, + "loss": 1.0293, + "step": 7529 + }, + { + "epoch": 0.23, + "learning_rate": 4.508951552200062e-06, + "loss": 1.2289, + "step": 7530 + }, + { + "epoch": 0.23, + "learning_rate": 4.508806362420111e-06, + "loss": 1.1104, + "step": 7531 + }, + { + "epoch": 0.23, + "learning_rate": 4.508661153517291e-06, + "loss": 1.0994, + "step": 7532 + }, + { + "epoch": 0.23, + "learning_rate": 4.5085159254929835e-06, + "loss": 1.2477, + "step": 7533 + }, + { + "epoch": 0.23, + "learning_rate": 4.5083706783485715e-06, + "loss": 1.1208, + "step": 7534 + }, + { + "epoch": 0.23, + "learning_rate": 4.508225412085438e-06, + "loss": 1.1889, + "step": 7535 + }, + { + "epoch": 0.23, + "learning_rate": 4.508080126704965e-06, + "loss": 1.259, + "step": 7536 + }, + { + "epoch": 0.23, + "learning_rate": 4.507934822208539e-06, + "loss": 1.1096, + "step": 7537 + }, + { + "epoch": 0.23, + "learning_rate": 4.507789498597538e-06, + "loss": 1.1837, + "step": 7538 + }, + { + "epoch": 0.23, + "learning_rate": 4.507644155873349e-06, + "loss": 1.1307, + "step": 7539 + }, + { + "epoch": 0.23, + "learning_rate": 4.507498794037353e-06, + "loss": 1.0648, + "step": 7540 + }, + { + "epoch": 0.23, + "learning_rate": 4.507353413090937e-06, + "loss": 1.1338, + "step": 7541 + }, + { + "epoch": 0.23, + "learning_rate": 4.507208013035483e-06, + "loss": 1.0932, + "step": 7542 + }, + { + "epoch": 0.23, + "learning_rate": 4.507062593872376e-06, + "loss": 1.135, + "step": 7543 + }, + { + "epoch": 0.23, + "learning_rate": 4.506917155602999e-06, + "loss": 1.226, + "step": 7544 + }, + { + "epoch": 0.23, + "learning_rate": 4.506771698228737e-06, + "loss": 1.2314, + "step": 7545 + }, + { + "epoch": 0.23, + "learning_rate": 4.506626221750975e-06, + "loss": 1.0586, + "step": 7546 + }, + { + "epoch": 0.23, + "learning_rate": 4.506480726171099e-06, + "loss": 1.1614, + "step": 7547 + }, + { + "epoch": 0.23, + "learning_rate": 4.506335211490491e-06, + "loss": 1.2179, + "step": 7548 + }, + { + "epoch": 0.23, + "learning_rate": 4.506189677710539e-06, + "loss": 1.2875, + "step": 7549 + }, + { + "epoch": 0.23, + "learning_rate": 4.506044124832627e-06, + "loss": 1.2845, + "step": 7550 + }, + { + "epoch": 0.23, + "learning_rate": 4.505898552858142e-06, + "loss": 1.1656, + "step": 7551 + }, + { + "epoch": 0.23, + "learning_rate": 4.505752961788468e-06, + "loss": 1.0878, + "step": 7552 + }, + { + "epoch": 0.23, + "learning_rate": 4.505607351624992e-06, + "loss": 1.2305, + "step": 7553 + }, + { + "epoch": 0.23, + "learning_rate": 4.505461722369101e-06, + "loss": 1.1385, + "step": 7554 + }, + { + "epoch": 0.23, + "learning_rate": 4.505316074022179e-06, + "loss": 1.1249, + "step": 7555 + }, + { + "epoch": 0.23, + "learning_rate": 4.505170406585614e-06, + "loss": 1.2129, + "step": 7556 + }, + { + "epoch": 0.23, + "learning_rate": 4.505024720060792e-06, + "loss": 1.1407, + "step": 7557 + }, + { + "epoch": 0.23, + "learning_rate": 4.504879014449102e-06, + "loss": 1.1073, + "step": 7558 + }, + { + "epoch": 0.23, + "learning_rate": 4.504733289751928e-06, + "loss": 1.0892, + "step": 7559 + }, + { + "epoch": 0.23, + "learning_rate": 4.504587545970658e-06, + "loss": 1.074, + "step": 7560 + }, + { + "epoch": 0.23, + "learning_rate": 4.504441783106681e-06, + "loss": 1.1899, + "step": 7561 + }, + { + "epoch": 0.23, + "learning_rate": 4.504296001161384e-06, + "loss": 1.2155, + "step": 7562 + }, + { + "epoch": 0.23, + "learning_rate": 4.5041502001361535e-06, + "loss": 1.1144, + "step": 7563 + }, + { + "epoch": 0.23, + "learning_rate": 4.5040043800323785e-06, + "loss": 1.1743, + "step": 7564 + }, + { + "epoch": 0.23, + "learning_rate": 4.503858540851447e-06, + "loss": 1.0877, + "step": 7565 + }, + { + "epoch": 0.23, + "learning_rate": 4.503712682594747e-06, + "loss": 1.2094, + "step": 7566 + }, + { + "epoch": 0.23, + "learning_rate": 4.503566805263668e-06, + "loss": 1.1913, + "step": 7567 + }, + { + "epoch": 0.23, + "learning_rate": 4.503420908859598e-06, + "loss": 1.092, + "step": 7568 + }, + { + "epoch": 0.23, + "learning_rate": 4.503274993383926e-06, + "loss": 1.2463, + "step": 7569 + }, + { + "epoch": 0.23, + "learning_rate": 4.50312905883804e-06, + "loss": 1.1041, + "step": 7570 + }, + { + "epoch": 0.23, + "learning_rate": 4.50298310522333e-06, + "loss": 1.092, + "step": 7571 + }, + { + "epoch": 0.23, + "learning_rate": 4.502837132541186e-06, + "loss": 1.2367, + "step": 7572 + }, + { + "epoch": 0.23, + "learning_rate": 4.502691140792997e-06, + "loss": 1.0789, + "step": 7573 + }, + { + "epoch": 0.23, + "learning_rate": 4.502545129980154e-06, + "loss": 1.1595, + "step": 7574 + }, + { + "epoch": 0.23, + "learning_rate": 4.5023991001040444e-06, + "loss": 0.9984, + "step": 7575 + }, + { + "epoch": 0.23, + "learning_rate": 4.50225305116606e-06, + "loss": 1.1343, + "step": 7576 + }, + { + "epoch": 0.23, + "learning_rate": 4.5021069831675915e-06, + "loss": 1.0511, + "step": 7577 + }, + { + "epoch": 0.23, + "learning_rate": 4.501960896110028e-06, + "loss": 1.1247, + "step": 7578 + }, + { + "epoch": 0.23, + "learning_rate": 4.501814789994761e-06, + "loss": 1.2029, + "step": 7579 + }, + { + "epoch": 0.23, + "learning_rate": 4.501668664823181e-06, + "loss": 1.1127, + "step": 7580 + }, + { + "epoch": 0.23, + "learning_rate": 4.50152252059668e-06, + "loss": 1.2445, + "step": 7581 + }, + { + "epoch": 0.23, + "learning_rate": 4.501376357316648e-06, + "loss": 1.1049, + "step": 7582 + }, + { + "epoch": 0.23, + "learning_rate": 4.501230174984478e-06, + "loss": 1.1365, + "step": 7583 + }, + { + "epoch": 0.23, + "learning_rate": 4.50108397360156e-06, + "loss": 1.1243, + "step": 7584 + }, + { + "epoch": 0.23, + "learning_rate": 4.500937753169286e-06, + "loss": 1.0838, + "step": 7585 + }, + { + "epoch": 0.23, + "learning_rate": 4.500791513689049e-06, + "loss": 1.0632, + "step": 7586 + }, + { + "epoch": 0.23, + "learning_rate": 4.500645255162239e-06, + "loss": 1.2172, + "step": 7587 + }, + { + "epoch": 0.23, + "learning_rate": 4.500498977590251e-06, + "loss": 1.0923, + "step": 7588 + }, + { + "epoch": 0.23, + "learning_rate": 4.500352680974475e-06, + "loss": 1.1256, + "step": 7589 + }, + { + "epoch": 0.23, + "learning_rate": 4.500206365316307e-06, + "loss": 1.0748, + "step": 7590 + }, + { + "epoch": 0.23, + "learning_rate": 4.500060030617136e-06, + "loss": 1.179, + "step": 7591 + }, + { + "epoch": 0.23, + "learning_rate": 4.499913676878358e-06, + "loss": 1.2172, + "step": 7592 + }, + { + "epoch": 0.23, + "learning_rate": 4.499767304101363e-06, + "loss": 1.2309, + "step": 7593 + }, + { + "epoch": 0.23, + "learning_rate": 4.499620912287549e-06, + "loss": 1.1612, + "step": 7594 + }, + { + "epoch": 0.23, + "learning_rate": 4.499474501438304e-06, + "loss": 1.1039, + "step": 7595 + }, + { + "epoch": 0.23, + "learning_rate": 4.499328071555027e-06, + "loss": 1.0854, + "step": 7596 + }, + { + "epoch": 0.23, + "learning_rate": 4.49918162263911e-06, + "loss": 1.1875, + "step": 7597 + }, + { + "epoch": 0.23, + "learning_rate": 4.499035154691945e-06, + "loss": 1.1433, + "step": 7598 + }, + { + "epoch": 0.23, + "learning_rate": 4.498888667714929e-06, + "loss": 1.2506, + "step": 7599 + }, + { + "epoch": 0.23, + "learning_rate": 4.498742161709455e-06, + "loss": 1.1154, + "step": 7600 + }, + { + "epoch": 0.23, + "learning_rate": 4.498595636676919e-06, + "loss": 1.004, + "step": 7601 + }, + { + "epoch": 0.23, + "learning_rate": 4.498449092618715e-06, + "loss": 1.1558, + "step": 7602 + }, + { + "epoch": 0.23, + "learning_rate": 4.498302529536238e-06, + "loss": 1.3079, + "step": 7603 + }, + { + "epoch": 0.23, + "learning_rate": 4.498155947430883e-06, + "loss": 1.2006, + "step": 7604 + }, + { + "epoch": 0.23, + "learning_rate": 4.4980093463040465e-06, + "loss": 1.2129, + "step": 7605 + }, + { + "epoch": 0.23, + "learning_rate": 4.497862726157122e-06, + "loss": 1.2667, + "step": 7606 + }, + { + "epoch": 0.23, + "learning_rate": 4.497716086991507e-06, + "loss": 1.1927, + "step": 7607 + }, + { + "epoch": 0.23, + "learning_rate": 4.497569428808598e-06, + "loss": 1.1018, + "step": 7608 + }, + { + "epoch": 0.23, + "learning_rate": 4.497422751609789e-06, + "loss": 1.11, + "step": 7609 + }, + { + "epoch": 0.23, + "learning_rate": 4.497276055396478e-06, + "loss": 1.066, + "step": 7610 + }, + { + "epoch": 0.23, + "learning_rate": 4.497129340170061e-06, + "loss": 1.2371, + "step": 7611 + }, + { + "epoch": 0.23, + "learning_rate": 4.496982605931934e-06, + "loss": 1.1635, + "step": 7612 + }, + { + "epoch": 0.23, + "learning_rate": 4.4968358526834945e-06, + "loss": 1.1011, + "step": 7613 + }, + { + "epoch": 0.23, + "learning_rate": 4.49668908042614e-06, + "loss": 1.1661, + "step": 7614 + }, + { + "epoch": 0.23, + "learning_rate": 4.496542289161266e-06, + "loss": 1.1351, + "step": 7615 + }, + { + "epoch": 0.23, + "learning_rate": 4.496395478890272e-06, + "loss": 1.1829, + "step": 7616 + }, + { + "epoch": 0.23, + "learning_rate": 4.496248649614554e-06, + "loss": 1.1938, + "step": 7617 + }, + { + "epoch": 0.23, + "learning_rate": 4.496101801335511e-06, + "loss": 1.1751, + "step": 7618 + }, + { + "epoch": 0.23, + "learning_rate": 4.495954934054539e-06, + "loss": 1.1008, + "step": 7619 + }, + { + "epoch": 0.23, + "learning_rate": 4.495808047773037e-06, + "loss": 1.1742, + "step": 7620 + }, + { + "epoch": 0.23, + "learning_rate": 4.4956611424924055e-06, + "loss": 1.1066, + "step": 7621 + }, + { + "epoch": 0.23, + "learning_rate": 4.49551421821404e-06, + "loss": 1.0685, + "step": 7622 + }, + { + "epoch": 0.23, + "learning_rate": 4.49536727493934e-06, + "loss": 1.0532, + "step": 7623 + }, + { + "epoch": 0.23, + "learning_rate": 4.495220312669705e-06, + "loss": 1.1357, + "step": 7624 + }, + { + "epoch": 0.23, + "learning_rate": 4.495073331406533e-06, + "loss": 1.0566, + "step": 7625 + }, + { + "epoch": 0.23, + "learning_rate": 4.494926331151224e-06, + "loss": 1.1667, + "step": 7626 + }, + { + "epoch": 0.23, + "learning_rate": 4.494779311905177e-06, + "loss": 1.063, + "step": 7627 + }, + { + "epoch": 0.23, + "learning_rate": 4.494632273669792e-06, + "loss": 1.2125, + "step": 7628 + }, + { + "epoch": 0.23, + "learning_rate": 4.494485216446469e-06, + "loss": 1.1958, + "step": 7629 + }, + { + "epoch": 0.23, + "learning_rate": 4.494338140236606e-06, + "loss": 1.0435, + "step": 7630 + }, + { + "epoch": 0.23, + "learning_rate": 4.494191045041605e-06, + "loss": 1.2988, + "step": 7631 + }, + { + "epoch": 0.23, + "learning_rate": 4.494043930862866e-06, + "loss": 1.2621, + "step": 7632 + }, + { + "epoch": 0.23, + "learning_rate": 4.493896797701789e-06, + "loss": 1.1115, + "step": 7633 + }, + { + "epoch": 0.23, + "learning_rate": 4.493749645559775e-06, + "loss": 1.1064, + "step": 7634 + }, + { + "epoch": 0.23, + "learning_rate": 4.4936024744382234e-06, + "loss": 1.1852, + "step": 7635 + }, + { + "epoch": 0.23, + "learning_rate": 4.493455284338537e-06, + "loss": 1.1333, + "step": 7636 + }, + { + "epoch": 0.23, + "learning_rate": 4.493308075262117e-06, + "loss": 1.1586, + "step": 7637 + }, + { + "epoch": 0.23, + "learning_rate": 4.493160847210364e-06, + "loss": 1.2754, + "step": 7638 + }, + { + "epoch": 0.23, + "learning_rate": 4.493013600184679e-06, + "loss": 1.2039, + "step": 7639 + }, + { + "epoch": 0.23, + "learning_rate": 4.492866334186466e-06, + "loss": 1.1598, + "step": 7640 + }, + { + "epoch": 0.23, + "learning_rate": 4.4927190492171235e-06, + "loss": 1.2209, + "step": 7641 + }, + { + "epoch": 0.23, + "learning_rate": 4.492571745278056e-06, + "loss": 1.1885, + "step": 7642 + }, + { + "epoch": 0.23, + "learning_rate": 4.492424422370664e-06, + "loss": 1.1296, + "step": 7643 + }, + { + "epoch": 0.23, + "learning_rate": 4.492277080496354e-06, + "loss": 1.2007, + "step": 7644 + }, + { + "epoch": 0.23, + "learning_rate": 4.492129719656523e-06, + "loss": 1.1274, + "step": 7645 + }, + { + "epoch": 0.23, + "learning_rate": 4.4919823398525776e-06, + "loss": 1.0345, + "step": 7646 + }, + { + "epoch": 0.23, + "learning_rate": 4.49183494108592e-06, + "loss": 1.1865, + "step": 7647 + }, + { + "epoch": 0.23, + "learning_rate": 4.491687523357951e-06, + "loss": 1.1556, + "step": 7648 + }, + { + "epoch": 0.23, + "learning_rate": 4.4915400866700785e-06, + "loss": 1.1703, + "step": 7649 + }, + { + "epoch": 0.23, + "learning_rate": 4.4913926310237025e-06, + "loss": 1.1189, + "step": 7650 + }, + { + "epoch": 0.23, + "learning_rate": 4.491245156420228e-06, + "loss": 1.1443, + "step": 7651 + }, + { + "epoch": 0.23, + "learning_rate": 4.491097662861058e-06, + "loss": 1.0957, + "step": 7652 + }, + { + "epoch": 0.23, + "learning_rate": 4.490950150347598e-06, + "loss": 1.0614, + "step": 7653 + }, + { + "epoch": 0.23, + "learning_rate": 4.490802618881252e-06, + "loss": 1.2953, + "step": 7654 + }, + { + "epoch": 0.23, + "learning_rate": 4.490655068463422e-06, + "loss": 1.2507, + "step": 7655 + }, + { + "epoch": 0.23, + "learning_rate": 4.4905074990955155e-06, + "loss": 1.2889, + "step": 7656 + }, + { + "epoch": 0.23, + "learning_rate": 4.4903599107789364e-06, + "loss": 1.1832, + "step": 7657 + }, + { + "epoch": 0.23, + "learning_rate": 4.490212303515089e-06, + "loss": 1.1581, + "step": 7658 + }, + { + "epoch": 0.23, + "learning_rate": 4.49006467730538e-06, + "loss": 0.9861, + "step": 7659 + }, + { + "epoch": 0.23, + "learning_rate": 4.489917032151213e-06, + "loss": 1.1644, + "step": 7660 + }, + { + "epoch": 0.23, + "learning_rate": 4.489769368053995e-06, + "loss": 1.2355, + "step": 7661 + }, + { + "epoch": 0.23, + "learning_rate": 4.48962168501513e-06, + "loss": 1.1821, + "step": 7662 + }, + { + "epoch": 0.23, + "learning_rate": 4.4894739830360244e-06, + "loss": 1.1268, + "step": 7663 + }, + { + "epoch": 0.23, + "learning_rate": 4.489326262118086e-06, + "loss": 1.1492, + "step": 7664 + }, + { + "epoch": 0.23, + "learning_rate": 4.489178522262718e-06, + "loss": 1.1359, + "step": 7665 + }, + { + "epoch": 0.23, + "learning_rate": 4.48903076347133e-06, + "loss": 1.0892, + "step": 7666 + }, + { + "epoch": 0.23, + "learning_rate": 4.488882985745326e-06, + "loss": 1.304, + "step": 7667 + }, + { + "epoch": 0.23, + "learning_rate": 4.488735189086115e-06, + "loss": 1.0037, + "step": 7668 + }, + { + "epoch": 0.23, + "learning_rate": 4.488587373495102e-06, + "loss": 1.0919, + "step": 7669 + }, + { + "epoch": 0.23, + "learning_rate": 4.488439538973695e-06, + "loss": 1.1897, + "step": 7670 + }, + { + "epoch": 0.23, + "learning_rate": 4.488291685523301e-06, + "loss": 1.1619, + "step": 7671 + }, + { + "epoch": 0.23, + "learning_rate": 4.4881438131453295e-06, + "loss": 1.1868, + "step": 7672 + }, + { + "epoch": 0.23, + "learning_rate": 4.487995921841184e-06, + "loss": 1.2424, + "step": 7673 + }, + { + "epoch": 0.23, + "learning_rate": 4.4878480116122755e-06, + "loss": 1.0429, + "step": 7674 + }, + { + "epoch": 0.23, + "learning_rate": 4.487700082460013e-06, + "loss": 1.1519, + "step": 7675 + }, + { + "epoch": 0.23, + "learning_rate": 4.487552134385801e-06, + "loss": 1.1557, + "step": 7676 + }, + { + "epoch": 0.23, + "learning_rate": 4.4874041673910505e-06, + "loss": 1.0818, + "step": 7677 + }, + { + "epoch": 0.23, + "learning_rate": 4.48725618147717e-06, + "loss": 1.0229, + "step": 7678 + }, + { + "epoch": 0.23, + "learning_rate": 4.487108176645567e-06, + "loss": 1.1047, + "step": 7679 + }, + { + "epoch": 0.23, + "learning_rate": 4.4869601528976515e-06, + "loss": 1.0912, + "step": 7680 + }, + { + "epoch": 0.23, + "learning_rate": 4.486812110234832e-06, + "loss": 1.2998, + "step": 7681 + }, + { + "epoch": 0.23, + "learning_rate": 4.486664048658519e-06, + "loss": 1.1847, + "step": 7682 + }, + { + "epoch": 0.23, + "learning_rate": 4.4865159681701194e-06, + "loss": 1.1745, + "step": 7683 + }, + { + "epoch": 0.23, + "learning_rate": 4.486367868771046e-06, + "loss": 1.1428, + "step": 7684 + }, + { + "epoch": 0.23, + "learning_rate": 4.486219750462707e-06, + "loss": 1.1951, + "step": 7685 + }, + { + "epoch": 0.23, + "learning_rate": 4.486071613246512e-06, + "loss": 1.2278, + "step": 7686 + }, + { + "epoch": 0.23, + "learning_rate": 4.485923457123872e-06, + "loss": 1.3484, + "step": 7687 + }, + { + "epoch": 0.23, + "learning_rate": 4.485775282096198e-06, + "loss": 1.0493, + "step": 7688 + }, + { + "epoch": 0.23, + "learning_rate": 4.4856270881648986e-06, + "loss": 1.0899, + "step": 7689 + }, + { + "epoch": 0.23, + "learning_rate": 4.485478875331386e-06, + "loss": 1.2325, + "step": 7690 + }, + { + "epoch": 0.23, + "learning_rate": 4.485330643597071e-06, + "loss": 1.1107, + "step": 7691 + }, + { + "epoch": 0.23, + "learning_rate": 4.485182392963364e-06, + "loss": 1.1384, + "step": 7692 + }, + { + "epoch": 0.23, + "learning_rate": 4.485034123431677e-06, + "loss": 1.2216, + "step": 7693 + }, + { + "epoch": 0.23, + "learning_rate": 4.484885835003421e-06, + "loss": 1.0764, + "step": 7694 + }, + { + "epoch": 0.23, + "learning_rate": 4.484737527680007e-06, + "loss": 1.1384, + "step": 7695 + }, + { + "epoch": 0.23, + "learning_rate": 4.484589201462849e-06, + "loss": 1.1206, + "step": 7696 + }, + { + "epoch": 0.23, + "learning_rate": 4.484440856353357e-06, + "loss": 1.0457, + "step": 7697 + }, + { + "epoch": 0.23, + "learning_rate": 4.484292492352944e-06, + "loss": 1.1541, + "step": 7698 + }, + { + "epoch": 0.23, + "learning_rate": 4.484144109463022e-06, + "loss": 1.0773, + "step": 7699 + }, + { + "epoch": 0.23, + "learning_rate": 4.4839957076850036e-06, + "loss": 1.019, + "step": 7700 + }, + { + "epoch": 0.23, + "learning_rate": 4.483847287020302e-06, + "loss": 1.1041, + "step": 7701 + }, + { + "epoch": 0.23, + "learning_rate": 4.483698847470329e-06, + "loss": 1.0406, + "step": 7702 + }, + { + "epoch": 0.23, + "learning_rate": 4.483550389036499e-06, + "loss": 1.0851, + "step": 7703 + }, + { + "epoch": 0.23, + "learning_rate": 4.4834019117202245e-06, + "loss": 1.1461, + "step": 7704 + }, + { + "epoch": 0.23, + "learning_rate": 4.483253415522918e-06, + "loss": 1.218, + "step": 7705 + }, + { + "epoch": 0.23, + "learning_rate": 4.483104900445996e-06, + "loss": 1.2133, + "step": 7706 + }, + { + "epoch": 0.23, + "learning_rate": 4.48295636649087e-06, + "loss": 1.1444, + "step": 7707 + }, + { + "epoch": 0.23, + "learning_rate": 4.482807813658953e-06, + "loss": 1.1215, + "step": 7708 + }, + { + "epoch": 0.23, + "learning_rate": 4.482659241951661e-06, + "loss": 1.1954, + "step": 7709 + }, + { + "epoch": 0.23, + "learning_rate": 4.482510651370409e-06, + "loss": 1.1866, + "step": 7710 + }, + { + "epoch": 0.23, + "learning_rate": 4.482362041916609e-06, + "loss": 1.1661, + "step": 7711 + }, + { + "epoch": 0.23, + "learning_rate": 4.482213413591678e-06, + "loss": 1.0798, + "step": 7712 + }, + { + "epoch": 0.23, + "learning_rate": 4.48206476639703e-06, + "loss": 1.1662, + "step": 7713 + }, + { + "epoch": 0.23, + "learning_rate": 4.48191610033408e-06, + "loss": 1.1285, + "step": 7714 + }, + { + "epoch": 0.23, + "learning_rate": 4.481767415404242e-06, + "loss": 1.086, + "step": 7715 + }, + { + "epoch": 0.23, + "learning_rate": 4.481618711608935e-06, + "loss": 1.2285, + "step": 7716 + }, + { + "epoch": 0.23, + "learning_rate": 4.481469988949571e-06, + "loss": 1.1998, + "step": 7717 + }, + { + "epoch": 0.23, + "learning_rate": 4.4813212474275664e-06, + "loss": 1.3405, + "step": 7718 + }, + { + "epoch": 0.23, + "learning_rate": 4.481172487044338e-06, + "loss": 1.1151, + "step": 7719 + }, + { + "epoch": 0.23, + "learning_rate": 4.481023707801302e-06, + "loss": 1.1726, + "step": 7720 + }, + { + "epoch": 0.23, + "learning_rate": 4.480874909699875e-06, + "loss": 1.0681, + "step": 7721 + }, + { + "epoch": 0.23, + "learning_rate": 4.480726092741472e-06, + "loss": 1.1516, + "step": 7722 + }, + { + "epoch": 0.23, + "learning_rate": 4.480577256927511e-06, + "loss": 1.1371, + "step": 7723 + }, + { + "epoch": 0.23, + "learning_rate": 4.480428402259408e-06, + "loss": 1.1968, + "step": 7724 + }, + { + "epoch": 0.23, + "learning_rate": 4.480279528738581e-06, + "loss": 1.0883, + "step": 7725 + }, + { + "epoch": 0.23, + "learning_rate": 4.480130636366446e-06, + "loss": 1.2194, + "step": 7726 + }, + { + "epoch": 0.23, + "learning_rate": 4.479981725144421e-06, + "loss": 1.074, + "step": 7727 + }, + { + "epoch": 0.23, + "learning_rate": 4.479832795073924e-06, + "loss": 1.117, + "step": 7728 + }, + { + "epoch": 0.23, + "learning_rate": 4.479683846156372e-06, + "loss": 1.1028, + "step": 7729 + }, + { + "epoch": 0.23, + "learning_rate": 4.479534878393184e-06, + "loss": 1.1432, + "step": 7730 + }, + { + "epoch": 0.23, + "learning_rate": 4.479385891785777e-06, + "loss": 1.1314, + "step": 7731 + }, + { + "epoch": 0.23, + "learning_rate": 4.479236886335569e-06, + "loss": 1.0537, + "step": 7732 + }, + { + "epoch": 0.23, + "learning_rate": 4.479087862043979e-06, + "loss": 1.0533, + "step": 7733 + }, + { + "epoch": 0.23, + "learning_rate": 4.478938818912427e-06, + "loss": 1.1381, + "step": 7734 + }, + { + "epoch": 0.23, + "learning_rate": 4.478789756942329e-06, + "loss": 1.1274, + "step": 7735 + }, + { + "epoch": 0.23, + "learning_rate": 4.478640676135106e-06, + "loss": 1.1525, + "step": 7736 + }, + { + "epoch": 0.23, + "learning_rate": 4.478491576492177e-06, + "loss": 1.2164, + "step": 7737 + }, + { + "epoch": 0.23, + "learning_rate": 4.478342458014962e-06, + "loss": 1.1143, + "step": 7738 + }, + { + "epoch": 0.23, + "learning_rate": 4.478193320704878e-06, + "loss": 1.1881, + "step": 7739 + }, + { + "epoch": 0.23, + "learning_rate": 4.478044164563347e-06, + "loss": 1.1654, + "step": 7740 + }, + { + "epoch": 0.23, + "learning_rate": 4.4778949895917875e-06, + "loss": 1.0677, + "step": 7741 + }, + { + "epoch": 0.23, + "learning_rate": 4.4777457957916215e-06, + "loss": 1.1476, + "step": 7742 + }, + { + "epoch": 0.23, + "learning_rate": 4.477596583164268e-06, + "loss": 1.1245, + "step": 7743 + }, + { + "epoch": 0.23, + "learning_rate": 4.477447351711146e-06, + "loss": 1.1528, + "step": 7744 + }, + { + "epoch": 0.23, + "learning_rate": 4.4772981014336784e-06, + "loss": 1.1111, + "step": 7745 + }, + { + "epoch": 0.23, + "learning_rate": 4.4771488323332854e-06, + "loss": 1.1216, + "step": 7746 + }, + { + "epoch": 0.23, + "learning_rate": 4.4769995444113875e-06, + "loss": 1.1108, + "step": 7747 + }, + { + "epoch": 0.23, + "learning_rate": 4.476850237669407e-06, + "loss": 1.1512, + "step": 7748 + }, + { + "epoch": 0.23, + "learning_rate": 4.476700912108763e-06, + "loss": 1.2354, + "step": 7749 + }, + { + "epoch": 0.23, + "learning_rate": 4.476551567730879e-06, + "loss": 1.1235, + "step": 7750 + }, + { + "epoch": 0.23, + "learning_rate": 4.4764022045371756e-06, + "loss": 1.2336, + "step": 7751 + }, + { + "epoch": 0.23, + "learning_rate": 4.476252822529075e-06, + "loss": 1.0983, + "step": 7752 + }, + { + "epoch": 0.23, + "learning_rate": 4.476103421708e-06, + "loss": 1.1635, + "step": 7753 + }, + { + "epoch": 0.23, + "learning_rate": 4.475954002075372e-06, + "loss": 1.0657, + "step": 7754 + }, + { + "epoch": 0.23, + "learning_rate": 4.4758045636326135e-06, + "loss": 1.1829, + "step": 7755 + }, + { + "epoch": 0.23, + "learning_rate": 4.475655106381147e-06, + "loss": 1.2686, + "step": 7756 + }, + { + "epoch": 0.23, + "learning_rate": 4.475505630322395e-06, + "loss": 1.1935, + "step": 7757 + }, + { + "epoch": 0.23, + "learning_rate": 4.475356135457781e-06, + "loss": 1.1135, + "step": 7758 + }, + { + "epoch": 0.23, + "learning_rate": 4.475206621788729e-06, + "loss": 1.0898, + "step": 7759 + }, + { + "epoch": 0.23, + "learning_rate": 4.47505708931666e-06, + "loss": 1.2333, + "step": 7760 + }, + { + "epoch": 0.23, + "learning_rate": 4.474907538043e-06, + "loss": 1.2089, + "step": 7761 + }, + { + "epoch": 0.23, + "learning_rate": 4.47475796796917e-06, + "loss": 1.1323, + "step": 7762 + }, + { + "epoch": 0.23, + "learning_rate": 4.474608379096595e-06, + "loss": 1.2224, + "step": 7763 + }, + { + "epoch": 0.23, + "learning_rate": 4.474458771426701e-06, + "loss": 1.1641, + "step": 7764 + }, + { + "epoch": 0.23, + "learning_rate": 4.4743091449609096e-06, + "loss": 1.1028, + "step": 7765 + }, + { + "epoch": 0.23, + "learning_rate": 4.474159499700645e-06, + "loss": 1.1174, + "step": 7766 + }, + { + "epoch": 0.23, + "learning_rate": 4.474009835647334e-06, + "loss": 1.0869, + "step": 7767 + }, + { + "epoch": 0.23, + "learning_rate": 4.473860152802399e-06, + "loss": 1.1453, + "step": 7768 + }, + { + "epoch": 0.23, + "learning_rate": 4.473710451167268e-06, + "loss": 1.1068, + "step": 7769 + }, + { + "epoch": 0.23, + "learning_rate": 4.473560730743362e-06, + "loss": 1.1529, + "step": 7770 + }, + { + "epoch": 0.23, + "learning_rate": 4.473410991532109e-06, + "loss": 1.1741, + "step": 7771 + }, + { + "epoch": 0.23, + "learning_rate": 4.473261233534935e-06, + "loss": 1.0616, + "step": 7772 + }, + { + "epoch": 0.23, + "learning_rate": 4.473111456753263e-06, + "loss": 1.161, + "step": 7773 + }, + { + "epoch": 0.23, + "learning_rate": 4.47296166118852e-06, + "loss": 1.2427, + "step": 7774 + }, + { + "epoch": 0.23, + "learning_rate": 4.472811846842133e-06, + "loss": 1.0717, + "step": 7775 + }, + { + "epoch": 0.23, + "learning_rate": 4.4726620137155266e-06, + "loss": 1.128, + "step": 7776 + }, + { + "epoch": 0.23, + "learning_rate": 4.472512161810129e-06, + "loss": 1.1126, + "step": 7777 + }, + { + "epoch": 0.23, + "learning_rate": 4.472362291127364e-06, + "loss": 1.1876, + "step": 7778 + }, + { + "epoch": 0.23, + "learning_rate": 4.472212401668661e-06, + "loss": 1.2441, + "step": 7779 + }, + { + "epoch": 0.23, + "learning_rate": 4.472062493435446e-06, + "loss": 1.1829, + "step": 7780 + }, + { + "epoch": 0.23, + "learning_rate": 4.471912566429145e-06, + "loss": 1.0539, + "step": 7781 + }, + { + "epoch": 0.23, + "learning_rate": 4.4717626206511875e-06, + "loss": 1.162, + "step": 7782 + }, + { + "epoch": 0.23, + "learning_rate": 4.471612656102998e-06, + "loss": 1.1593, + "step": 7783 + }, + { + "epoch": 0.23, + "learning_rate": 4.471462672786006e-06, + "loss": 1.1659, + "step": 7784 + }, + { + "epoch": 0.23, + "learning_rate": 4.47131267070164e-06, + "loss": 1.2582, + "step": 7785 + }, + { + "epoch": 0.23, + "learning_rate": 4.471162649851325e-06, + "loss": 1.1015, + "step": 7786 + }, + { + "epoch": 0.23, + "learning_rate": 4.4710126102364914e-06, + "loss": 1.1376, + "step": 7787 + }, + { + "epoch": 0.23, + "learning_rate": 4.470862551858568e-06, + "loss": 1.2151, + "step": 7788 + }, + { + "epoch": 0.23, + "learning_rate": 4.4707124747189814e-06, + "loss": 1.105, + "step": 7789 + }, + { + "epoch": 0.23, + "learning_rate": 4.470562378819161e-06, + "loss": 1.0871, + "step": 7790 + }, + { + "epoch": 0.23, + "learning_rate": 4.4704122641605365e-06, + "loss": 1.0297, + "step": 7791 + }, + { + "epoch": 0.23, + "learning_rate": 4.470262130744536e-06, + "loss": 1.2576, + "step": 7792 + }, + { + "epoch": 0.23, + "learning_rate": 4.470111978572589e-06, + "loss": 1.348, + "step": 7793 + }, + { + "epoch": 0.23, + "learning_rate": 4.469961807646124e-06, + "loss": 1.1223, + "step": 7794 + }, + { + "epoch": 0.23, + "learning_rate": 4.469811617966572e-06, + "loss": 1.1783, + "step": 7795 + }, + { + "epoch": 0.23, + "learning_rate": 4.469661409535363e-06, + "loss": 1.1005, + "step": 7796 + }, + { + "epoch": 0.23, + "learning_rate": 4.4695111823539245e-06, + "loss": 1.1102, + "step": 7797 + }, + { + "epoch": 0.23, + "learning_rate": 4.469360936423689e-06, + "loss": 1.0655, + "step": 7798 + }, + { + "epoch": 0.23, + "learning_rate": 4.469210671746085e-06, + "loss": 1.1772, + "step": 7799 + }, + { + "epoch": 0.23, + "learning_rate": 4.469060388322545e-06, + "loss": 1.0846, + "step": 7800 + }, + { + "epoch": 0.24, + "learning_rate": 4.468910086154498e-06, + "loss": 1.1459, + "step": 7801 + }, + { + "epoch": 0.24, + "learning_rate": 4.4687597652433745e-06, + "loss": 1.0778, + "step": 7802 + }, + { + "epoch": 0.24, + "learning_rate": 4.468609425590607e-06, + "loss": 1.0925, + "step": 7803 + }, + { + "epoch": 0.24, + "learning_rate": 4.468459067197626e-06, + "loss": 1.251, + "step": 7804 + }, + { + "epoch": 0.24, + "learning_rate": 4.468308690065862e-06, + "loss": 1.2383, + "step": 7805 + }, + { + "epoch": 0.24, + "learning_rate": 4.4681582941967475e-06, + "loss": 1.2142, + "step": 7806 + }, + { + "epoch": 0.24, + "learning_rate": 4.468007879591714e-06, + "loss": 1.1631, + "step": 7807 + }, + { + "epoch": 0.24, + "learning_rate": 4.467857446252193e-06, + "loss": 1.0679, + "step": 7808 + }, + { + "epoch": 0.24, + "learning_rate": 4.467706994179618e-06, + "loss": 1.2328, + "step": 7809 + }, + { + "epoch": 0.24, + "learning_rate": 4.4675565233754196e-06, + "loss": 1.1619, + "step": 7810 + }, + { + "epoch": 0.24, + "learning_rate": 4.46740603384103e-06, + "loss": 1.1832, + "step": 7811 + }, + { + "epoch": 0.24, + "learning_rate": 4.467255525577883e-06, + "loss": 1.1911, + "step": 7812 + }, + { + "epoch": 0.24, + "learning_rate": 4.46710499858741e-06, + "loss": 1.1101, + "step": 7813 + }, + { + "epoch": 0.24, + "learning_rate": 4.4669544528710465e-06, + "loss": 1.1216, + "step": 7814 + }, + { + "epoch": 0.24, + "learning_rate": 4.466803888430223e-06, + "loss": 1.2412, + "step": 7815 + }, + { + "epoch": 0.24, + "learning_rate": 4.4666533052663735e-06, + "loss": 1.2148, + "step": 7816 + }, + { + "epoch": 0.24, + "learning_rate": 4.4665027033809316e-06, + "loss": 1.1531, + "step": 7817 + }, + { + "epoch": 0.24, + "learning_rate": 4.466352082775331e-06, + "loss": 1.1412, + "step": 7818 + }, + { + "epoch": 0.24, + "learning_rate": 4.466201443451007e-06, + "loss": 1.1299, + "step": 7819 + }, + { + "epoch": 0.24, + "learning_rate": 4.466050785409391e-06, + "loss": 1.2225, + "step": 7820 + }, + { + "epoch": 0.24, + "learning_rate": 4.465900108651918e-06, + "loss": 1.004, + "step": 7821 + }, + { + "epoch": 0.24, + "learning_rate": 4.465749413180024e-06, + "loss": 1.167, + "step": 7822 + }, + { + "epoch": 0.24, + "learning_rate": 4.465598698995142e-06, + "loss": 1.2143, + "step": 7823 + }, + { + "epoch": 0.24, + "learning_rate": 4.465447966098707e-06, + "loss": 1.3397, + "step": 7824 + }, + { + "epoch": 0.24, + "learning_rate": 4.465297214492153e-06, + "loss": 1.2832, + "step": 7825 + }, + { + "epoch": 0.24, + "learning_rate": 4.4651464441769165e-06, + "loss": 1.104, + "step": 7826 + }, + { + "epoch": 0.24, + "learning_rate": 4.464995655154432e-06, + "loss": 1.0665, + "step": 7827 + }, + { + "epoch": 0.24, + "learning_rate": 4.464844847426137e-06, + "loss": 1.1715, + "step": 7828 + }, + { + "epoch": 0.24, + "learning_rate": 4.464694020993464e-06, + "loss": 1.0663, + "step": 7829 + }, + { + "epoch": 0.24, + "learning_rate": 4.46454317585785e-06, + "loss": 1.1796, + "step": 7830 + }, + { + "epoch": 0.24, + "learning_rate": 4.464392312020732e-06, + "loss": 1.1915, + "step": 7831 + }, + { + "epoch": 0.24, + "learning_rate": 4.464241429483545e-06, + "loss": 1.1491, + "step": 7832 + }, + { + "epoch": 0.24, + "learning_rate": 4.464090528247725e-06, + "loss": 1.1212, + "step": 7833 + }, + { + "epoch": 0.24, + "learning_rate": 4.463939608314709e-06, + "loss": 1.1282, + "step": 7834 + }, + { + "epoch": 0.24, + "learning_rate": 4.463788669685935e-06, + "loss": 1.1758, + "step": 7835 + }, + { + "epoch": 0.24, + "learning_rate": 4.463637712362837e-06, + "loss": 1.3246, + "step": 7836 + }, + { + "epoch": 0.24, + "learning_rate": 4.463486736346855e-06, + "loss": 1.1311, + "step": 7837 + }, + { + "epoch": 0.24, + "learning_rate": 4.463335741639424e-06, + "loss": 1.0565, + "step": 7838 + }, + { + "epoch": 0.24, + "learning_rate": 4.4631847282419825e-06, + "loss": 1.1441, + "step": 7839 + }, + { + "epoch": 0.24, + "learning_rate": 4.463033696155968e-06, + "loss": 1.1592, + "step": 7840 + }, + { + "epoch": 0.24, + "learning_rate": 4.462882645382819e-06, + "loss": 1.0747, + "step": 7841 + }, + { + "epoch": 0.24, + "learning_rate": 4.462731575923972e-06, + "loss": 1.2037, + "step": 7842 + }, + { + "epoch": 0.24, + "learning_rate": 4.462580487780866e-06, + "loss": 1.1852, + "step": 7843 + }, + { + "epoch": 0.24, + "learning_rate": 4.462429380954938e-06, + "loss": 1.1826, + "step": 7844 + }, + { + "epoch": 0.24, + "learning_rate": 4.462278255447628e-06, + "loss": 1.2198, + "step": 7845 + }, + { + "epoch": 0.24, + "learning_rate": 4.462127111260374e-06, + "loss": 1.1205, + "step": 7846 + }, + { + "epoch": 0.24, + "learning_rate": 4.461975948394615e-06, + "loss": 1.1631, + "step": 7847 + }, + { + "epoch": 0.24, + "learning_rate": 4.46182476685179e-06, + "loss": 1.2183, + "step": 7848 + }, + { + "epoch": 0.24, + "learning_rate": 4.4616735666333376e-06, + "loss": 1.2119, + "step": 7849 + }, + { + "epoch": 0.24, + "learning_rate": 4.461522347740698e-06, + "loss": 1.2028, + "step": 7850 + }, + { + "epoch": 0.24, + "learning_rate": 4.461371110175311e-06, + "loss": 1.2388, + "step": 7851 + }, + { + "epoch": 0.24, + "learning_rate": 4.461219853938615e-06, + "loss": 1.2614, + "step": 7852 + }, + { + "epoch": 0.24, + "learning_rate": 4.461068579032049e-06, + "loss": 1.235, + "step": 7853 + }, + { + "epoch": 0.24, + "learning_rate": 4.460917285457057e-06, + "loss": 1.1889, + "step": 7854 + }, + { + "epoch": 0.24, + "learning_rate": 4.460765973215076e-06, + "loss": 1.2608, + "step": 7855 + }, + { + "epoch": 0.24, + "learning_rate": 4.460614642307547e-06, + "loss": 1.183, + "step": 7856 + }, + { + "epoch": 0.24, + "learning_rate": 4.460463292735912e-06, + "loss": 1.1989, + "step": 7857 + }, + { + "epoch": 0.24, + "learning_rate": 4.4603119245016095e-06, + "loss": 1.0407, + "step": 7858 + }, + { + "epoch": 0.24, + "learning_rate": 4.460160537606081e-06, + "loss": 1.0699, + "step": 7859 + }, + { + "epoch": 0.24, + "learning_rate": 4.46000913205077e-06, + "loss": 1.2549, + "step": 7860 + }, + { + "epoch": 0.24, + "learning_rate": 4.4598577078371145e-06, + "loss": 1.1674, + "step": 7861 + }, + { + "epoch": 0.24, + "learning_rate": 4.459706264966558e-06, + "loss": 1.0673, + "step": 7862 + }, + { + "epoch": 0.24, + "learning_rate": 4.459554803440542e-06, + "loss": 1.0482, + "step": 7863 + }, + { + "epoch": 0.24, + "learning_rate": 4.459403323260508e-06, + "loss": 1.1592, + "step": 7864 + }, + { + "epoch": 0.24, + "learning_rate": 4.4592518244278986e-06, + "loss": 1.1667, + "step": 7865 + }, + { + "epoch": 0.24, + "learning_rate": 4.459100306944154e-06, + "loss": 1.0671, + "step": 7866 + }, + { + "epoch": 0.24, + "learning_rate": 4.458948770810718e-06, + "loss": 1.1504, + "step": 7867 + }, + { + "epoch": 0.24, + "learning_rate": 4.458797216029034e-06, + "loss": 1.2781, + "step": 7868 + }, + { + "epoch": 0.24, + "learning_rate": 4.458645642600544e-06, + "loss": 1.1608, + "step": 7869 + }, + { + "epoch": 0.24, + "learning_rate": 4.45849405052669e-06, + "loss": 1.1036, + "step": 7870 + }, + { + "epoch": 0.24, + "learning_rate": 4.458342439808917e-06, + "loss": 1.1742, + "step": 7871 + }, + { + "epoch": 0.24, + "learning_rate": 4.458190810448667e-06, + "loss": 1.0813, + "step": 7872 + }, + { + "epoch": 0.24, + "learning_rate": 4.458039162447383e-06, + "loss": 1.1907, + "step": 7873 + }, + { + "epoch": 0.24, + "learning_rate": 4.457887495806509e-06, + "loss": 1.1782, + "step": 7874 + }, + { + "epoch": 0.24, + "learning_rate": 4.4577358105274895e-06, + "loss": 1.1801, + "step": 7875 + }, + { + "epoch": 0.24, + "learning_rate": 4.457584106611768e-06, + "loss": 1.2303, + "step": 7876 + }, + { + "epoch": 0.24, + "learning_rate": 4.457432384060789e-06, + "loss": 1.0813, + "step": 7877 + }, + { + "epoch": 0.24, + "learning_rate": 4.457280642875995e-06, + "loss": 1.2009, + "step": 7878 + }, + { + "epoch": 0.24, + "learning_rate": 4.457128883058833e-06, + "loss": 1.2347, + "step": 7879 + }, + { + "epoch": 0.24, + "learning_rate": 4.456977104610747e-06, + "loss": 1.0742, + "step": 7880 + }, + { + "epoch": 0.24, + "learning_rate": 4.456825307533181e-06, + "loss": 1.1774, + "step": 7881 + }, + { + "epoch": 0.24, + "learning_rate": 4.45667349182758e-06, + "loss": 1.0427, + "step": 7882 + }, + { + "epoch": 0.24, + "learning_rate": 4.45652165749539e-06, + "loss": 1.1793, + "step": 7883 + }, + { + "epoch": 0.24, + "learning_rate": 4.456369804538057e-06, + "loss": 1.1595, + "step": 7884 + }, + { + "epoch": 0.24, + "learning_rate": 4.4562179329570244e-06, + "loss": 1.0846, + "step": 7885 + }, + { + "epoch": 0.24, + "learning_rate": 4.45606604275374e-06, + "loss": 1.0973, + "step": 7886 + }, + { + "epoch": 0.24, + "learning_rate": 4.455914133929649e-06, + "loss": 1.2338, + "step": 7887 + }, + { + "epoch": 0.24, + "learning_rate": 4.455762206486197e-06, + "loss": 1.1283, + "step": 7888 + }, + { + "epoch": 0.24, + "learning_rate": 4.455610260424831e-06, + "loss": 1.1552, + "step": 7889 + }, + { + "epoch": 0.24, + "learning_rate": 4.455458295746997e-06, + "loss": 1.0464, + "step": 7890 + }, + { + "epoch": 0.24, + "learning_rate": 4.455306312454142e-06, + "loss": 1.0989, + "step": 7891 + }, + { + "epoch": 0.24, + "learning_rate": 4.4551543105477125e-06, + "loss": 1.119, + "step": 7892 + }, + { + "epoch": 0.24, + "learning_rate": 4.455002290029155e-06, + "loss": 1.0106, + "step": 7893 + }, + { + "epoch": 0.24, + "learning_rate": 4.454850250899918e-06, + "loss": 1.1262, + "step": 7894 + }, + { + "epoch": 0.24, + "learning_rate": 4.4546981931614474e-06, + "loss": 1.0757, + "step": 7895 + }, + { + "epoch": 0.24, + "learning_rate": 4.4545461168151924e-06, + "loss": 1.1639, + "step": 7896 + }, + { + "epoch": 0.24, + "learning_rate": 4.454394021862599e-06, + "loss": 1.0818, + "step": 7897 + }, + { + "epoch": 0.24, + "learning_rate": 4.454241908305116e-06, + "loss": 1.1544, + "step": 7898 + }, + { + "epoch": 0.24, + "learning_rate": 4.454089776144192e-06, + "loss": 1.1641, + "step": 7899 + }, + { + "epoch": 0.24, + "learning_rate": 4.4539376253812735e-06, + "loss": 1.2039, + "step": 7900 + }, + { + "epoch": 0.24, + "learning_rate": 4.45378545601781e-06, + "loss": 1.0464, + "step": 7901 + }, + { + "epoch": 0.24, + "learning_rate": 4.453633268055249e-06, + "loss": 1.2211, + "step": 7902 + }, + { + "epoch": 0.24, + "learning_rate": 4.453481061495042e-06, + "loss": 1.0961, + "step": 7903 + }, + { + "epoch": 0.24, + "learning_rate": 4.4533288363386355e-06, + "loss": 1.1863, + "step": 7904 + }, + { + "epoch": 0.24, + "learning_rate": 4.453176592587479e-06, + "loss": 1.1955, + "step": 7905 + }, + { + "epoch": 0.24, + "learning_rate": 4.453024330243022e-06, + "loss": 1.2641, + "step": 7906 + }, + { + "epoch": 0.24, + "learning_rate": 4.452872049306714e-06, + "loss": 1.1568, + "step": 7907 + }, + { + "epoch": 0.24, + "learning_rate": 4.452719749780005e-06, + "loss": 1.1518, + "step": 7908 + }, + { + "epoch": 0.24, + "learning_rate": 4.4525674316643445e-06, + "loss": 1.1196, + "step": 7909 + }, + { + "epoch": 0.24, + "learning_rate": 4.4524150949611815e-06, + "loss": 1.1393, + "step": 7910 + }, + { + "epoch": 0.24, + "learning_rate": 4.4522627396719675e-06, + "loss": 1.1055, + "step": 7911 + }, + { + "epoch": 0.24, + "learning_rate": 4.452110365798153e-06, + "loss": 1.2839, + "step": 7912 + }, + { + "epoch": 0.24, + "learning_rate": 4.451957973341188e-06, + "loss": 1.1273, + "step": 7913 + }, + { + "epoch": 0.24, + "learning_rate": 4.451805562302523e-06, + "loss": 1.2091, + "step": 7914 + }, + { + "epoch": 0.24, + "learning_rate": 4.451653132683608e-06, + "loss": 1.1501, + "step": 7915 + }, + { + "epoch": 0.24, + "learning_rate": 4.451500684485896e-06, + "loss": 1.0739, + "step": 7916 + }, + { + "epoch": 0.24, + "learning_rate": 4.451348217710838e-06, + "loss": 1.1884, + "step": 7917 + }, + { + "epoch": 0.24, + "learning_rate": 4.451195732359884e-06, + "loss": 1.1425, + "step": 7918 + }, + { + "epoch": 0.24, + "learning_rate": 4.451043228434486e-06, + "loss": 1.0618, + "step": 7919 + }, + { + "epoch": 0.24, + "learning_rate": 4.4508907059360964e-06, + "loss": 1.1638, + "step": 7920 + }, + { + "epoch": 0.24, + "learning_rate": 4.450738164866168e-06, + "loss": 1.0984, + "step": 7921 + }, + { + "epoch": 0.24, + "learning_rate": 4.450585605226151e-06, + "loss": 1.1284, + "step": 7922 + }, + { + "epoch": 0.24, + "learning_rate": 4.450433027017497e-06, + "loss": 1.2583, + "step": 7923 + }, + { + "epoch": 0.24, + "learning_rate": 4.450280430241663e-06, + "loss": 1.0807, + "step": 7924 + }, + { + "epoch": 0.24, + "learning_rate": 4.450127814900096e-06, + "loss": 1.1036, + "step": 7925 + }, + { + "epoch": 0.24, + "learning_rate": 4.449975180994252e-06, + "loss": 1.0587, + "step": 7926 + }, + { + "epoch": 0.24, + "learning_rate": 4.449822528525584e-06, + "loss": 1.1541, + "step": 7927 + }, + { + "epoch": 0.24, + "learning_rate": 4.449669857495544e-06, + "loss": 1.1586, + "step": 7928 + }, + { + "epoch": 0.24, + "learning_rate": 4.449517167905586e-06, + "loss": 1.2906, + "step": 7929 + }, + { + "epoch": 0.24, + "learning_rate": 4.449364459757164e-06, + "loss": 1.3253, + "step": 7930 + }, + { + "epoch": 0.24, + "learning_rate": 4.4492117330517315e-06, + "loss": 1.2844, + "step": 7931 + }, + { + "epoch": 0.24, + "learning_rate": 4.449058987790741e-06, + "loss": 1.053, + "step": 7932 + }, + { + "epoch": 0.24, + "learning_rate": 4.448906223975648e-06, + "loss": 1.0742, + "step": 7933 + }, + { + "epoch": 0.24, + "learning_rate": 4.448753441607907e-06, + "loss": 1.1511, + "step": 7934 + }, + { + "epoch": 0.24, + "learning_rate": 4.4486006406889705e-06, + "loss": 1.1647, + "step": 7935 + }, + { + "epoch": 0.24, + "learning_rate": 4.448447821220296e-06, + "loss": 1.2203, + "step": 7936 + }, + { + "epoch": 0.24, + "learning_rate": 4.448294983203336e-06, + "loss": 1.113, + "step": 7937 + }, + { + "epoch": 0.24, + "learning_rate": 4.448142126639545e-06, + "loss": 1.138, + "step": 7938 + }, + { + "epoch": 0.24, + "learning_rate": 4.44798925153038e-06, + "loss": 1.0695, + "step": 7939 + }, + { + "epoch": 0.24, + "learning_rate": 4.447836357877296e-06, + "loss": 1.1426, + "step": 7940 + }, + { + "epoch": 0.24, + "learning_rate": 4.447683445681748e-06, + "loss": 1.1262, + "step": 7941 + }, + { + "epoch": 0.24, + "learning_rate": 4.447530514945191e-06, + "loss": 1.0544, + "step": 7942 + }, + { + "epoch": 0.24, + "learning_rate": 4.447377565669081e-06, + "loss": 1.1482, + "step": 7943 + }, + { + "epoch": 0.24, + "learning_rate": 4.447224597854875e-06, + "loss": 1.1436, + "step": 7944 + }, + { + "epoch": 0.24, + "learning_rate": 4.447071611504029e-06, + "loss": 1.2139, + "step": 7945 + }, + { + "epoch": 0.24, + "learning_rate": 4.446918606617999e-06, + "loss": 1.0849, + "step": 7946 + }, + { + "epoch": 0.24, + "learning_rate": 4.446765583198242e-06, + "loss": 1.1539, + "step": 7947 + }, + { + "epoch": 0.24, + "learning_rate": 4.446612541246213e-06, + "loss": 1.1136, + "step": 7948 + }, + { + "epoch": 0.24, + "learning_rate": 4.446459480763371e-06, + "loss": 1.1942, + "step": 7949 + }, + { + "epoch": 0.24, + "learning_rate": 4.446306401751172e-06, + "loss": 1.2816, + "step": 7950 + }, + { + "epoch": 0.24, + "learning_rate": 4.446153304211074e-06, + "loss": 1.1587, + "step": 7951 + }, + { + "epoch": 0.24, + "learning_rate": 4.446000188144532e-06, + "loss": 1.1858, + "step": 7952 + }, + { + "epoch": 0.24, + "learning_rate": 4.445847053553008e-06, + "loss": 1.1284, + "step": 7953 + }, + { + "epoch": 0.24, + "learning_rate": 4.445693900437955e-06, + "loss": 1.1808, + "step": 7954 + }, + { + "epoch": 0.24, + "learning_rate": 4.445540728800834e-06, + "loss": 1.1431, + "step": 7955 + }, + { + "epoch": 0.24, + "learning_rate": 4.445387538643102e-06, + "loss": 1.2555, + "step": 7956 + }, + { + "epoch": 0.24, + "learning_rate": 4.445234329966218e-06, + "loss": 1.0815, + "step": 7957 + }, + { + "epoch": 0.24, + "learning_rate": 4.44508110277164e-06, + "loss": 1.1338, + "step": 7958 + }, + { + "epoch": 0.24, + "learning_rate": 4.4449278570608264e-06, + "loss": 1.1624, + "step": 7959 + }, + { + "epoch": 0.24, + "learning_rate": 4.444774592835236e-06, + "loss": 1.0977, + "step": 7960 + }, + { + "epoch": 0.24, + "learning_rate": 4.444621310096329e-06, + "loss": 1.1797, + "step": 7961 + }, + { + "epoch": 0.24, + "learning_rate": 4.444468008845563e-06, + "loss": 1.1359, + "step": 7962 + }, + { + "epoch": 0.24, + "learning_rate": 4.444314689084398e-06, + "loss": 1.2845, + "step": 7963 + }, + { + "epoch": 0.24, + "learning_rate": 4.444161350814295e-06, + "loss": 1.0662, + "step": 7964 + }, + { + "epoch": 0.24, + "learning_rate": 4.4440079940367105e-06, + "loss": 1.0358, + "step": 7965 + }, + { + "epoch": 0.24, + "learning_rate": 4.4438546187531066e-06, + "loss": 1.0928, + "step": 7966 + }, + { + "epoch": 0.24, + "learning_rate": 4.443701224964943e-06, + "loss": 1.2373, + "step": 7967 + }, + { + "epoch": 0.24, + "learning_rate": 4.44354781267368e-06, + "loss": 1.2357, + "step": 7968 + }, + { + "epoch": 0.24, + "learning_rate": 4.443394381880778e-06, + "loss": 1.0406, + "step": 7969 + }, + { + "epoch": 0.24, + "learning_rate": 4.443240932587697e-06, + "loss": 1.1857, + "step": 7970 + }, + { + "epoch": 0.24, + "learning_rate": 4.4430874647958985e-06, + "loss": 1.1573, + "step": 7971 + }, + { + "epoch": 0.24, + "learning_rate": 4.442933978506843e-06, + "loss": 1.1655, + "step": 7972 + }, + { + "epoch": 0.24, + "learning_rate": 4.442780473721993e-06, + "loss": 1.207, + "step": 7973 + }, + { + "epoch": 0.24, + "learning_rate": 4.442626950442807e-06, + "loss": 1.1916, + "step": 7974 + }, + { + "epoch": 0.24, + "learning_rate": 4.442473408670748e-06, + "loss": 1.1768, + "step": 7975 + }, + { + "epoch": 0.24, + "learning_rate": 4.442319848407279e-06, + "loss": 1.191, + "step": 7976 + }, + { + "epoch": 0.24, + "learning_rate": 4.442166269653859e-06, + "loss": 1.1396, + "step": 7977 + }, + { + "epoch": 0.24, + "learning_rate": 4.442012672411953e-06, + "loss": 1.107, + "step": 7978 + }, + { + "epoch": 0.24, + "learning_rate": 4.44185905668302e-06, + "loss": 1.2402, + "step": 7979 + }, + { + "epoch": 0.24, + "learning_rate": 4.441705422468525e-06, + "loss": 1.2397, + "step": 7980 + }, + { + "epoch": 0.24, + "learning_rate": 4.44155176976993e-06, + "loss": 1.0179, + "step": 7981 + }, + { + "epoch": 0.24, + "learning_rate": 4.441398098588696e-06, + "loss": 1.1895, + "step": 7982 + }, + { + "epoch": 0.24, + "learning_rate": 4.441244408926288e-06, + "loss": 1.1206, + "step": 7983 + }, + { + "epoch": 0.24, + "learning_rate": 4.441090700784167e-06, + "loss": 0.9675, + "step": 7984 + }, + { + "epoch": 0.24, + "learning_rate": 4.440936974163799e-06, + "loss": 1.1792, + "step": 7985 + }, + { + "epoch": 0.24, + "learning_rate": 4.440783229066645e-06, + "loss": 1.1204, + "step": 7986 + }, + { + "epoch": 0.24, + "learning_rate": 4.440629465494169e-06, + "loss": 1.2523, + "step": 7987 + }, + { + "epoch": 0.24, + "learning_rate": 4.4404756834478366e-06, + "loss": 1.1115, + "step": 7988 + }, + { + "epoch": 0.24, + "learning_rate": 4.440321882929109e-06, + "loss": 1.0291, + "step": 7989 + }, + { + "epoch": 0.24, + "learning_rate": 4.440168063939452e-06, + "loss": 1.2223, + "step": 7990 + }, + { + "epoch": 0.24, + "learning_rate": 4.440014226480329e-06, + "loss": 0.9936, + "step": 7991 + }, + { + "epoch": 0.24, + "learning_rate": 4.439860370553205e-06, + "loss": 1.1622, + "step": 7992 + }, + { + "epoch": 0.24, + "learning_rate": 4.4397064961595445e-06, + "loss": 1.2214, + "step": 7993 + }, + { + "epoch": 0.24, + "learning_rate": 4.439552603300813e-06, + "loss": 1.0776, + "step": 7994 + }, + { + "epoch": 0.24, + "learning_rate": 4.4393986919784745e-06, + "loss": 1.2139, + "step": 7995 + }, + { + "epoch": 0.24, + "learning_rate": 4.439244762193994e-06, + "loss": 1.0912, + "step": 7996 + }, + { + "epoch": 0.24, + "learning_rate": 4.439090813948838e-06, + "loss": 1.1528, + "step": 7997 + }, + { + "epoch": 0.24, + "learning_rate": 4.438936847244471e-06, + "loss": 1.1414, + "step": 7998 + }, + { + "epoch": 0.24, + "learning_rate": 4.438782862082359e-06, + "loss": 1.1915, + "step": 7999 + }, + { + "epoch": 0.24, + "learning_rate": 4.438628858463968e-06, + "loss": 1.2137, + "step": 8000 + }, + { + "epoch": 0.24, + "learning_rate": 4.438474836390765e-06, + "loss": 1.1593, + "step": 8001 + }, + { + "epoch": 0.24, + "learning_rate": 4.438320795864214e-06, + "loss": 1.0856, + "step": 8002 + }, + { + "epoch": 0.24, + "learning_rate": 4.438166736885782e-06, + "loss": 1.1267, + "step": 8003 + }, + { + "epoch": 0.24, + "learning_rate": 4.438012659456937e-06, + "loss": 1.1837, + "step": 8004 + }, + { + "epoch": 0.24, + "learning_rate": 4.437858563579145e-06, + "loss": 1.1456, + "step": 8005 + }, + { + "epoch": 0.24, + "learning_rate": 4.437704449253872e-06, + "loss": 1.0795, + "step": 8006 + }, + { + "epoch": 0.24, + "learning_rate": 4.437550316482586e-06, + "loss": 1.1174, + "step": 8007 + }, + { + "epoch": 0.24, + "learning_rate": 4.437396165266755e-06, + "loss": 1.2197, + "step": 8008 + }, + { + "epoch": 0.24, + "learning_rate": 4.437241995607845e-06, + "loss": 1.1523, + "step": 8009 + }, + { + "epoch": 0.24, + "learning_rate": 4.437087807507324e-06, + "loss": 1.254, + "step": 8010 + }, + { + "epoch": 0.24, + "learning_rate": 4.436933600966661e-06, + "loss": 1.1293, + "step": 8011 + }, + { + "epoch": 0.24, + "learning_rate": 4.436779375987322e-06, + "loss": 1.1516, + "step": 8012 + }, + { + "epoch": 0.24, + "learning_rate": 4.436625132570776e-06, + "loss": 1.0793, + "step": 8013 + }, + { + "epoch": 0.24, + "learning_rate": 4.4364708707184925e-06, + "loss": 1.064, + "step": 8014 + }, + { + "epoch": 0.24, + "learning_rate": 4.436316590431938e-06, + "loss": 1.2316, + "step": 8015 + }, + { + "epoch": 0.24, + "learning_rate": 4.436162291712582e-06, + "loss": 1.0907, + "step": 8016 + }, + { + "epoch": 0.24, + "learning_rate": 4.436007974561894e-06, + "loss": 1.1115, + "step": 8017 + }, + { + "epoch": 0.24, + "learning_rate": 4.435853638981343e-06, + "loss": 1.2773, + "step": 8018 + }, + { + "epoch": 0.24, + "learning_rate": 4.4356992849723965e-06, + "loss": 1.1716, + "step": 8019 + }, + { + "epoch": 0.24, + "learning_rate": 4.4355449125365255e-06, + "loss": 1.2233, + "step": 8020 + }, + { + "epoch": 0.24, + "learning_rate": 4.435390521675199e-06, + "loss": 1.0585, + "step": 8021 + }, + { + "epoch": 0.24, + "learning_rate": 4.435236112389888e-06, + "loss": 1.1956, + "step": 8022 + }, + { + "epoch": 0.24, + "learning_rate": 4.43508168468206e-06, + "loss": 1.2044, + "step": 8023 + }, + { + "epoch": 0.24, + "learning_rate": 4.434927238553186e-06, + "loss": 1.2375, + "step": 8024 + }, + { + "epoch": 0.24, + "learning_rate": 4.4347727740047375e-06, + "loss": 1.1332, + "step": 8025 + }, + { + "epoch": 0.24, + "learning_rate": 4.4346182910381845e-06, + "loss": 1.1552, + "step": 8026 + }, + { + "epoch": 0.24, + "learning_rate": 4.434463789654996e-06, + "loss": 1.152, + "step": 8027 + }, + { + "epoch": 0.24, + "learning_rate": 4.434309269856644e-06, + "loss": 1.1022, + "step": 8028 + }, + { + "epoch": 0.24, + "learning_rate": 4.4341547316446e-06, + "loss": 1.2076, + "step": 8029 + }, + { + "epoch": 0.24, + "learning_rate": 4.434000175020334e-06, + "loss": 1.2782, + "step": 8030 + }, + { + "epoch": 0.24, + "learning_rate": 4.4338455999853176e-06, + "loss": 1.1791, + "step": 8031 + }, + { + "epoch": 0.24, + "learning_rate": 4.433691006541023e-06, + "loss": 1.0434, + "step": 8032 + }, + { + "epoch": 0.24, + "learning_rate": 4.433536394688921e-06, + "loss": 1.1109, + "step": 8033 + }, + { + "epoch": 0.24, + "learning_rate": 4.4333817644304834e-06, + "loss": 1.0406, + "step": 8034 + }, + { + "epoch": 0.24, + "learning_rate": 4.433227115767183e-06, + "loss": 1.1707, + "step": 8035 + }, + { + "epoch": 0.24, + "learning_rate": 4.433072448700492e-06, + "loss": 1.1721, + "step": 8036 + }, + { + "epoch": 0.24, + "learning_rate": 4.432917763231881e-06, + "loss": 1.2971, + "step": 8037 + }, + { + "epoch": 0.24, + "learning_rate": 4.432763059362825e-06, + "loss": 1.097, + "step": 8038 + }, + { + "epoch": 0.24, + "learning_rate": 4.432608337094795e-06, + "loss": 1.1282, + "step": 8039 + }, + { + "epoch": 0.24, + "learning_rate": 4.432453596429265e-06, + "loss": 1.0529, + "step": 8040 + }, + { + "epoch": 0.24, + "learning_rate": 4.432298837367707e-06, + "loss": 1.1046, + "step": 8041 + }, + { + "epoch": 0.24, + "learning_rate": 4.432144059911595e-06, + "loss": 1.2341, + "step": 8042 + }, + { + "epoch": 0.24, + "learning_rate": 4.431989264062401e-06, + "loss": 1.2748, + "step": 8043 + }, + { + "epoch": 0.24, + "learning_rate": 4.4318344498216e-06, + "loss": 1.0856, + "step": 8044 + }, + { + "epoch": 0.24, + "learning_rate": 4.431679617190667e-06, + "loss": 1.1339, + "step": 8045 + }, + { + "epoch": 0.24, + "learning_rate": 4.431524766171073e-06, + "loss": 1.0223, + "step": 8046 + }, + { + "epoch": 0.24, + "learning_rate": 4.431369896764294e-06, + "loss": 1.1754, + "step": 8047 + }, + { + "epoch": 0.24, + "learning_rate": 4.431215008971803e-06, + "loss": 1.0849, + "step": 8048 + }, + { + "epoch": 0.24, + "learning_rate": 4.431060102795076e-06, + "loss": 1.1964, + "step": 8049 + }, + { + "epoch": 0.24, + "learning_rate": 4.430905178235586e-06, + "loss": 1.0989, + "step": 8050 + }, + { + "epoch": 0.24, + "learning_rate": 4.43075023529481e-06, + "loss": 1.1728, + "step": 8051 + }, + { + "epoch": 0.24, + "learning_rate": 4.4305952739742205e-06, + "loss": 1.0834, + "step": 8052 + }, + { + "epoch": 0.24, + "learning_rate": 4.430440294275295e-06, + "loss": 1.1642, + "step": 8053 + }, + { + "epoch": 0.24, + "learning_rate": 4.430285296199506e-06, + "loss": 1.055, + "step": 8054 + }, + { + "epoch": 0.24, + "learning_rate": 4.430130279748331e-06, + "loss": 1.1239, + "step": 8055 + }, + { + "epoch": 0.24, + "learning_rate": 4.429975244923247e-06, + "loss": 1.1863, + "step": 8056 + }, + { + "epoch": 0.24, + "learning_rate": 4.429820191725726e-06, + "loss": 1.1256, + "step": 8057 + }, + { + "epoch": 0.24, + "learning_rate": 4.429665120157247e-06, + "loss": 1.0743, + "step": 8058 + }, + { + "epoch": 0.24, + "learning_rate": 4.4295100302192865e-06, + "loss": 1.0575, + "step": 8059 + }, + { + "epoch": 0.24, + "learning_rate": 4.429354921913318e-06, + "loss": 1.0447, + "step": 8060 + }, + { + "epoch": 0.24, + "learning_rate": 4.429199795240821e-06, + "loss": 1.1481, + "step": 8061 + }, + { + "epoch": 0.24, + "learning_rate": 4.42904465020327e-06, + "loss": 1.3103, + "step": 8062 + }, + { + "epoch": 0.24, + "learning_rate": 4.428889486802145e-06, + "loss": 1.1431, + "step": 8063 + }, + { + "epoch": 0.24, + "learning_rate": 4.42873430503892e-06, + "loss": 1.1853, + "step": 8064 + }, + { + "epoch": 0.24, + "learning_rate": 4.428579104915072e-06, + "loss": 1.1296, + "step": 8065 + }, + { + "epoch": 0.24, + "learning_rate": 4.428423886432082e-06, + "loss": 1.1759, + "step": 8066 + }, + { + "epoch": 0.24, + "learning_rate": 4.428268649591424e-06, + "loss": 1.1272, + "step": 8067 + }, + { + "epoch": 0.24, + "learning_rate": 4.428113394394578e-06, + "loss": 1.1377, + "step": 8068 + }, + { + "epoch": 0.24, + "learning_rate": 4.42795812084302e-06, + "loss": 1.1102, + "step": 8069 + }, + { + "epoch": 0.24, + "learning_rate": 4.4278028289382295e-06, + "loss": 1.14, + "step": 8070 + }, + { + "epoch": 0.24, + "learning_rate": 4.427647518681685e-06, + "loss": 1.1193, + "step": 8071 + }, + { + "epoch": 0.24, + "learning_rate": 4.427492190074864e-06, + "loss": 1.1371, + "step": 8072 + }, + { + "epoch": 0.24, + "learning_rate": 4.427336843119247e-06, + "loss": 1.1761, + "step": 8073 + }, + { + "epoch": 0.24, + "learning_rate": 4.4271814778163096e-06, + "loss": 1.2954, + "step": 8074 + }, + { + "epoch": 0.24, + "learning_rate": 4.427026094167534e-06, + "loss": 1.15, + "step": 8075 + }, + { + "epoch": 0.24, + "learning_rate": 4.426870692174397e-06, + "loss": 1.1761, + "step": 8076 + }, + { + "epoch": 0.24, + "learning_rate": 4.42671527183838e-06, + "loss": 1.077, + "step": 8077 + }, + { + "epoch": 0.24, + "learning_rate": 4.426559833160961e-06, + "loss": 1.1414, + "step": 8078 + }, + { + "epoch": 0.24, + "learning_rate": 4.426404376143621e-06, + "loss": 1.1417, + "step": 8079 + }, + { + "epoch": 0.24, + "learning_rate": 4.426248900787838e-06, + "loss": 1.0883, + "step": 8080 + }, + { + "epoch": 0.24, + "learning_rate": 4.426093407095095e-06, + "loss": 1.1419, + "step": 8081 + }, + { + "epoch": 0.24, + "learning_rate": 4.425937895066868e-06, + "loss": 1.202, + "step": 8082 + }, + { + "epoch": 0.24, + "learning_rate": 4.425782364704642e-06, + "loss": 1.1241, + "step": 8083 + }, + { + "epoch": 0.24, + "learning_rate": 4.425626816009894e-06, + "loss": 1.1582, + "step": 8084 + }, + { + "epoch": 0.24, + "learning_rate": 4.425471248984106e-06, + "loss": 1.2221, + "step": 8085 + }, + { + "epoch": 0.24, + "learning_rate": 4.42531566362876e-06, + "loss": 1.248, + "step": 8086 + }, + { + "epoch": 0.24, + "learning_rate": 4.425160059945335e-06, + "loss": 1.0651, + "step": 8087 + }, + { + "epoch": 0.24, + "learning_rate": 4.425004437935314e-06, + "loss": 1.1818, + "step": 8088 + }, + { + "epoch": 0.24, + "learning_rate": 4.424848797600179e-06, + "loss": 1.0873, + "step": 8089 + }, + { + "epoch": 0.24, + "learning_rate": 4.424693138941409e-06, + "loss": 1.1189, + "step": 8090 + }, + { + "epoch": 0.24, + "learning_rate": 4.424537461960488e-06, + "loss": 1.1472, + "step": 8091 + }, + { + "epoch": 0.24, + "learning_rate": 4.424381766658896e-06, + "loss": 1.1208, + "step": 8092 + }, + { + "epoch": 0.24, + "learning_rate": 4.424226053038118e-06, + "loss": 1.1375, + "step": 8093 + }, + { + "epoch": 0.24, + "learning_rate": 4.424070321099634e-06, + "loss": 1.226, + "step": 8094 + }, + { + "epoch": 0.24, + "learning_rate": 4.4239145708449275e-06, + "loss": 1.0613, + "step": 8095 + }, + { + "epoch": 0.24, + "learning_rate": 4.423758802275481e-06, + "loss": 1.094, + "step": 8096 + }, + { + "epoch": 0.24, + "learning_rate": 4.423603015392777e-06, + "loss": 1.124, + "step": 8097 + }, + { + "epoch": 0.24, + "learning_rate": 4.423447210198298e-06, + "loss": 1.1565, + "step": 8098 + }, + { + "epoch": 0.24, + "learning_rate": 4.423291386693528e-06, + "loss": 1.1765, + "step": 8099 + }, + { + "epoch": 0.24, + "learning_rate": 4.4231355448799514e-06, + "loss": 1.1245, + "step": 8100 + }, + { + "epoch": 0.24, + "learning_rate": 4.42297968475905e-06, + "loss": 1.1304, + "step": 8101 + }, + { + "epoch": 0.24, + "learning_rate": 4.422823806332308e-06, + "loss": 1.0903, + "step": 8102 + }, + { + "epoch": 0.24, + "learning_rate": 4.42266790960121e-06, + "loss": 1.1526, + "step": 8103 + }, + { + "epoch": 0.24, + "learning_rate": 4.422511994567239e-06, + "loss": 1.1605, + "step": 8104 + }, + { + "epoch": 0.24, + "learning_rate": 4.4223560612318795e-06, + "loss": 1.2169, + "step": 8105 + }, + { + "epoch": 0.24, + "learning_rate": 4.422200109596616e-06, + "loss": 1.1373, + "step": 8106 + }, + { + "epoch": 0.24, + "learning_rate": 4.422044139662934e-06, + "loss": 1.1785, + "step": 8107 + }, + { + "epoch": 0.24, + "learning_rate": 4.421888151432318e-06, + "loss": 1.2105, + "step": 8108 + }, + { + "epoch": 0.24, + "learning_rate": 4.421732144906251e-06, + "loss": 1.176, + "step": 8109 + }, + { + "epoch": 0.24, + "learning_rate": 4.42157612008622e-06, + "loss": 1.2693, + "step": 8110 + }, + { + "epoch": 0.24, + "learning_rate": 4.42142007697371e-06, + "loss": 1.2548, + "step": 8111 + }, + { + "epoch": 0.24, + "learning_rate": 4.4212640155702056e-06, + "loss": 1.2562, + "step": 8112 + }, + { + "epoch": 0.24, + "learning_rate": 4.4211079358771945e-06, + "loss": 1.187, + "step": 8113 + }, + { + "epoch": 0.24, + "learning_rate": 4.42095183789616e-06, + "loss": 1.2155, + "step": 8114 + }, + { + "epoch": 0.24, + "learning_rate": 4.420795721628589e-06, + "loss": 1.0437, + "step": 8115 + }, + { + "epoch": 0.24, + "learning_rate": 4.420639587075969e-06, + "loss": 1.1505, + "step": 8116 + }, + { + "epoch": 0.24, + "learning_rate": 4.420483434239784e-06, + "loss": 1.2192, + "step": 8117 + }, + { + "epoch": 0.24, + "learning_rate": 4.420327263121522e-06, + "loss": 1.1306, + "step": 8118 + }, + { + "epoch": 0.24, + "learning_rate": 4.420171073722669e-06, + "loss": 1.1, + "step": 8119 + }, + { + "epoch": 0.24, + "learning_rate": 4.420014866044713e-06, + "loss": 1.1251, + "step": 8120 + }, + { + "epoch": 0.24, + "learning_rate": 4.41985864008914e-06, + "loss": 1.1, + "step": 8121 + }, + { + "epoch": 0.24, + "learning_rate": 4.419702395857437e-06, + "loss": 1.1216, + "step": 8122 + }, + { + "epoch": 0.24, + "learning_rate": 4.419546133351091e-06, + "loss": 1.1393, + "step": 8123 + }, + { + "epoch": 0.24, + "learning_rate": 4.419389852571592e-06, + "loss": 1.0246, + "step": 8124 + }, + { + "epoch": 0.24, + "learning_rate": 4.419233553520425e-06, + "loss": 1.2021, + "step": 8125 + }, + { + "epoch": 0.24, + "learning_rate": 4.419077236199078e-06, + "loss": 1.1174, + "step": 8126 + }, + { + "epoch": 0.24, + "learning_rate": 4.418920900609041e-06, + "loss": 1.231, + "step": 8127 + }, + { + "epoch": 0.24, + "learning_rate": 4.418764546751802e-06, + "loss": 0.9951, + "step": 8128 + }, + { + "epoch": 0.24, + "learning_rate": 4.418608174628847e-06, + "loss": 1.1029, + "step": 8129 + }, + { + "epoch": 0.24, + "learning_rate": 4.4184517842416675e-06, + "loss": 1.144, + "step": 8130 + }, + { + "epoch": 0.24, + "learning_rate": 4.41829537559175e-06, + "loss": 1.2591, + "step": 8131 + }, + { + "epoch": 0.24, + "learning_rate": 4.4181389486805846e-06, + "loss": 1.0481, + "step": 8132 + }, + { + "epoch": 0.25, + "learning_rate": 4.417982503509661e-06, + "loss": 1.1017, + "step": 8133 + }, + { + "epoch": 0.25, + "learning_rate": 4.417826040080467e-06, + "loss": 1.0841, + "step": 8134 + }, + { + "epoch": 0.25, + "learning_rate": 4.417669558394494e-06, + "loss": 1.0522, + "step": 8135 + }, + { + "epoch": 0.25, + "learning_rate": 4.417513058453229e-06, + "loss": 1.1411, + "step": 8136 + }, + { + "epoch": 0.25, + "learning_rate": 4.417356540258163e-06, + "loss": 1.0753, + "step": 8137 + }, + { + "epoch": 0.25, + "learning_rate": 4.417200003810787e-06, + "loss": 1.0696, + "step": 8138 + }, + { + "epoch": 0.25, + "learning_rate": 4.41704344911259e-06, + "loss": 1.1808, + "step": 8139 + }, + { + "epoch": 0.25, + "learning_rate": 4.416886876165062e-06, + "loss": 1.1295, + "step": 8140 + }, + { + "epoch": 0.25, + "learning_rate": 4.416730284969695e-06, + "loss": 1.2097, + "step": 8141 + }, + { + "epoch": 0.25, + "learning_rate": 4.416573675527979e-06, + "loss": 1.1305, + "step": 8142 + }, + { + "epoch": 0.25, + "learning_rate": 4.416417047841404e-06, + "loss": 1.2, + "step": 8143 + }, + { + "epoch": 0.25, + "learning_rate": 4.416260401911463e-06, + "loss": 1.192, + "step": 8144 + }, + { + "epoch": 0.25, + "learning_rate": 4.416103737739645e-06, + "loss": 1.1106, + "step": 8145 + }, + { + "epoch": 0.25, + "learning_rate": 4.4159470553274405e-06, + "loss": 1.1282, + "step": 8146 + }, + { + "epoch": 0.25, + "learning_rate": 4.4157903546763445e-06, + "loss": 1.1246, + "step": 8147 + }, + { + "epoch": 0.25, + "learning_rate": 4.415633635787848e-06, + "loss": 1.2902, + "step": 8148 + }, + { + "epoch": 0.25, + "learning_rate": 4.4154768986634396e-06, + "loss": 1.1959, + "step": 8149 + }, + { + "epoch": 0.25, + "learning_rate": 4.415320143304616e-06, + "loss": 1.075, + "step": 8150 + }, + { + "epoch": 0.25, + "learning_rate": 4.4151633697128656e-06, + "loss": 1.2281, + "step": 8151 + }, + { + "epoch": 0.25, + "learning_rate": 4.4150065778896824e-06, + "loss": 1.036, + "step": 8152 + }, + { + "epoch": 0.25, + "learning_rate": 4.41484976783656e-06, + "loss": 1.0776, + "step": 8153 + }, + { + "epoch": 0.25, + "learning_rate": 4.414692939554988e-06, + "loss": 1.2093, + "step": 8154 + }, + { + "epoch": 0.25, + "learning_rate": 4.4145360930464625e-06, + "loss": 1.1767, + "step": 8155 + }, + { + "epoch": 0.25, + "learning_rate": 4.414379228312476e-06, + "loss": 1.2219, + "step": 8156 + }, + { + "epoch": 0.25, + "learning_rate": 4.41422234535452e-06, + "loss": 1.1959, + "step": 8157 + }, + { + "epoch": 0.25, + "learning_rate": 4.41406544417409e-06, + "loss": 1.161, + "step": 8158 + }, + { + "epoch": 0.25, + "learning_rate": 4.413908524772679e-06, + "loss": 1.1547, + "step": 8159 + }, + { + "epoch": 0.25, + "learning_rate": 4.41375158715178e-06, + "loss": 1.1699, + "step": 8160 + }, + { + "epoch": 0.25, + "learning_rate": 4.413594631312888e-06, + "loss": 1.1525, + "step": 8161 + }, + { + "epoch": 0.25, + "learning_rate": 4.413437657257497e-06, + "loss": 1.1572, + "step": 8162 + }, + { + "epoch": 0.25, + "learning_rate": 4.413280664987101e-06, + "loss": 1.0768, + "step": 8163 + }, + { + "epoch": 0.25, + "learning_rate": 4.413123654503193e-06, + "loss": 1.1473, + "step": 8164 + }, + { + "epoch": 0.25, + "learning_rate": 4.412966625807271e-06, + "loss": 1.1757, + "step": 8165 + }, + { + "epoch": 0.25, + "learning_rate": 4.412809578900827e-06, + "loss": 1.1992, + "step": 8166 + }, + { + "epoch": 0.25, + "learning_rate": 4.412652513785358e-06, + "loss": 1.203, + "step": 8167 + }, + { + "epoch": 0.25, + "learning_rate": 4.412495430462358e-06, + "loss": 1.1783, + "step": 8168 + }, + { + "epoch": 0.25, + "learning_rate": 4.412338328933322e-06, + "loss": 1.1821, + "step": 8169 + }, + { + "epoch": 0.25, + "learning_rate": 4.412181209199746e-06, + "loss": 1.1238, + "step": 8170 + }, + { + "epoch": 0.25, + "learning_rate": 4.412024071263127e-06, + "loss": 1.0764, + "step": 8171 + }, + { + "epoch": 0.25, + "learning_rate": 4.411866915124959e-06, + "loss": 1.1716, + "step": 8172 + }, + { + "epoch": 0.25, + "learning_rate": 4.411709740786738e-06, + "loss": 1.1074, + "step": 8173 + }, + { + "epoch": 0.25, + "learning_rate": 4.4115525482499625e-06, + "loss": 1.1932, + "step": 8174 + }, + { + "epoch": 0.25, + "learning_rate": 4.411395337516126e-06, + "loss": 1.1805, + "step": 8175 + }, + { + "epoch": 0.25, + "learning_rate": 4.411238108586727e-06, + "loss": 1.1371, + "step": 8176 + }, + { + "epoch": 0.25, + "learning_rate": 4.411080861463262e-06, + "loss": 1.2319, + "step": 8177 + }, + { + "epoch": 0.25, + "learning_rate": 4.410923596147227e-06, + "loss": 1.1094, + "step": 8178 + }, + { + "epoch": 0.25, + "learning_rate": 4.41076631264012e-06, + "loss": 1.1132, + "step": 8179 + }, + { + "epoch": 0.25, + "learning_rate": 4.410609010943439e-06, + "loss": 1.155, + "step": 8180 + }, + { + "epoch": 0.25, + "learning_rate": 4.410451691058679e-06, + "loss": 1.1743, + "step": 8181 + }, + { + "epoch": 0.25, + "learning_rate": 4.410294352987339e-06, + "loss": 1.0682, + "step": 8182 + }, + { + "epoch": 0.25, + "learning_rate": 4.410136996730917e-06, + "loss": 1.1361, + "step": 8183 + }, + { + "epoch": 0.25, + "learning_rate": 4.409979622290911e-06, + "loss": 1.136, + "step": 8184 + }, + { + "epoch": 0.25, + "learning_rate": 4.409822229668819e-06, + "loss": 1.1327, + "step": 8185 + }, + { + "epoch": 0.25, + "learning_rate": 4.409664818866139e-06, + "loss": 1.2369, + "step": 8186 + }, + { + "epoch": 0.25, + "learning_rate": 4.40950738988437e-06, + "loss": 1.1357, + "step": 8187 + }, + { + "epoch": 0.25, + "learning_rate": 4.40934994272501e-06, + "loss": 1.2925, + "step": 8188 + }, + { + "epoch": 0.25, + "learning_rate": 4.409192477389558e-06, + "loss": 1.2079, + "step": 8189 + }, + { + "epoch": 0.25, + "learning_rate": 4.409034993879513e-06, + "loss": 1.224, + "step": 8190 + }, + { + "epoch": 0.25, + "learning_rate": 4.408877492196374e-06, + "loss": 1.0992, + "step": 8191 + }, + { + "epoch": 0.25, + "learning_rate": 4.40871997234164e-06, + "loss": 1.1313, + "step": 8192 + }, + { + "epoch": 0.25, + "learning_rate": 4.4085624343168135e-06, + "loss": 1.2179, + "step": 8193 + }, + { + "epoch": 0.25, + "learning_rate": 4.40840487812339e-06, + "loss": 1.1684, + "step": 8194 + }, + { + "epoch": 0.25, + "learning_rate": 4.408247303762872e-06, + "loss": 1.1437, + "step": 8195 + }, + { + "epoch": 0.25, + "learning_rate": 4.408089711236758e-06, + "loss": 1.1318, + "step": 8196 + }, + { + "epoch": 0.25, + "learning_rate": 4.4079321005465494e-06, + "loss": 1.0892, + "step": 8197 + }, + { + "epoch": 0.25, + "learning_rate": 4.407774471693747e-06, + "loss": 1.2199, + "step": 8198 + }, + { + "epoch": 0.25, + "learning_rate": 4.407616824679849e-06, + "loss": 1.214, + "step": 8199 + }, + { + "epoch": 0.25, + "learning_rate": 4.4074591595063575e-06, + "loss": 1.2383, + "step": 8200 + }, + { + "epoch": 0.25, + "learning_rate": 4.407301476174774e-06, + "loss": 1.2753, + "step": 8201 + }, + { + "epoch": 0.25, + "learning_rate": 4.4071437746866e-06, + "loss": 1.1176, + "step": 8202 + }, + { + "epoch": 0.25, + "learning_rate": 4.4069860550433345e-06, + "loss": 1.2004, + "step": 8203 + }, + { + "epoch": 0.25, + "learning_rate": 4.40682831724648e-06, + "loss": 1.1729, + "step": 8204 + }, + { + "epoch": 0.25, + "learning_rate": 4.406670561297539e-06, + "loss": 1.1278, + "step": 8205 + }, + { + "epoch": 0.25, + "learning_rate": 4.4065127871980126e-06, + "loss": 1.3109, + "step": 8206 + }, + { + "epoch": 0.25, + "learning_rate": 4.406354994949402e-06, + "loss": 1.194, + "step": 8207 + }, + { + "epoch": 0.25, + "learning_rate": 4.40619718455321e-06, + "loss": 1.1125, + "step": 8208 + }, + { + "epoch": 0.25, + "learning_rate": 4.406039356010939e-06, + "loss": 1.1163, + "step": 8209 + }, + { + "epoch": 0.25, + "learning_rate": 4.405881509324093e-06, + "loss": 1.1642, + "step": 8210 + }, + { + "epoch": 0.25, + "learning_rate": 4.405723644494171e-06, + "loss": 1.297, + "step": 8211 + }, + { + "epoch": 0.25, + "learning_rate": 4.405565761522677e-06, + "loss": 1.0835, + "step": 8212 + }, + { + "epoch": 0.25, + "learning_rate": 4.405407860411117e-06, + "loss": 1.0989, + "step": 8213 + }, + { + "epoch": 0.25, + "learning_rate": 4.405249941160991e-06, + "loss": 1.1122, + "step": 8214 + }, + { + "epoch": 0.25, + "learning_rate": 4.405092003773802e-06, + "loss": 1.1249, + "step": 8215 + }, + { + "epoch": 0.25, + "learning_rate": 4.404934048251056e-06, + "loss": 1.0598, + "step": 8216 + }, + { + "epoch": 0.25, + "learning_rate": 4.404776074594255e-06, + "loss": 1.136, + "step": 8217 + }, + { + "epoch": 0.25, + "learning_rate": 4.404618082804903e-06, + "loss": 1.0652, + "step": 8218 + }, + { + "epoch": 0.25, + "learning_rate": 4.404460072884505e-06, + "loss": 1.097, + "step": 8219 + }, + { + "epoch": 0.25, + "learning_rate": 4.404302044834563e-06, + "loss": 1.1173, + "step": 8220 + }, + { + "epoch": 0.25, + "learning_rate": 4.404143998656582e-06, + "loss": 1.1498, + "step": 8221 + }, + { + "epoch": 0.25, + "learning_rate": 4.403985934352069e-06, + "loss": 1.2197, + "step": 8222 + }, + { + "epoch": 0.25, + "learning_rate": 4.403827851922526e-06, + "loss": 1.0848, + "step": 8223 + }, + { + "epoch": 0.25, + "learning_rate": 4.40366975136946e-06, + "loss": 1.1556, + "step": 8224 + }, + { + "epoch": 0.25, + "learning_rate": 4.403511632694373e-06, + "loss": 1.0685, + "step": 8225 + }, + { + "epoch": 0.25, + "learning_rate": 4.4033534958987736e-06, + "loss": 1.2018, + "step": 8226 + }, + { + "epoch": 0.25, + "learning_rate": 4.403195340984164e-06, + "loss": 1.1676, + "step": 8227 + }, + { + "epoch": 0.25, + "learning_rate": 4.403037167952052e-06, + "loss": 1.0922, + "step": 8228 + }, + { + "epoch": 0.25, + "learning_rate": 4.402878976803943e-06, + "loss": 1.2458, + "step": 8229 + }, + { + "epoch": 0.25, + "learning_rate": 4.402720767541343e-06, + "loss": 1.1539, + "step": 8230 + }, + { + "epoch": 0.25, + "learning_rate": 4.402562540165757e-06, + "loss": 1.1722, + "step": 8231 + }, + { + "epoch": 0.25, + "learning_rate": 4.402404294678692e-06, + "loss": 1.1423, + "step": 8232 + }, + { + "epoch": 0.25, + "learning_rate": 4.402246031081655e-06, + "loss": 1.0959, + "step": 8233 + }, + { + "epoch": 0.25, + "learning_rate": 4.402087749376151e-06, + "loss": 1.1115, + "step": 8234 + }, + { + "epoch": 0.25, + "learning_rate": 4.4019294495636874e-06, + "loss": 1.0684, + "step": 8235 + }, + { + "epoch": 0.25, + "learning_rate": 4.401771131645773e-06, + "loss": 1.1495, + "step": 8236 + }, + { + "epoch": 0.25, + "learning_rate": 4.401612795623912e-06, + "loss": 1.2072, + "step": 8237 + }, + { + "epoch": 0.25, + "learning_rate": 4.401454441499614e-06, + "loss": 1.2517, + "step": 8238 + }, + { + "epoch": 0.25, + "learning_rate": 4.401296069274384e-06, + "loss": 1.1802, + "step": 8239 + }, + { + "epoch": 0.25, + "learning_rate": 4.401137678949733e-06, + "loss": 1.1091, + "step": 8240 + }, + { + "epoch": 0.25, + "learning_rate": 4.400979270527166e-06, + "loss": 1.076, + "step": 8241 + }, + { + "epoch": 0.25, + "learning_rate": 4.400820844008192e-06, + "loss": 1.1211, + "step": 8242 + }, + { + "epoch": 0.25, + "learning_rate": 4.400662399394319e-06, + "loss": 1.1066, + "step": 8243 + }, + { + "epoch": 0.25, + "learning_rate": 4.400503936687055e-06, + "loss": 1.1049, + "step": 8244 + }, + { + "epoch": 0.25, + "learning_rate": 4.400345455887909e-06, + "loss": 1.0903, + "step": 8245 + }, + { + "epoch": 0.25, + "learning_rate": 4.4001869569983905e-06, + "loss": 1.1213, + "step": 8246 + }, + { + "epoch": 0.25, + "learning_rate": 4.400028440020006e-06, + "loss": 1.2258, + "step": 8247 + }, + { + "epoch": 0.25, + "learning_rate": 4.399869904954266e-06, + "loss": 1.1556, + "step": 8248 + }, + { + "epoch": 0.25, + "learning_rate": 4.39971135180268e-06, + "loss": 1.1173, + "step": 8249 + }, + { + "epoch": 0.25, + "learning_rate": 4.399552780566757e-06, + "loss": 1.1046, + "step": 8250 + }, + { + "epoch": 0.25, + "learning_rate": 4.399394191248006e-06, + "loss": 1.1777, + "step": 8251 + }, + { + "epoch": 0.25, + "learning_rate": 4.399235583847937e-06, + "loss": 1.1523, + "step": 8252 + }, + { + "epoch": 0.25, + "learning_rate": 4.39907695836806e-06, + "loss": 1.0712, + "step": 8253 + }, + { + "epoch": 0.25, + "learning_rate": 4.398918314809885e-06, + "loss": 1.176, + "step": 8254 + }, + { + "epoch": 0.25, + "learning_rate": 4.398759653174922e-06, + "loss": 1.2841, + "step": 8255 + }, + { + "epoch": 0.25, + "learning_rate": 4.398600973464682e-06, + "loss": 1.2221, + "step": 8256 + }, + { + "epoch": 0.25, + "learning_rate": 4.398442275680675e-06, + "loss": 1.1462, + "step": 8257 + }, + { + "epoch": 0.25, + "learning_rate": 4.398283559824412e-06, + "loss": 1.1848, + "step": 8258 + }, + { + "epoch": 0.25, + "learning_rate": 4.3981248258974035e-06, + "loss": 1.1458, + "step": 8259 + }, + { + "epoch": 0.25, + "learning_rate": 4.397966073901161e-06, + "loss": 1.1316, + "step": 8260 + }, + { + "epoch": 0.25, + "learning_rate": 4.397807303837195e-06, + "loss": 1.2596, + "step": 8261 + }, + { + "epoch": 0.25, + "learning_rate": 4.397648515707018e-06, + "loss": 1.2756, + "step": 8262 + }, + { + "epoch": 0.25, + "learning_rate": 4.397489709512141e-06, + "loss": 1.1971, + "step": 8263 + }, + { + "epoch": 0.25, + "learning_rate": 4.397330885254076e-06, + "loss": 1.1833, + "step": 8264 + }, + { + "epoch": 0.25, + "learning_rate": 4.397172042934335e-06, + "loss": 1.1823, + "step": 8265 + }, + { + "epoch": 0.25, + "learning_rate": 4.397013182554429e-06, + "loss": 0.9354, + "step": 8266 + }, + { + "epoch": 0.25, + "learning_rate": 4.396854304115872e-06, + "loss": 1.1107, + "step": 8267 + }, + { + "epoch": 0.25, + "learning_rate": 4.396695407620175e-06, + "loss": 1.0929, + "step": 8268 + }, + { + "epoch": 0.25, + "learning_rate": 4.396536493068851e-06, + "loss": 1.1894, + "step": 8269 + }, + { + "epoch": 0.25, + "learning_rate": 4.396377560463414e-06, + "loss": 1.1398, + "step": 8270 + }, + { + "epoch": 0.25, + "learning_rate": 4.3962186098053754e-06, + "loss": 1.181, + "step": 8271 + }, + { + "epoch": 0.25, + "learning_rate": 4.396059641096249e-06, + "loss": 1.1603, + "step": 8272 + }, + { + "epoch": 0.25, + "learning_rate": 4.3959006543375475e-06, + "loss": 1.2336, + "step": 8273 + }, + { + "epoch": 0.25, + "learning_rate": 4.3957416495307855e-06, + "loss": 1.1469, + "step": 8274 + }, + { + "epoch": 0.25, + "learning_rate": 4.395582626677476e-06, + "loss": 1.1716, + "step": 8275 + }, + { + "epoch": 0.25, + "learning_rate": 4.395423585779132e-06, + "loss": 1.1467, + "step": 8276 + }, + { + "epoch": 0.25, + "learning_rate": 4.395264526837269e-06, + "loss": 1.2175, + "step": 8277 + }, + { + "epoch": 0.25, + "learning_rate": 4.3951054498534e-06, + "loss": 1.0297, + "step": 8278 + }, + { + "epoch": 0.25, + "learning_rate": 4.3949463548290406e-06, + "loss": 1.0987, + "step": 8279 + }, + { + "epoch": 0.25, + "learning_rate": 4.394787241765705e-06, + "loss": 1.2748, + "step": 8280 + }, + { + "epoch": 0.25, + "learning_rate": 4.3946281106649055e-06, + "loss": 1.2102, + "step": 8281 + }, + { + "epoch": 0.25, + "learning_rate": 4.39446896152816e-06, + "loss": 1.1979, + "step": 8282 + }, + { + "epoch": 0.25, + "learning_rate": 4.394309794356982e-06, + "loss": 1.2145, + "step": 8283 + }, + { + "epoch": 0.25, + "learning_rate": 4.394150609152887e-06, + "loss": 1.0607, + "step": 8284 + }, + { + "epoch": 0.25, + "learning_rate": 4.3939914059173916e-06, + "loss": 1.1996, + "step": 8285 + }, + { + "epoch": 0.25, + "learning_rate": 4.39383218465201e-06, + "loss": 1.1971, + "step": 8286 + }, + { + "epoch": 0.25, + "learning_rate": 4.393672945358257e-06, + "loss": 1.0679, + "step": 8287 + }, + { + "epoch": 0.25, + "learning_rate": 4.393513688037651e-06, + "loss": 1.0744, + "step": 8288 + }, + { + "epoch": 0.25, + "learning_rate": 4.393354412691705e-06, + "loss": 1.0529, + "step": 8289 + }, + { + "epoch": 0.25, + "learning_rate": 4.393195119321937e-06, + "loss": 1.0687, + "step": 8290 + }, + { + "epoch": 0.25, + "learning_rate": 4.393035807929864e-06, + "loss": 1.1592, + "step": 8291 + }, + { + "epoch": 0.25, + "learning_rate": 4.392876478517002e-06, + "loss": 1.236, + "step": 8292 + }, + { + "epoch": 0.25, + "learning_rate": 4.3927171310848675e-06, + "loss": 1.1788, + "step": 8293 + }, + { + "epoch": 0.25, + "learning_rate": 4.3925577656349775e-06, + "loss": 1.1663, + "step": 8294 + }, + { + "epoch": 0.25, + "learning_rate": 4.392398382168848e-06, + "loss": 1.0737, + "step": 8295 + }, + { + "epoch": 0.25, + "learning_rate": 4.392238980687999e-06, + "loss": 1.1094, + "step": 8296 + }, + { + "epoch": 0.25, + "learning_rate": 4.392079561193945e-06, + "loss": 1.2108, + "step": 8297 + }, + { + "epoch": 0.25, + "learning_rate": 4.3919201236882055e-06, + "loss": 1.1069, + "step": 8298 + }, + { + "epoch": 0.25, + "learning_rate": 4.391760668172297e-06, + "loss": 1.1036, + "step": 8299 + }, + { + "epoch": 0.25, + "learning_rate": 4.391601194647738e-06, + "loss": 1.0792, + "step": 8300 + }, + { + "epoch": 0.25, + "learning_rate": 4.391441703116047e-06, + "loss": 1.1243, + "step": 8301 + }, + { + "epoch": 0.25, + "learning_rate": 4.391282193578743e-06, + "loss": 1.1033, + "step": 8302 + }, + { + "epoch": 0.25, + "learning_rate": 4.3911226660373415e-06, + "loss": 1.1099, + "step": 8303 + }, + { + "epoch": 0.25, + "learning_rate": 4.390963120493364e-06, + "loss": 1.1313, + "step": 8304 + }, + { + "epoch": 0.25, + "learning_rate": 4.390803556948328e-06, + "loss": 1.1547, + "step": 8305 + }, + { + "epoch": 0.25, + "learning_rate": 4.390643975403753e-06, + "loss": 1.1194, + "step": 8306 + }, + { + "epoch": 0.25, + "learning_rate": 4.390484375861158e-06, + "loss": 1.1954, + "step": 8307 + }, + { + "epoch": 0.25, + "learning_rate": 4.390324758322062e-06, + "loss": 1.1984, + "step": 8308 + }, + { + "epoch": 0.25, + "learning_rate": 4.390165122787985e-06, + "loss": 1.1837, + "step": 8309 + }, + { + "epoch": 0.25, + "learning_rate": 4.390005469260446e-06, + "loss": 1.0678, + "step": 8310 + }, + { + "epoch": 0.25, + "learning_rate": 4.389845797740966e-06, + "loss": 1.2194, + "step": 8311 + }, + { + "epoch": 0.25, + "learning_rate": 4.389686108231063e-06, + "loss": 1.0826, + "step": 8312 + }, + { + "epoch": 0.25, + "learning_rate": 4.389526400732259e-06, + "loss": 1.1927, + "step": 8313 + }, + { + "epoch": 0.25, + "learning_rate": 4.3893666752460734e-06, + "loss": 1.1677, + "step": 8314 + }, + { + "epoch": 0.25, + "learning_rate": 4.389206931774027e-06, + "loss": 1.1147, + "step": 8315 + }, + { + "epoch": 0.25, + "learning_rate": 4.38904717031764e-06, + "loss": 1.118, + "step": 8316 + }, + { + "epoch": 0.25, + "learning_rate": 4.388887390878435e-06, + "loss": 1.0942, + "step": 8317 + }, + { + "epoch": 0.25, + "learning_rate": 4.388727593457932e-06, + "loss": 1.1287, + "step": 8318 + }, + { + "epoch": 0.25, + "learning_rate": 4.388567778057651e-06, + "loss": 1.0519, + "step": 8319 + }, + { + "epoch": 0.25, + "learning_rate": 4.388407944679114e-06, + "loss": 1.1226, + "step": 8320 + }, + { + "epoch": 0.25, + "learning_rate": 4.388248093323843e-06, + "loss": 1.0549, + "step": 8321 + }, + { + "epoch": 0.25, + "learning_rate": 4.38808822399336e-06, + "loss": 1.2006, + "step": 8322 + }, + { + "epoch": 0.25, + "learning_rate": 4.387928336689187e-06, + "loss": 1.2427, + "step": 8323 + }, + { + "epoch": 0.25, + "learning_rate": 4.387768431412844e-06, + "loss": 1.245, + "step": 8324 + }, + { + "epoch": 0.25, + "learning_rate": 4.387608508165856e-06, + "loss": 1.1844, + "step": 8325 + }, + { + "epoch": 0.25, + "learning_rate": 4.387448566949743e-06, + "loss": 1.1163, + "step": 8326 + }, + { + "epoch": 0.25, + "learning_rate": 4.38728860776603e-06, + "loss": 1.0634, + "step": 8327 + }, + { + "epoch": 0.25, + "learning_rate": 4.387128630616237e-06, + "loss": 1.1695, + "step": 8328 + }, + { + "epoch": 0.25, + "learning_rate": 4.386968635501889e-06, + "loss": 0.9815, + "step": 8329 + }, + { + "epoch": 0.25, + "learning_rate": 4.386808622424509e-06, + "loss": 1.1938, + "step": 8330 + }, + { + "epoch": 0.25, + "learning_rate": 4.386648591385618e-06, + "loss": 1.2159, + "step": 8331 + }, + { + "epoch": 0.25, + "learning_rate": 4.386488542386743e-06, + "loss": 1.0863, + "step": 8332 + }, + { + "epoch": 0.25, + "learning_rate": 4.386328475429404e-06, + "loss": 1.1335, + "step": 8333 + }, + { + "epoch": 0.25, + "learning_rate": 4.386168390515128e-06, + "loss": 1.1245, + "step": 8334 + }, + { + "epoch": 0.25, + "learning_rate": 4.386008287645436e-06, + "loss": 1.058, + "step": 8335 + }, + { + "epoch": 0.25, + "learning_rate": 4.385848166821854e-06, + "loss": 1.2276, + "step": 8336 + }, + { + "epoch": 0.25, + "learning_rate": 4.385688028045905e-06, + "loss": 1.1882, + "step": 8337 + }, + { + "epoch": 0.25, + "learning_rate": 4.385527871319115e-06, + "loss": 1.1602, + "step": 8338 + }, + { + "epoch": 0.25, + "learning_rate": 4.385367696643007e-06, + "loss": 1.1572, + "step": 8339 + }, + { + "epoch": 0.25, + "learning_rate": 4.3852075040191074e-06, + "loss": 1.1541, + "step": 8340 + }, + { + "epoch": 0.25, + "learning_rate": 4.38504729344894e-06, + "loss": 1.0852, + "step": 8341 + }, + { + "epoch": 0.25, + "learning_rate": 4.384887064934031e-06, + "loss": 1.1919, + "step": 8342 + }, + { + "epoch": 0.25, + "learning_rate": 4.384726818475904e-06, + "loss": 1.0302, + "step": 8343 + }, + { + "epoch": 0.25, + "learning_rate": 4.3845665540760855e-06, + "loss": 1.2772, + "step": 8344 + }, + { + "epoch": 0.25, + "learning_rate": 4.3844062717361e-06, + "loss": 1.1672, + "step": 8345 + }, + { + "epoch": 0.25, + "learning_rate": 4.384245971457476e-06, + "loss": 1.1431, + "step": 8346 + }, + { + "epoch": 0.25, + "learning_rate": 4.384085653241738e-06, + "loss": 1.0562, + "step": 8347 + }, + { + "epoch": 0.25, + "learning_rate": 4.3839253170904105e-06, + "loss": 1.1362, + "step": 8348 + }, + { + "epoch": 0.25, + "learning_rate": 4.383764963005022e-06, + "loss": 1.1975, + "step": 8349 + }, + { + "epoch": 0.25, + "learning_rate": 4.383604590987098e-06, + "loss": 1.2782, + "step": 8350 + }, + { + "epoch": 0.25, + "learning_rate": 4.3834442010381664e-06, + "loss": 1.1122, + "step": 8351 + }, + { + "epoch": 0.25, + "learning_rate": 4.383283793159753e-06, + "loss": 1.1748, + "step": 8352 + }, + { + "epoch": 0.25, + "learning_rate": 4.383123367353383e-06, + "loss": 1.0625, + "step": 8353 + }, + { + "epoch": 0.25, + "learning_rate": 4.382962923620588e-06, + "loss": 1.223, + "step": 8354 + }, + { + "epoch": 0.25, + "learning_rate": 4.382802461962892e-06, + "loss": 1.2175, + "step": 8355 + }, + { + "epoch": 0.25, + "learning_rate": 4.382641982381823e-06, + "loss": 1.056, + "step": 8356 + }, + { + "epoch": 0.25, + "learning_rate": 4.382481484878909e-06, + "loss": 1.1315, + "step": 8357 + }, + { + "epoch": 0.25, + "learning_rate": 4.382320969455678e-06, + "loss": 1.1564, + "step": 8358 + }, + { + "epoch": 0.25, + "learning_rate": 4.3821604361136585e-06, + "loss": 1.2266, + "step": 8359 + }, + { + "epoch": 0.25, + "learning_rate": 4.381999884854377e-06, + "loss": 1.1231, + "step": 8360 + }, + { + "epoch": 0.25, + "learning_rate": 4.381839315679363e-06, + "loss": 1.1801, + "step": 8361 + }, + { + "epoch": 0.25, + "learning_rate": 4.381678728590146e-06, + "loss": 1.3735, + "step": 8362 + }, + { + "epoch": 0.25, + "learning_rate": 4.381518123588254e-06, + "loss": 1.0889, + "step": 8363 + }, + { + "epoch": 0.25, + "learning_rate": 4.381357500675215e-06, + "loss": 1.1374, + "step": 8364 + }, + { + "epoch": 0.25, + "learning_rate": 4.381196859852558e-06, + "loss": 1.0287, + "step": 8365 + }, + { + "epoch": 0.25, + "learning_rate": 4.381036201121814e-06, + "loss": 1.1891, + "step": 8366 + }, + { + "epoch": 0.25, + "learning_rate": 4.380875524484511e-06, + "loss": 1.193, + "step": 8367 + }, + { + "epoch": 0.25, + "learning_rate": 4.380714829942179e-06, + "loss": 1.116, + "step": 8368 + }, + { + "epoch": 0.25, + "learning_rate": 4.380554117496347e-06, + "loss": 1.1842, + "step": 8369 + }, + { + "epoch": 0.25, + "learning_rate": 4.380393387148546e-06, + "loss": 1.1441, + "step": 8370 + }, + { + "epoch": 0.25, + "learning_rate": 4.380232638900305e-06, + "loss": 1.0868, + "step": 8371 + }, + { + "epoch": 0.25, + "learning_rate": 4.380071872753156e-06, + "loss": 1.184, + "step": 8372 + }, + { + "epoch": 0.25, + "learning_rate": 4.3799110887086275e-06, + "loss": 1.1326, + "step": 8373 + }, + { + "epoch": 0.25, + "learning_rate": 4.379750286768251e-06, + "loss": 1.1014, + "step": 8374 + }, + { + "epoch": 0.25, + "learning_rate": 4.3795894669335574e-06, + "loss": 1.2012, + "step": 8375 + }, + { + "epoch": 0.25, + "learning_rate": 4.379428629206076e-06, + "loss": 1.1921, + "step": 8376 + }, + { + "epoch": 0.25, + "learning_rate": 4.379267773587341e-06, + "loss": 1.1052, + "step": 8377 + }, + { + "epoch": 0.25, + "learning_rate": 4.37910690007888e-06, + "loss": 1.1567, + "step": 8378 + }, + { + "epoch": 0.25, + "learning_rate": 4.378946008682228e-06, + "loss": 1.1076, + "step": 8379 + }, + { + "epoch": 0.25, + "learning_rate": 4.378785099398914e-06, + "loss": 1.1619, + "step": 8380 + }, + { + "epoch": 0.25, + "learning_rate": 4.378624172230471e-06, + "loss": 1.0612, + "step": 8381 + }, + { + "epoch": 0.25, + "learning_rate": 4.37846322717843e-06, + "loss": 1.0595, + "step": 8382 + }, + { + "epoch": 0.25, + "learning_rate": 4.378302264244325e-06, + "loss": 1.1305, + "step": 8383 + }, + { + "epoch": 0.25, + "learning_rate": 4.378141283429687e-06, + "loss": 1.0624, + "step": 8384 + }, + { + "epoch": 0.25, + "learning_rate": 4.377980284736047e-06, + "loss": 1.0109, + "step": 8385 + }, + { + "epoch": 0.25, + "learning_rate": 4.377819268164941e-06, + "loss": 1.2209, + "step": 8386 + }, + { + "epoch": 0.25, + "learning_rate": 4.3776582337178986e-06, + "loss": 1.1983, + "step": 8387 + }, + { + "epoch": 0.25, + "learning_rate": 4.377497181396455e-06, + "loss": 1.2102, + "step": 8388 + }, + { + "epoch": 0.25, + "learning_rate": 4.377336111202142e-06, + "loss": 1.324, + "step": 8389 + }, + { + "epoch": 0.25, + "learning_rate": 4.377175023136493e-06, + "loss": 1.1224, + "step": 8390 + }, + { + "epoch": 0.25, + "learning_rate": 4.377013917201043e-06, + "loss": 1.1688, + "step": 8391 + }, + { + "epoch": 0.25, + "learning_rate": 4.376852793397323e-06, + "loss": 1.2631, + "step": 8392 + }, + { + "epoch": 0.25, + "learning_rate": 4.37669165172687e-06, + "loss": 1.1136, + "step": 8393 + }, + { + "epoch": 0.25, + "learning_rate": 4.376530492191215e-06, + "loss": 1.0816, + "step": 8394 + }, + { + "epoch": 0.25, + "learning_rate": 4.376369314791894e-06, + "loss": 1.2293, + "step": 8395 + }, + { + "epoch": 0.25, + "learning_rate": 4.376208119530441e-06, + "loss": 1.0955, + "step": 8396 + }, + { + "epoch": 0.25, + "learning_rate": 4.37604690640839e-06, + "loss": 1.2368, + "step": 8397 + }, + { + "epoch": 0.25, + "learning_rate": 4.375885675427276e-06, + "loss": 1.1514, + "step": 8398 + }, + { + "epoch": 0.25, + "learning_rate": 4.375724426588634e-06, + "loss": 1.0447, + "step": 8399 + }, + { + "epoch": 0.25, + "learning_rate": 4.375563159893998e-06, + "loss": 1.1806, + "step": 8400 + }, + { + "epoch": 0.25, + "learning_rate": 4.375401875344906e-06, + "loss": 1.0816, + "step": 8401 + }, + { + "epoch": 0.25, + "learning_rate": 4.375240572942889e-06, + "loss": 1.0107, + "step": 8402 + }, + { + "epoch": 0.25, + "learning_rate": 4.375079252689487e-06, + "loss": 1.1613, + "step": 8403 + }, + { + "epoch": 0.25, + "learning_rate": 4.374917914586232e-06, + "loss": 1.2576, + "step": 8404 + }, + { + "epoch": 0.25, + "learning_rate": 4.374756558634662e-06, + "loss": 1.2253, + "step": 8405 + }, + { + "epoch": 0.25, + "learning_rate": 4.374595184836313e-06, + "loss": 1.2324, + "step": 8406 + }, + { + "epoch": 0.25, + "learning_rate": 4.3744337931927196e-06, + "loss": 1.1229, + "step": 8407 + }, + { + "epoch": 0.25, + "learning_rate": 4.37427238370542e-06, + "loss": 1.1209, + "step": 8408 + }, + { + "epoch": 0.25, + "learning_rate": 4.37411095637595e-06, + "loss": 1.0104, + "step": 8409 + }, + { + "epoch": 0.25, + "learning_rate": 4.373949511205846e-06, + "loss": 1.0221, + "step": 8410 + }, + { + "epoch": 0.25, + "learning_rate": 4.373788048196646e-06, + "loss": 1.1542, + "step": 8411 + }, + { + "epoch": 0.25, + "learning_rate": 4.373626567349885e-06, + "loss": 1.1966, + "step": 8412 + }, + { + "epoch": 0.25, + "learning_rate": 4.3734650686671025e-06, + "loss": 1.2164, + "step": 8413 + }, + { + "epoch": 0.25, + "learning_rate": 4.373303552149834e-06, + "loss": 1.1433, + "step": 8414 + }, + { + "epoch": 0.25, + "learning_rate": 4.373142017799618e-06, + "loss": 1.0576, + "step": 8415 + }, + { + "epoch": 0.25, + "learning_rate": 4.372980465617993e-06, + "loss": 1.064, + "step": 8416 + }, + { + "epoch": 0.25, + "learning_rate": 4.3728188956064946e-06, + "loss": 1.1223, + "step": 8417 + }, + { + "epoch": 0.25, + "learning_rate": 4.372657307766664e-06, + "loss": 1.1879, + "step": 8418 + }, + { + "epoch": 0.25, + "learning_rate": 4.372495702100036e-06, + "loss": 1.0358, + "step": 8419 + }, + { + "epoch": 0.25, + "learning_rate": 4.372334078608152e-06, + "loss": 1.0302, + "step": 8420 + }, + { + "epoch": 0.25, + "learning_rate": 4.372172437292548e-06, + "loss": 1.1104, + "step": 8421 + }, + { + "epoch": 0.25, + "learning_rate": 4.372010778154765e-06, + "loss": 1.0306, + "step": 8422 + }, + { + "epoch": 0.25, + "learning_rate": 4.371849101196342e-06, + "loss": 1.0065, + "step": 8423 + }, + { + "epoch": 0.25, + "learning_rate": 4.371687406418815e-06, + "loss": 1.2729, + "step": 8424 + }, + { + "epoch": 0.25, + "learning_rate": 4.371525693823727e-06, + "loss": 1.1101, + "step": 8425 + }, + { + "epoch": 0.25, + "learning_rate": 4.371363963412615e-06, + "loss": 1.2424, + "step": 8426 + }, + { + "epoch": 0.25, + "learning_rate": 4.37120221518702e-06, + "loss": 1.068, + "step": 8427 + }, + { + "epoch": 0.25, + "learning_rate": 4.37104044914848e-06, + "loss": 0.9944, + "step": 8428 + }, + { + "epoch": 0.25, + "learning_rate": 4.370878665298537e-06, + "loss": 1.111, + "step": 8429 + }, + { + "epoch": 0.25, + "learning_rate": 4.370716863638729e-06, + "loss": 1.0964, + "step": 8430 + }, + { + "epoch": 0.25, + "learning_rate": 4.370555044170598e-06, + "loss": 1.2555, + "step": 8431 + }, + { + "epoch": 0.25, + "learning_rate": 4.370393206895685e-06, + "loss": 1.1248, + "step": 8432 + }, + { + "epoch": 0.25, + "learning_rate": 4.370231351815528e-06, + "loss": 1.1984, + "step": 8433 + }, + { + "epoch": 0.25, + "learning_rate": 4.37006947893167e-06, + "loss": 1.157, + "step": 8434 + }, + { + "epoch": 0.25, + "learning_rate": 4.36990758824565e-06, + "loss": 1.1218, + "step": 8435 + }, + { + "epoch": 0.25, + "learning_rate": 4.369745679759012e-06, + "loss": 1.1957, + "step": 8436 + }, + { + "epoch": 0.25, + "learning_rate": 4.369583753473295e-06, + "loss": 1.0629, + "step": 8437 + }, + { + "epoch": 0.25, + "learning_rate": 4.369421809390041e-06, + "loss": 1.0469, + "step": 8438 + }, + { + "epoch": 0.25, + "learning_rate": 4.369259847510792e-06, + "loss": 1.1277, + "step": 8439 + }, + { + "epoch": 0.25, + "learning_rate": 4.369097867837089e-06, + "loss": 1.2682, + "step": 8440 + }, + { + "epoch": 0.25, + "learning_rate": 4.368935870370474e-06, + "loss": 1.1379, + "step": 8441 + }, + { + "epoch": 0.25, + "learning_rate": 4.368773855112491e-06, + "loss": 1.1389, + "step": 8442 + }, + { + "epoch": 0.25, + "learning_rate": 4.368611822064681e-06, + "loss": 1.1215, + "step": 8443 + }, + { + "epoch": 0.25, + "learning_rate": 4.368449771228586e-06, + "loss": 1.0118, + "step": 8444 + }, + { + "epoch": 0.25, + "learning_rate": 4.368287702605748e-06, + "loss": 1.0916, + "step": 8445 + }, + { + "epoch": 0.25, + "learning_rate": 4.368125616197711e-06, + "loss": 1.1186, + "step": 8446 + }, + { + "epoch": 0.25, + "learning_rate": 4.367963512006019e-06, + "loss": 1.0862, + "step": 8447 + }, + { + "epoch": 0.25, + "learning_rate": 4.367801390032214e-06, + "loss": 1.196, + "step": 8448 + }, + { + "epoch": 0.25, + "learning_rate": 4.367639250277839e-06, + "loss": 1.0728, + "step": 8449 + }, + { + "epoch": 0.25, + "learning_rate": 4.367477092744437e-06, + "loss": 1.134, + "step": 8450 + }, + { + "epoch": 0.25, + "learning_rate": 4.367314917433553e-06, + "loss": 1.2246, + "step": 8451 + }, + { + "epoch": 0.25, + "learning_rate": 4.367152724346731e-06, + "loss": 1.1265, + "step": 8452 + }, + { + "epoch": 0.25, + "learning_rate": 4.366990513485514e-06, + "loss": 1.087, + "step": 8453 + }, + { + "epoch": 0.25, + "learning_rate": 4.366828284851446e-06, + "loss": 1.0467, + "step": 8454 + }, + { + "epoch": 0.25, + "learning_rate": 4.366666038446072e-06, + "loss": 1.1937, + "step": 8455 + }, + { + "epoch": 0.25, + "learning_rate": 4.366503774270936e-06, + "loss": 1.1879, + "step": 8456 + }, + { + "epoch": 0.25, + "learning_rate": 4.366341492327583e-06, + "loss": 1.1787, + "step": 8457 + }, + { + "epoch": 0.25, + "learning_rate": 4.366179192617559e-06, + "loss": 1.0673, + "step": 8458 + }, + { + "epoch": 0.25, + "learning_rate": 4.366016875142407e-06, + "loss": 1.0529, + "step": 8459 + }, + { + "epoch": 0.25, + "learning_rate": 4.3658545399036736e-06, + "loss": 1.1212, + "step": 8460 + }, + { + "epoch": 0.25, + "learning_rate": 4.365692186902903e-06, + "loss": 1.1178, + "step": 8461 + }, + { + "epoch": 0.25, + "learning_rate": 4.365529816141641e-06, + "loss": 1.2444, + "step": 8462 + }, + { + "epoch": 0.25, + "learning_rate": 4.3653674276214345e-06, + "loss": 1.1427, + "step": 8463 + }, + { + "epoch": 0.25, + "learning_rate": 4.365205021343828e-06, + "loss": 1.123, + "step": 8464 + }, + { + "epoch": 0.26, + "learning_rate": 4.365042597310369e-06, + "loss": 1.0818, + "step": 8465 + }, + { + "epoch": 0.26, + "learning_rate": 4.364880155522602e-06, + "loss": 1.1734, + "step": 8466 + }, + { + "epoch": 0.26, + "learning_rate": 4.364717695982074e-06, + "loss": 1.0246, + "step": 8467 + }, + { + "epoch": 0.26, + "learning_rate": 4.3645552186903315e-06, + "loss": 1.2101, + "step": 8468 + }, + { + "epoch": 0.26, + "learning_rate": 4.3643927236489205e-06, + "loss": 1.1708, + "step": 8469 + }, + { + "epoch": 0.26, + "learning_rate": 4.36423021085939e-06, + "loss": 1.1611, + "step": 8470 + }, + { + "epoch": 0.26, + "learning_rate": 4.364067680323285e-06, + "loss": 1.0931, + "step": 8471 + }, + { + "epoch": 0.26, + "learning_rate": 4.3639051320421545e-06, + "loss": 1.0276, + "step": 8472 + }, + { + "epoch": 0.26, + "learning_rate": 4.363742566017544e-06, + "loss": 1.1018, + "step": 8473 + }, + { + "epoch": 0.26, + "learning_rate": 4.363579982251002e-06, + "loss": 1.1649, + "step": 8474 + }, + { + "epoch": 0.26, + "learning_rate": 4.3634173807440765e-06, + "loss": 1.2365, + "step": 8475 + }, + { + "epoch": 0.26, + "learning_rate": 4.363254761498314e-06, + "loss": 1.169, + "step": 8476 + }, + { + "epoch": 0.26, + "learning_rate": 4.363092124515263e-06, + "loss": 1.084, + "step": 8477 + }, + { + "epoch": 0.26, + "learning_rate": 4.362929469796474e-06, + "loss": 0.9954, + "step": 8478 + }, + { + "epoch": 0.26, + "learning_rate": 4.362766797343494e-06, + "loss": 1.173, + "step": 8479 + }, + { + "epoch": 0.26, + "learning_rate": 4.362604107157869e-06, + "loss": 1.2011, + "step": 8480 + }, + { + "epoch": 0.26, + "learning_rate": 4.362441399241152e-06, + "loss": 1.1934, + "step": 8481 + }, + { + "epoch": 0.26, + "learning_rate": 4.362278673594889e-06, + "loss": 1.2234, + "step": 8482 + }, + { + "epoch": 0.26, + "learning_rate": 4.36211593022063e-06, + "loss": 0.9951, + "step": 8483 + }, + { + "epoch": 0.26, + "learning_rate": 4.361953169119924e-06, + "loss": 1.1299, + "step": 8484 + }, + { + "epoch": 0.26, + "learning_rate": 4.361790390294321e-06, + "loss": 1.1658, + "step": 8485 + }, + { + "epoch": 0.26, + "learning_rate": 4.36162759374537e-06, + "loss": 1.3094, + "step": 8486 + }, + { + "epoch": 0.26, + "learning_rate": 4.36146477947462e-06, + "loss": 1.2307, + "step": 8487 + }, + { + "epoch": 0.26, + "learning_rate": 4.361301947483623e-06, + "loss": 1.0757, + "step": 8488 + }, + { + "epoch": 0.26, + "learning_rate": 4.3611390977739275e-06, + "loss": 1.2039, + "step": 8489 + }, + { + "epoch": 0.26, + "learning_rate": 4.360976230347085e-06, + "loss": 1.0854, + "step": 8490 + }, + { + "epoch": 0.26, + "learning_rate": 4.3608133452046434e-06, + "loss": 1.1748, + "step": 8491 + }, + { + "epoch": 0.26, + "learning_rate": 4.360650442348156e-06, + "loss": 1.2341, + "step": 8492 + }, + { + "epoch": 0.26, + "learning_rate": 4.360487521779173e-06, + "loss": 1.0883, + "step": 8493 + }, + { + "epoch": 0.26, + "learning_rate": 4.360324583499243e-06, + "loss": 1.0439, + "step": 8494 + }, + { + "epoch": 0.26, + "learning_rate": 4.360161627509921e-06, + "loss": 1.0557, + "step": 8495 + }, + { + "epoch": 0.26, + "learning_rate": 4.359998653812755e-06, + "loss": 1.0796, + "step": 8496 + }, + { + "epoch": 0.26, + "learning_rate": 4.3598356624092975e-06, + "loss": 1.1603, + "step": 8497 + }, + { + "epoch": 0.26, + "learning_rate": 4.3596726533011005e-06, + "loss": 1.2026, + "step": 8498 + }, + { + "epoch": 0.26, + "learning_rate": 4.359509626489716e-06, + "loss": 1.1816, + "step": 8499 + }, + { + "epoch": 0.26, + "learning_rate": 4.3593465819766944e-06, + "loss": 1.1661, + "step": 8500 + }, + { + "epoch": 0.26, + "learning_rate": 4.35918351976359e-06, + "loss": 1.0668, + "step": 8501 + }, + { + "epoch": 0.26, + "learning_rate": 4.359020439851953e-06, + "loss": 1.1362, + "step": 8502 + }, + { + "epoch": 0.26, + "learning_rate": 4.358857342243337e-06, + "loss": 1.0624, + "step": 8503 + }, + { + "epoch": 0.26, + "learning_rate": 4.3586942269392955e-06, + "loss": 1.1605, + "step": 8504 + }, + { + "epoch": 0.26, + "learning_rate": 4.358531093941378e-06, + "loss": 1.2486, + "step": 8505 + }, + { + "epoch": 0.26, + "learning_rate": 4.358367943251141e-06, + "loss": 1.1594, + "step": 8506 + }, + { + "epoch": 0.26, + "learning_rate": 4.358204774870136e-06, + "loss": 1.1587, + "step": 8507 + }, + { + "epoch": 0.26, + "learning_rate": 4.358041588799916e-06, + "loss": 1.1262, + "step": 8508 + }, + { + "epoch": 0.26, + "learning_rate": 4.357878385042036e-06, + "loss": 1.1638, + "step": 8509 + }, + { + "epoch": 0.26, + "learning_rate": 4.3577151635980475e-06, + "loss": 1.1164, + "step": 8510 + }, + { + "epoch": 0.26, + "learning_rate": 4.357551924469505e-06, + "loss": 1.0367, + "step": 8511 + }, + { + "epoch": 0.26, + "learning_rate": 4.357388667657964e-06, + "loss": 1.2826, + "step": 8512 + }, + { + "epoch": 0.26, + "learning_rate": 4.357225393164977e-06, + "loss": 1.101, + "step": 8513 + }, + { + "epoch": 0.26, + "learning_rate": 4.357062100992099e-06, + "loss": 1.1979, + "step": 8514 + }, + { + "epoch": 0.26, + "learning_rate": 4.356898791140884e-06, + "loss": 1.1063, + "step": 8515 + }, + { + "epoch": 0.26, + "learning_rate": 4.3567354636128865e-06, + "loss": 1.1498, + "step": 8516 + }, + { + "epoch": 0.26, + "learning_rate": 4.356572118409661e-06, + "loss": 1.209, + "step": 8517 + }, + { + "epoch": 0.26, + "learning_rate": 4.356408755532764e-06, + "loss": 1.2142, + "step": 8518 + }, + { + "epoch": 0.26, + "learning_rate": 4.35624537498375e-06, + "loss": 1.0558, + "step": 8519 + }, + { + "epoch": 0.26, + "learning_rate": 4.356081976764174e-06, + "loss": 1.0837, + "step": 8520 + }, + { + "epoch": 0.26, + "learning_rate": 4.355918560875591e-06, + "loss": 1.1962, + "step": 8521 + }, + { + "epoch": 0.26, + "learning_rate": 4.355755127319558e-06, + "loss": 1.2678, + "step": 8522 + }, + { + "epoch": 0.26, + "learning_rate": 4.355591676097628e-06, + "loss": 1.1816, + "step": 8523 + }, + { + "epoch": 0.26, + "learning_rate": 4.35542820721136e-06, + "loss": 1.2585, + "step": 8524 + }, + { + "epoch": 0.26, + "learning_rate": 4.35526472066231e-06, + "loss": 1.2616, + "step": 8525 + }, + { + "epoch": 0.26, + "learning_rate": 4.355101216452032e-06, + "loss": 1.0997, + "step": 8526 + }, + { + "epoch": 0.26, + "learning_rate": 4.3549376945820854e-06, + "loss": 1.1052, + "step": 8527 + }, + { + "epoch": 0.26, + "learning_rate": 4.354774155054024e-06, + "loss": 1.1348, + "step": 8528 + }, + { + "epoch": 0.26, + "learning_rate": 4.3546105978694065e-06, + "loss": 1.1252, + "step": 8529 + }, + { + "epoch": 0.26, + "learning_rate": 4.354447023029789e-06, + "loss": 1.1876, + "step": 8530 + }, + { + "epoch": 0.26, + "learning_rate": 4.3542834305367286e-06, + "loss": 1.201, + "step": 8531 + }, + { + "epoch": 0.26, + "learning_rate": 4.354119820391785e-06, + "loss": 1.1351, + "step": 8532 + }, + { + "epoch": 0.26, + "learning_rate": 4.353956192596512e-06, + "loss": 1.0948, + "step": 8533 + }, + { + "epoch": 0.26, + "learning_rate": 4.353792547152469e-06, + "loss": 1.0851, + "step": 8534 + }, + { + "epoch": 0.26, + "learning_rate": 4.353628884061214e-06, + "loss": 1.2224, + "step": 8535 + }, + { + "epoch": 0.26, + "learning_rate": 4.353465203324304e-06, + "loss": 1.0375, + "step": 8536 + }, + { + "epoch": 0.26, + "learning_rate": 4.353301504943299e-06, + "loss": 1.0744, + "step": 8537 + }, + { + "epoch": 0.26, + "learning_rate": 4.353137788919756e-06, + "loss": 1.118, + "step": 8538 + }, + { + "epoch": 0.26, + "learning_rate": 4.352974055255233e-06, + "loss": 1.1786, + "step": 8539 + }, + { + "epoch": 0.26, + "learning_rate": 4.352810303951291e-06, + "loss": 1.2108, + "step": 8540 + }, + { + "epoch": 0.26, + "learning_rate": 4.3526465350094855e-06, + "loss": 1.0214, + "step": 8541 + }, + { + "epoch": 0.26, + "learning_rate": 4.352482748431378e-06, + "loss": 1.1922, + "step": 8542 + }, + { + "epoch": 0.26, + "learning_rate": 4.352318944218527e-06, + "loss": 1.2457, + "step": 8543 + }, + { + "epoch": 0.26, + "learning_rate": 4.352155122372492e-06, + "loss": 1.1888, + "step": 8544 + }, + { + "epoch": 0.26, + "learning_rate": 4.351991282894832e-06, + "loss": 1.1977, + "step": 8545 + }, + { + "epoch": 0.26, + "learning_rate": 4.3518274257871065e-06, + "loss": 1.1412, + "step": 8546 + }, + { + "epoch": 0.26, + "learning_rate": 4.351663551050877e-06, + "loss": 1.159, + "step": 8547 + }, + { + "epoch": 0.26, + "learning_rate": 4.351499658687701e-06, + "loss": 1.1115, + "step": 8548 + }, + { + "epoch": 0.26, + "learning_rate": 4.35133574869914e-06, + "loss": 1.1757, + "step": 8549 + }, + { + "epoch": 0.26, + "learning_rate": 4.351171821086755e-06, + "loss": 1.1909, + "step": 8550 + }, + { + "epoch": 0.26, + "learning_rate": 4.351007875852106e-06, + "loss": 1.1001, + "step": 8551 + }, + { + "epoch": 0.26, + "learning_rate": 4.350843912996753e-06, + "loss": 1.1065, + "step": 8552 + }, + { + "epoch": 0.26, + "learning_rate": 4.350679932522257e-06, + "loss": 1.0572, + "step": 8553 + }, + { + "epoch": 0.26, + "learning_rate": 4.35051593443018e-06, + "loss": 1.1382, + "step": 8554 + }, + { + "epoch": 0.26, + "learning_rate": 4.350351918722082e-06, + "loss": 1.2202, + "step": 8555 + }, + { + "epoch": 0.26, + "learning_rate": 4.3501878853995246e-06, + "loss": 0.8915, + "step": 8556 + }, + { + "epoch": 0.26, + "learning_rate": 4.350023834464071e-06, + "loss": 1.094, + "step": 8557 + }, + { + "epoch": 0.26, + "learning_rate": 4.34985976591728e-06, + "loss": 1.0967, + "step": 8558 + }, + { + "epoch": 0.26, + "learning_rate": 4.349695679760716e-06, + "loss": 1.0784, + "step": 8559 + }, + { + "epoch": 0.26, + "learning_rate": 4.34953157599594e-06, + "loss": 1.1101, + "step": 8560 + }, + { + "epoch": 0.26, + "learning_rate": 4.349367454624513e-06, + "loss": 1.1342, + "step": 8561 + }, + { + "epoch": 0.26, + "learning_rate": 4.349203315648e-06, + "loss": 1.1888, + "step": 8562 + }, + { + "epoch": 0.26, + "learning_rate": 4.349039159067961e-06, + "loss": 1.2009, + "step": 8563 + }, + { + "epoch": 0.26, + "learning_rate": 4.34887498488596e-06, + "loss": 1.03, + "step": 8564 + }, + { + "epoch": 0.26, + "learning_rate": 4.34871079310356e-06, + "loss": 1.1241, + "step": 8565 + }, + { + "epoch": 0.26, + "learning_rate": 4.3485465837223235e-06, + "loss": 1.2004, + "step": 8566 + }, + { + "epoch": 0.26, + "learning_rate": 4.348382356743813e-06, + "loss": 1.1026, + "step": 8567 + }, + { + "epoch": 0.26, + "learning_rate": 4.3482181121695936e-06, + "loss": 1.1145, + "step": 8568 + }, + { + "epoch": 0.26, + "learning_rate": 4.348053850001228e-06, + "loss": 1.1708, + "step": 8569 + }, + { + "epoch": 0.26, + "learning_rate": 4.347889570240279e-06, + "loss": 1.157, + "step": 8570 + }, + { + "epoch": 0.26, + "learning_rate": 4.3477252728883115e-06, + "loss": 1.162, + "step": 8571 + }, + { + "epoch": 0.26, + "learning_rate": 4.34756095794689e-06, + "loss": 1.0731, + "step": 8572 + }, + { + "epoch": 0.26, + "learning_rate": 4.347396625417577e-06, + "loss": 1.1414, + "step": 8573 + }, + { + "epoch": 0.26, + "learning_rate": 4.347232275301938e-06, + "loss": 1.1259, + "step": 8574 + }, + { + "epoch": 0.26, + "learning_rate": 4.347067907601539e-06, + "loss": 1.1721, + "step": 8575 + }, + { + "epoch": 0.26, + "learning_rate": 4.346903522317941e-06, + "loss": 1.2223, + "step": 8576 + }, + { + "epoch": 0.26, + "learning_rate": 4.346739119452712e-06, + "loss": 1.1547, + "step": 8577 + }, + { + "epoch": 0.26, + "learning_rate": 4.346574699007416e-06, + "loss": 1.0729, + "step": 8578 + }, + { + "epoch": 0.26, + "learning_rate": 4.346410260983618e-06, + "loss": 1.1476, + "step": 8579 + }, + { + "epoch": 0.26, + "learning_rate": 4.3462458053828835e-06, + "loss": 1.202, + "step": 8580 + }, + { + "epoch": 0.26, + "learning_rate": 4.346081332206778e-06, + "loss": 1.1189, + "step": 8581 + }, + { + "epoch": 0.26, + "learning_rate": 4.345916841456867e-06, + "loss": 1.1805, + "step": 8582 + }, + { + "epoch": 0.26, + "learning_rate": 4.345752333134718e-06, + "loss": 1.1215, + "step": 8583 + }, + { + "epoch": 0.26, + "learning_rate": 4.345587807241895e-06, + "loss": 1.0649, + "step": 8584 + }, + { + "epoch": 0.26, + "learning_rate": 4.345423263779964e-06, + "loss": 1.1458, + "step": 8585 + }, + { + "epoch": 0.26, + "learning_rate": 4.345258702750493e-06, + "loss": 1.1295, + "step": 8586 + }, + { + "epoch": 0.26, + "learning_rate": 4.345094124155049e-06, + "loss": 1.1151, + "step": 8587 + }, + { + "epoch": 0.26, + "learning_rate": 4.3449295279951965e-06, + "loss": 1.2026, + "step": 8588 + }, + { + "epoch": 0.26, + "learning_rate": 4.344764914272503e-06, + "loss": 1.2, + "step": 8589 + }, + { + "epoch": 0.26, + "learning_rate": 4.344600282988537e-06, + "loss": 1.1615, + "step": 8590 + }, + { + "epoch": 0.26, + "learning_rate": 4.344435634144864e-06, + "loss": 1.0801, + "step": 8591 + }, + { + "epoch": 0.26, + "learning_rate": 4.344270967743052e-06, + "loss": 1.2502, + "step": 8592 + }, + { + "epoch": 0.26, + "learning_rate": 4.344106283784669e-06, + "loss": 1.1459, + "step": 8593 + }, + { + "epoch": 0.26, + "learning_rate": 4.343941582271283e-06, + "loss": 1.2017, + "step": 8594 + }, + { + "epoch": 0.26, + "learning_rate": 4.3437768632044605e-06, + "loss": 1.1784, + "step": 8595 + }, + { + "epoch": 0.26, + "learning_rate": 4.34361212658577e-06, + "loss": 1.1374, + "step": 8596 + }, + { + "epoch": 0.26, + "learning_rate": 4.34344737241678e-06, + "loss": 1.0885, + "step": 8597 + }, + { + "epoch": 0.26, + "learning_rate": 4.343282600699059e-06, + "loss": 1.1718, + "step": 8598 + }, + { + "epoch": 0.26, + "learning_rate": 4.343117811434176e-06, + "loss": 1.1594, + "step": 8599 + }, + { + "epoch": 0.26, + "learning_rate": 4.342953004623698e-06, + "loss": 1.3053, + "step": 8600 + }, + { + "epoch": 0.26, + "learning_rate": 4.342788180269196e-06, + "loss": 1.1888, + "step": 8601 + }, + { + "epoch": 0.26, + "learning_rate": 4.342623338372237e-06, + "loss": 1.1623, + "step": 8602 + }, + { + "epoch": 0.26, + "learning_rate": 4.342458478934392e-06, + "loss": 1.149, + "step": 8603 + }, + { + "epoch": 0.26, + "learning_rate": 4.342293601957229e-06, + "loss": 1.1031, + "step": 8604 + }, + { + "epoch": 0.26, + "learning_rate": 4.342128707442319e-06, + "loss": 1.157, + "step": 8605 + }, + { + "epoch": 0.26, + "learning_rate": 4.341963795391231e-06, + "loss": 1.1432, + "step": 8606 + }, + { + "epoch": 0.26, + "learning_rate": 4.341798865805534e-06, + "loss": 1.1542, + "step": 8607 + }, + { + "epoch": 0.26, + "learning_rate": 4.341633918686799e-06, + "loss": 1.1193, + "step": 8608 + }, + { + "epoch": 0.26, + "learning_rate": 4.341468954036597e-06, + "loss": 1.0295, + "step": 8609 + }, + { + "epoch": 0.26, + "learning_rate": 4.341303971856496e-06, + "loss": 1.1329, + "step": 8610 + }, + { + "epoch": 0.26, + "learning_rate": 4.341138972148069e-06, + "loss": 1.267, + "step": 8611 + }, + { + "epoch": 0.26, + "learning_rate": 4.3409739549128845e-06, + "loss": 1.1143, + "step": 8612 + }, + { + "epoch": 0.26, + "learning_rate": 4.340808920152516e-06, + "loss": 1.2426, + "step": 8613 + }, + { + "epoch": 0.26, + "learning_rate": 4.340643867868533e-06, + "loss": 1.1676, + "step": 8614 + }, + { + "epoch": 0.26, + "learning_rate": 4.3404787980625065e-06, + "loss": 1.2199, + "step": 8615 + }, + { + "epoch": 0.26, + "learning_rate": 4.340313710736009e-06, + "loss": 1.1652, + "step": 8616 + }, + { + "epoch": 0.26, + "learning_rate": 4.34014860589061e-06, + "loss": 1.2489, + "step": 8617 + }, + { + "epoch": 0.26, + "learning_rate": 4.339983483527883e-06, + "loss": 1.2445, + "step": 8618 + }, + { + "epoch": 0.26, + "learning_rate": 4.339818343649399e-06, + "loss": 1.1758, + "step": 8619 + }, + { + "epoch": 0.26, + "learning_rate": 4.339653186256731e-06, + "loss": 1.1249, + "step": 8620 + }, + { + "epoch": 0.26, + "learning_rate": 4.3394880113514504e-06, + "loss": 1.1168, + "step": 8621 + }, + { + "epoch": 0.26, + "learning_rate": 4.33932281893513e-06, + "loss": 1.0086, + "step": 8622 + }, + { + "epoch": 0.26, + "learning_rate": 4.3391576090093425e-06, + "loss": 1.103, + "step": 8623 + }, + { + "epoch": 0.26, + "learning_rate": 4.33899238157566e-06, + "loss": 1.061, + "step": 8624 + }, + { + "epoch": 0.26, + "learning_rate": 4.338827136635656e-06, + "loss": 1.2271, + "step": 8625 + }, + { + "epoch": 0.26, + "learning_rate": 4.3386618741909035e-06, + "loss": 1.1028, + "step": 8626 + }, + { + "epoch": 0.26, + "learning_rate": 4.338496594242975e-06, + "loss": 1.0814, + "step": 8627 + }, + { + "epoch": 0.26, + "learning_rate": 4.338331296793444e-06, + "loss": 1.051, + "step": 8628 + }, + { + "epoch": 0.26, + "learning_rate": 4.338165981843885e-06, + "loss": 1.1196, + "step": 8629 + }, + { + "epoch": 0.26, + "learning_rate": 4.338000649395871e-06, + "loss": 1.1034, + "step": 8630 + }, + { + "epoch": 0.26, + "learning_rate": 4.337835299450976e-06, + "loss": 1.0552, + "step": 8631 + }, + { + "epoch": 0.26, + "learning_rate": 4.337669932010774e-06, + "loss": 1.0574, + "step": 8632 + }, + { + "epoch": 0.26, + "learning_rate": 4.3375045470768395e-06, + "loss": 1.1597, + "step": 8633 + }, + { + "epoch": 0.26, + "learning_rate": 4.337339144650746e-06, + "loss": 1.0275, + "step": 8634 + }, + { + "epoch": 0.26, + "learning_rate": 4.33717372473407e-06, + "loss": 1.2061, + "step": 8635 + }, + { + "epoch": 0.26, + "learning_rate": 4.337008287328384e-06, + "loss": 1.2113, + "step": 8636 + }, + { + "epoch": 0.26, + "learning_rate": 4.336842832435264e-06, + "loss": 1.3286, + "step": 8637 + }, + { + "epoch": 0.26, + "learning_rate": 4.336677360056285e-06, + "loss": 1.0542, + "step": 8638 + }, + { + "epoch": 0.26, + "learning_rate": 4.336511870193023e-06, + "loss": 1.138, + "step": 8639 + }, + { + "epoch": 0.26, + "learning_rate": 4.336346362847051e-06, + "loss": 1.1033, + "step": 8640 + }, + { + "epoch": 0.26, + "learning_rate": 4.336180838019946e-06, + "loss": 1.1791, + "step": 8641 + }, + { + "epoch": 0.26, + "learning_rate": 4.336015295713285e-06, + "loss": 1.0822, + "step": 8642 + }, + { + "epoch": 0.26, + "learning_rate": 4.335849735928643e-06, + "loss": 1.1235, + "step": 8643 + }, + { + "epoch": 0.26, + "learning_rate": 4.3356841586675934e-06, + "loss": 1.1382, + "step": 8644 + }, + { + "epoch": 0.26, + "learning_rate": 4.335518563931717e-06, + "loss": 1.1141, + "step": 8645 + }, + { + "epoch": 0.26, + "learning_rate": 4.335352951722587e-06, + "loss": 1.1614, + "step": 8646 + }, + { + "epoch": 0.26, + "learning_rate": 4.33518732204178e-06, + "loss": 1.054, + "step": 8647 + }, + { + "epoch": 0.26, + "learning_rate": 4.335021674890875e-06, + "loss": 1.096, + "step": 8648 + }, + { + "epoch": 0.26, + "learning_rate": 4.334856010271446e-06, + "loss": 1.1187, + "step": 8649 + }, + { + "epoch": 0.26, + "learning_rate": 4.334690328185073e-06, + "loss": 1.2054, + "step": 8650 + }, + { + "epoch": 0.26, + "learning_rate": 4.3345246286333305e-06, + "loss": 1.1805, + "step": 8651 + }, + { + "epoch": 0.26, + "learning_rate": 4.334358911617797e-06, + "loss": 1.0571, + "step": 8652 + }, + { + "epoch": 0.26, + "learning_rate": 4.334193177140051e-06, + "loss": 1.1279, + "step": 8653 + }, + { + "epoch": 0.26, + "learning_rate": 4.334027425201669e-06, + "loss": 1.1771, + "step": 8654 + }, + { + "epoch": 0.26, + "learning_rate": 4.333861655804229e-06, + "loss": 1.0914, + "step": 8655 + }, + { + "epoch": 0.26, + "learning_rate": 4.33369586894931e-06, + "loss": 1.2642, + "step": 8656 + }, + { + "epoch": 0.26, + "learning_rate": 4.333530064638489e-06, + "loss": 1.2459, + "step": 8657 + }, + { + "epoch": 0.26, + "learning_rate": 4.333364242873344e-06, + "loss": 1.0617, + "step": 8658 + }, + { + "epoch": 0.26, + "learning_rate": 4.333198403655455e-06, + "loss": 1.1063, + "step": 8659 + }, + { + "epoch": 0.26, + "learning_rate": 4.3330325469864e-06, + "loss": 1.0745, + "step": 8660 + }, + { + "epoch": 0.26, + "learning_rate": 4.332866672867759e-06, + "loss": 1.2563, + "step": 8661 + }, + { + "epoch": 0.26, + "learning_rate": 4.3327007813011094e-06, + "loss": 1.0447, + "step": 8662 + }, + { + "epoch": 0.26, + "learning_rate": 4.33253487228803e-06, + "loss": 1.1747, + "step": 8663 + }, + { + "epoch": 0.26, + "learning_rate": 4.332368945830102e-06, + "loss": 1.2081, + "step": 8664 + }, + { + "epoch": 0.26, + "learning_rate": 4.332203001928905e-06, + "loss": 1.0771, + "step": 8665 + }, + { + "epoch": 0.26, + "learning_rate": 4.332037040586016e-06, + "loss": 1.1259, + "step": 8666 + }, + { + "epoch": 0.26, + "learning_rate": 4.331871061803018e-06, + "loss": 1.1165, + "step": 8667 + }, + { + "epoch": 0.26, + "learning_rate": 4.331705065581489e-06, + "loss": 1.0987, + "step": 8668 + }, + { + "epoch": 0.26, + "learning_rate": 4.331539051923011e-06, + "loss": 1.1262, + "step": 8669 + }, + { + "epoch": 0.26, + "learning_rate": 4.331373020829163e-06, + "loss": 1.2201, + "step": 8670 + }, + { + "epoch": 0.26, + "learning_rate": 4.331206972301525e-06, + "loss": 1.065, + "step": 8671 + }, + { + "epoch": 0.26, + "learning_rate": 4.331040906341679e-06, + "loss": 1.0999, + "step": 8672 + }, + { + "epoch": 0.26, + "learning_rate": 4.330874822951206e-06, + "loss": 1.1208, + "step": 8673 + }, + { + "epoch": 0.26, + "learning_rate": 4.330708722131686e-06, + "loss": 1.2562, + "step": 8674 + }, + { + "epoch": 0.26, + "learning_rate": 4.330542603884701e-06, + "loss": 1.1779, + "step": 8675 + }, + { + "epoch": 0.26, + "learning_rate": 4.330376468211832e-06, + "loss": 1.0881, + "step": 8676 + }, + { + "epoch": 0.26, + "learning_rate": 4.33021031511466e-06, + "loss": 1.1997, + "step": 8677 + }, + { + "epoch": 0.26, + "learning_rate": 4.330044144594767e-06, + "loss": 1.1531, + "step": 8678 + }, + { + "epoch": 0.26, + "learning_rate": 4.3298779566537365e-06, + "loss": 1.2212, + "step": 8679 + }, + { + "epoch": 0.26, + "learning_rate": 4.329711751293147e-06, + "loss": 1.198, + "step": 8680 + }, + { + "epoch": 0.26, + "learning_rate": 4.329545528514585e-06, + "loss": 1.1717, + "step": 8681 + }, + { + "epoch": 0.26, + "learning_rate": 4.32937928831963e-06, + "loss": 1.0708, + "step": 8682 + }, + { + "epoch": 0.26, + "learning_rate": 4.329213030709865e-06, + "loss": 1.064, + "step": 8683 + }, + { + "epoch": 0.26, + "learning_rate": 4.329046755686873e-06, + "loss": 1.2774, + "step": 8684 + }, + { + "epoch": 0.26, + "learning_rate": 4.328880463252237e-06, + "loss": 1.0828, + "step": 8685 + }, + { + "epoch": 0.26, + "learning_rate": 4.3287141534075395e-06, + "loss": 1.2117, + "step": 8686 + }, + { + "epoch": 0.26, + "learning_rate": 4.328547826154364e-06, + "loss": 1.1906, + "step": 8687 + }, + { + "epoch": 0.26, + "learning_rate": 4.328381481494294e-06, + "loss": 1.1286, + "step": 8688 + }, + { + "epoch": 0.26, + "learning_rate": 4.328215119428913e-06, + "loss": 1.0529, + "step": 8689 + }, + { + "epoch": 0.26, + "learning_rate": 4.328048739959805e-06, + "loss": 1.2035, + "step": 8690 + }, + { + "epoch": 0.26, + "learning_rate": 4.327882343088553e-06, + "loss": 1.1161, + "step": 8691 + }, + { + "epoch": 0.26, + "learning_rate": 4.32771592881674e-06, + "loss": 1.1575, + "step": 8692 + }, + { + "epoch": 0.26, + "learning_rate": 4.327549497145953e-06, + "loss": 1.0101, + "step": 8693 + }, + { + "epoch": 0.26, + "learning_rate": 4.327383048077776e-06, + "loss": 1.1242, + "step": 8694 + }, + { + "epoch": 0.26, + "learning_rate": 4.32721658161379e-06, + "loss": 1.1573, + "step": 8695 + }, + { + "epoch": 0.26, + "learning_rate": 4.327050097755584e-06, + "loss": 1.174, + "step": 8696 + }, + { + "epoch": 0.26, + "learning_rate": 4.32688359650474e-06, + "loss": 1.048, + "step": 8697 + }, + { + "epoch": 0.26, + "learning_rate": 4.326717077862845e-06, + "loss": 1.1521, + "step": 8698 + }, + { + "epoch": 0.26, + "learning_rate": 4.3265505418314825e-06, + "loss": 1.1105, + "step": 8699 + }, + { + "epoch": 0.26, + "learning_rate": 4.32638398841224e-06, + "loss": 1.1761, + "step": 8700 + }, + { + "epoch": 0.26, + "learning_rate": 4.326217417606699e-06, + "loss": 1.1326, + "step": 8701 + }, + { + "epoch": 0.26, + "learning_rate": 4.326050829416449e-06, + "loss": 1.1396, + "step": 8702 + }, + { + "epoch": 0.26, + "learning_rate": 4.325884223843075e-06, + "loss": 1.2943, + "step": 8703 + }, + { + "epoch": 0.26, + "learning_rate": 4.325717600888163e-06, + "loss": 1.0061, + "step": 8704 + }, + { + "epoch": 0.26, + "learning_rate": 4.325550960553298e-06, + "loss": 1.2117, + "step": 8705 + }, + { + "epoch": 0.26, + "learning_rate": 4.325384302840066e-06, + "loss": 1.134, + "step": 8706 + }, + { + "epoch": 0.26, + "learning_rate": 4.3252176277500555e-06, + "loss": 1.17, + "step": 8707 + }, + { + "epoch": 0.26, + "learning_rate": 4.325050935284853e-06, + "loss": 1.1079, + "step": 8708 + }, + { + "epoch": 0.26, + "learning_rate": 4.324884225446043e-06, + "loss": 1.1299, + "step": 8709 + }, + { + "epoch": 0.26, + "learning_rate": 4.324717498235215e-06, + "loss": 1.2125, + "step": 8710 + }, + { + "epoch": 0.26, + "learning_rate": 4.324550753653956e-06, + "loss": 1.1035, + "step": 8711 + }, + { + "epoch": 0.26, + "learning_rate": 4.324383991703851e-06, + "loss": 1.2387, + "step": 8712 + }, + { + "epoch": 0.26, + "learning_rate": 4.32421721238649e-06, + "loss": 1.1124, + "step": 8713 + }, + { + "epoch": 0.26, + "learning_rate": 4.324050415703459e-06, + "loss": 1.085, + "step": 8714 + }, + { + "epoch": 0.26, + "learning_rate": 4.3238836016563475e-06, + "loss": 1.0493, + "step": 8715 + }, + { + "epoch": 0.26, + "learning_rate": 4.323716770246742e-06, + "loss": 1.1274, + "step": 8716 + }, + { + "epoch": 0.26, + "learning_rate": 4.323549921476231e-06, + "loss": 1.2571, + "step": 8717 + }, + { + "epoch": 0.26, + "learning_rate": 4.323383055346403e-06, + "loss": 1.334, + "step": 8718 + }, + { + "epoch": 0.26, + "learning_rate": 4.323216171858847e-06, + "loss": 1.2231, + "step": 8719 + }, + { + "epoch": 0.26, + "learning_rate": 4.3230492710151505e-06, + "loss": 1.1841, + "step": 8720 + }, + { + "epoch": 0.26, + "learning_rate": 4.322882352816903e-06, + "loss": 1.1344, + "step": 8721 + }, + { + "epoch": 0.26, + "learning_rate": 4.322715417265694e-06, + "loss": 1.0914, + "step": 8722 + }, + { + "epoch": 0.26, + "learning_rate": 4.322548464363112e-06, + "loss": 1.0628, + "step": 8723 + }, + { + "epoch": 0.26, + "learning_rate": 4.3223814941107465e-06, + "loss": 1.2275, + "step": 8724 + }, + { + "epoch": 0.26, + "learning_rate": 4.322214506510186e-06, + "loss": 1.1477, + "step": 8725 + }, + { + "epoch": 0.26, + "learning_rate": 4.322047501563022e-06, + "loss": 1.1383, + "step": 8726 + }, + { + "epoch": 0.26, + "learning_rate": 4.321880479270842e-06, + "loss": 1.1428, + "step": 8727 + }, + { + "epoch": 0.26, + "learning_rate": 4.321713439635239e-06, + "loss": 1.2921, + "step": 8728 + }, + { + "epoch": 0.26, + "learning_rate": 4.321546382657801e-06, + "loss": 1.0824, + "step": 8729 + }, + { + "epoch": 0.26, + "learning_rate": 4.321379308340118e-06, + "loss": 1.2639, + "step": 8730 + }, + { + "epoch": 0.26, + "learning_rate": 4.321212216683781e-06, + "loss": 1.1536, + "step": 8731 + }, + { + "epoch": 0.26, + "learning_rate": 4.321045107690381e-06, + "loss": 1.1459, + "step": 8732 + }, + { + "epoch": 0.26, + "learning_rate": 4.3208779813615095e-06, + "loss": 1.1374, + "step": 8733 + }, + { + "epoch": 0.26, + "learning_rate": 4.320710837698756e-06, + "loss": 1.1863, + "step": 8734 + }, + { + "epoch": 0.26, + "learning_rate": 4.3205436767037124e-06, + "loss": 1.1287, + "step": 8735 + }, + { + "epoch": 0.26, + "learning_rate": 4.320376498377969e-06, + "loss": 1.1475, + "step": 8736 + }, + { + "epoch": 0.26, + "learning_rate": 4.320209302723119e-06, + "loss": 1.1958, + "step": 8737 + }, + { + "epoch": 0.26, + "learning_rate": 4.320042089740752e-06, + "loss": 1.04, + "step": 8738 + }, + { + "epoch": 0.26, + "learning_rate": 4.319874859432462e-06, + "loss": 1.105, + "step": 8739 + }, + { + "epoch": 0.26, + "learning_rate": 4.31970761179984e-06, + "loss": 1.1215, + "step": 8740 + }, + { + "epoch": 0.26, + "learning_rate": 4.319540346844478e-06, + "loss": 1.1201, + "step": 8741 + }, + { + "epoch": 0.26, + "learning_rate": 4.319373064567966e-06, + "loss": 1.0936, + "step": 8742 + }, + { + "epoch": 0.26, + "learning_rate": 4.319205764971901e-06, + "loss": 1.1192, + "step": 8743 + }, + { + "epoch": 0.26, + "learning_rate": 4.319038448057873e-06, + "loss": 1.1079, + "step": 8744 + }, + { + "epoch": 0.26, + "learning_rate": 4.318871113827474e-06, + "loss": 1.1464, + "step": 8745 + }, + { + "epoch": 0.26, + "learning_rate": 4.318703762282299e-06, + "loss": 1.0402, + "step": 8746 + }, + { + "epoch": 0.26, + "learning_rate": 4.31853639342394e-06, + "loss": 1.1134, + "step": 8747 + }, + { + "epoch": 0.26, + "learning_rate": 4.3183690072539895e-06, + "loss": 1.1464, + "step": 8748 + }, + { + "epoch": 0.26, + "learning_rate": 4.318201603774043e-06, + "loss": 1.0464, + "step": 8749 + }, + { + "epoch": 0.26, + "learning_rate": 4.318034182985692e-06, + "loss": 1.0597, + "step": 8750 + }, + { + "epoch": 0.26, + "learning_rate": 4.317866744890531e-06, + "loss": 1.2021, + "step": 8751 + }, + { + "epoch": 0.26, + "learning_rate": 4.317699289490155e-06, + "loss": 1.1422, + "step": 8752 + }, + { + "epoch": 0.26, + "learning_rate": 4.317531816786157e-06, + "loss": 1.1305, + "step": 8753 + }, + { + "epoch": 0.26, + "learning_rate": 4.317364326780131e-06, + "loss": 1.2868, + "step": 8754 + }, + { + "epoch": 0.26, + "learning_rate": 4.317196819473672e-06, + "loss": 1.2644, + "step": 8755 + }, + { + "epoch": 0.26, + "learning_rate": 4.317029294868375e-06, + "loss": 1.1208, + "step": 8756 + }, + { + "epoch": 0.26, + "learning_rate": 4.316861752965833e-06, + "loss": 1.0956, + "step": 8757 + }, + { + "epoch": 0.26, + "learning_rate": 4.316694193767643e-06, + "loss": 1.1184, + "step": 8758 + }, + { + "epoch": 0.26, + "learning_rate": 4.3165266172754e-06, + "loss": 1.1622, + "step": 8759 + }, + { + "epoch": 0.26, + "learning_rate": 4.316359023490697e-06, + "loss": 1.1792, + "step": 8760 + }, + { + "epoch": 0.26, + "learning_rate": 4.316191412415132e-06, + "loss": 1.2594, + "step": 8761 + }, + { + "epoch": 0.26, + "learning_rate": 4.316023784050298e-06, + "loss": 1.2888, + "step": 8762 + }, + { + "epoch": 0.26, + "learning_rate": 4.315856138397793e-06, + "loss": 1.1204, + "step": 8763 + }, + { + "epoch": 0.26, + "learning_rate": 4.315688475459213e-06, + "loss": 1.2872, + "step": 8764 + }, + { + "epoch": 0.26, + "learning_rate": 4.3155207952361525e-06, + "loss": 1.1531, + "step": 8765 + }, + { + "epoch": 0.26, + "learning_rate": 4.315353097730208e-06, + "loss": 1.1436, + "step": 8766 + }, + { + "epoch": 0.26, + "learning_rate": 4.315185382942977e-06, + "loss": 1.1478, + "step": 8767 + }, + { + "epoch": 0.26, + "learning_rate": 4.315017650876055e-06, + "loss": 1.0079, + "step": 8768 + }, + { + "epoch": 0.26, + "learning_rate": 4.314849901531038e-06, + "loss": 1.1091, + "step": 8769 + }, + { + "epoch": 0.26, + "learning_rate": 4.3146821349095255e-06, + "loss": 1.2197, + "step": 8770 + }, + { + "epoch": 0.26, + "learning_rate": 4.314514351013113e-06, + "loss": 1.0529, + "step": 8771 + }, + { + "epoch": 0.26, + "learning_rate": 4.314346549843398e-06, + "loss": 1.1516, + "step": 8772 + }, + { + "epoch": 0.26, + "learning_rate": 4.314178731401977e-06, + "loss": 1.1104, + "step": 8773 + }, + { + "epoch": 0.26, + "learning_rate": 4.314010895690449e-06, + "loss": 1.2328, + "step": 8774 + }, + { + "epoch": 0.26, + "learning_rate": 4.313843042710409e-06, + "loss": 1.2449, + "step": 8775 + }, + { + "epoch": 0.26, + "learning_rate": 4.313675172463459e-06, + "loss": 1.1816, + "step": 8776 + }, + { + "epoch": 0.26, + "learning_rate": 4.3135072849511935e-06, + "loss": 1.1885, + "step": 8777 + }, + { + "epoch": 0.26, + "learning_rate": 4.313339380175213e-06, + "loss": 1.1189, + "step": 8778 + }, + { + "epoch": 0.26, + "learning_rate": 4.313171458137114e-06, + "loss": 1.0867, + "step": 8779 + }, + { + "epoch": 0.26, + "learning_rate": 4.313003518838497e-06, + "loss": 1.0715, + "step": 8780 + }, + { + "epoch": 0.26, + "learning_rate": 4.31283556228096e-06, + "loss": 1.182, + "step": 8781 + }, + { + "epoch": 0.26, + "learning_rate": 4.312667588466099e-06, + "loss": 1.1343, + "step": 8782 + }, + { + "epoch": 0.26, + "learning_rate": 4.312499597395518e-06, + "loss": 1.1705, + "step": 8783 + }, + { + "epoch": 0.26, + "learning_rate": 4.312331589070813e-06, + "loss": 1.1937, + "step": 8784 + }, + { + "epoch": 0.26, + "learning_rate": 4.312163563493584e-06, + "loss": 1.2327, + "step": 8785 + }, + { + "epoch": 0.26, + "learning_rate": 4.311995520665431e-06, + "loss": 1.1735, + "step": 8786 + }, + { + "epoch": 0.26, + "learning_rate": 4.311827460587953e-06, + "loss": 1.0757, + "step": 8787 + }, + { + "epoch": 0.26, + "learning_rate": 4.31165938326275e-06, + "loss": 1.1531, + "step": 8788 + }, + { + "epoch": 0.26, + "learning_rate": 4.311491288691423e-06, + "loss": 1.0825, + "step": 8789 + }, + { + "epoch": 0.26, + "learning_rate": 4.31132317687557e-06, + "loss": 1.1149, + "step": 8790 + }, + { + "epoch": 0.26, + "learning_rate": 4.311155047816794e-06, + "loss": 1.1762, + "step": 8791 + }, + { + "epoch": 0.26, + "learning_rate": 4.310986901516694e-06, + "loss": 1.2268, + "step": 8792 + }, + { + "epoch": 0.26, + "learning_rate": 4.31081873797687e-06, + "loss": 1.0991, + "step": 8793 + }, + { + "epoch": 0.26, + "learning_rate": 4.310650557198925e-06, + "loss": 1.2352, + "step": 8794 + }, + { + "epoch": 0.26, + "learning_rate": 4.310482359184458e-06, + "loss": 1.1009, + "step": 8795 + }, + { + "epoch": 0.26, + "learning_rate": 4.310314143935071e-06, + "loss": 1.0337, + "step": 8796 + }, + { + "epoch": 0.27, + "learning_rate": 4.310145911452365e-06, + "loss": 1.1472, + "step": 8797 + }, + { + "epoch": 0.27, + "learning_rate": 4.309977661737942e-06, + "loss": 1.2031, + "step": 8798 + }, + { + "epoch": 0.27, + "learning_rate": 4.309809394793404e-06, + "loss": 1.1462, + "step": 8799 + }, + { + "epoch": 0.27, + "learning_rate": 4.309641110620352e-06, + "loss": 1.176, + "step": 8800 + }, + { + "epoch": 0.27, + "learning_rate": 4.309472809220388e-06, + "loss": 1.0925, + "step": 8801 + }, + { + "epoch": 0.27, + "learning_rate": 4.309304490595113e-06, + "loss": 1.1738, + "step": 8802 + }, + { + "epoch": 0.27, + "learning_rate": 4.309136154746132e-06, + "loss": 1.1196, + "step": 8803 + }, + { + "epoch": 0.27, + "learning_rate": 4.308967801675046e-06, + "loss": 1.1007, + "step": 8804 + }, + { + "epoch": 0.27, + "learning_rate": 4.308799431383457e-06, + "loss": 1.2717, + "step": 8805 + }, + { + "epoch": 0.27, + "learning_rate": 4.30863104387297e-06, + "loss": 1.0263, + "step": 8806 + }, + { + "epoch": 0.27, + "learning_rate": 4.308462639145186e-06, + "loss": 1.1437, + "step": 8807 + }, + { + "epoch": 0.27, + "learning_rate": 4.308294217201707e-06, + "loss": 1.2017, + "step": 8808 + }, + { + "epoch": 0.27, + "learning_rate": 4.30812577804414e-06, + "loss": 1.1136, + "step": 8809 + }, + { + "epoch": 0.27, + "learning_rate": 4.3079573216740855e-06, + "loss": 1.1036, + "step": 8810 + }, + { + "epoch": 0.27, + "learning_rate": 4.307788848093148e-06, + "loss": 1.2711, + "step": 8811 + }, + { + "epoch": 0.27, + "learning_rate": 4.307620357302932e-06, + "loss": 1.2437, + "step": 8812 + }, + { + "epoch": 0.27, + "learning_rate": 4.30745184930504e-06, + "loss": 1.0417, + "step": 8813 + }, + { + "epoch": 0.27, + "learning_rate": 4.307283324101078e-06, + "loss": 1.239, + "step": 8814 + }, + { + "epoch": 0.27, + "learning_rate": 4.3071147816926484e-06, + "loss": 1.2433, + "step": 8815 + }, + { + "epoch": 0.27, + "learning_rate": 4.306946222081356e-06, + "loss": 1.105, + "step": 8816 + }, + { + "epoch": 0.27, + "learning_rate": 4.306777645268806e-06, + "loss": 1.0569, + "step": 8817 + }, + { + "epoch": 0.27, + "learning_rate": 4.306609051256603e-06, + "loss": 1.1519, + "step": 8818 + }, + { + "epoch": 0.27, + "learning_rate": 4.306440440046353e-06, + "loss": 1.0289, + "step": 8819 + }, + { + "epoch": 0.27, + "learning_rate": 4.306271811639659e-06, + "loss": 1.174, + "step": 8820 + }, + { + "epoch": 0.27, + "learning_rate": 4.3061031660381275e-06, + "loss": 1.1023, + "step": 8821 + }, + { + "epoch": 0.27, + "learning_rate": 4.305934503243364e-06, + "loss": 1.067, + "step": 8822 + }, + { + "epoch": 0.27, + "learning_rate": 4.305765823256973e-06, + "loss": 1.1971, + "step": 8823 + }, + { + "epoch": 0.27, + "learning_rate": 4.305597126080562e-06, + "loss": 1.2474, + "step": 8824 + }, + { + "epoch": 0.27, + "learning_rate": 4.305428411715735e-06, + "loss": 1.0916, + "step": 8825 + }, + { + "epoch": 0.27, + "learning_rate": 4.3052596801641e-06, + "loss": 1.1628, + "step": 8826 + }, + { + "epoch": 0.27, + "learning_rate": 4.305090931427262e-06, + "loss": 1.0533, + "step": 8827 + }, + { + "epoch": 0.27, + "learning_rate": 4.304922165506827e-06, + "loss": 1.0348, + "step": 8828 + }, + { + "epoch": 0.27, + "learning_rate": 4.304753382404403e-06, + "loss": 1.2133, + "step": 8829 + }, + { + "epoch": 0.27, + "learning_rate": 4.304584582121596e-06, + "loss": 1.2216, + "step": 8830 + }, + { + "epoch": 0.27, + "learning_rate": 4.304415764660013e-06, + "loss": 1.1978, + "step": 8831 + }, + { + "epoch": 0.27, + "learning_rate": 4.30424693002126e-06, + "loss": 1.2048, + "step": 8832 + }, + { + "epoch": 0.27, + "learning_rate": 4.304078078206946e-06, + "loss": 1.1185, + "step": 8833 + }, + { + "epoch": 0.27, + "learning_rate": 4.303909209218677e-06, + "loss": 1.1116, + "step": 8834 + }, + { + "epoch": 0.27, + "learning_rate": 4.303740323058062e-06, + "loss": 1.2192, + "step": 8835 + }, + { + "epoch": 0.27, + "learning_rate": 4.303571419726707e-06, + "loss": 1.1454, + "step": 8836 + }, + { + "epoch": 0.27, + "learning_rate": 4.303402499226221e-06, + "loss": 1.1482, + "step": 8837 + }, + { + "epoch": 0.27, + "learning_rate": 4.303233561558212e-06, + "loss": 1.0934, + "step": 8838 + }, + { + "epoch": 0.27, + "learning_rate": 4.303064606724288e-06, + "loss": 1.0638, + "step": 8839 + }, + { + "epoch": 0.27, + "learning_rate": 4.302895634726057e-06, + "loss": 1.0439, + "step": 8840 + }, + { + "epoch": 0.27, + "learning_rate": 4.302726645565129e-06, + "loss": 1.0472, + "step": 8841 + }, + { + "epoch": 0.27, + "learning_rate": 4.30255763924311e-06, + "loss": 1.0364, + "step": 8842 + }, + { + "epoch": 0.27, + "learning_rate": 4.302388615761611e-06, + "loss": 1.2788, + "step": 8843 + }, + { + "epoch": 0.27, + "learning_rate": 4.302219575122239e-06, + "loss": 1.3479, + "step": 8844 + }, + { + "epoch": 0.27, + "learning_rate": 4.302050517326607e-06, + "loss": 1.191, + "step": 8845 + }, + { + "epoch": 0.27, + "learning_rate": 4.301881442376321e-06, + "loss": 1.1122, + "step": 8846 + }, + { + "epoch": 0.27, + "learning_rate": 4.301712350272991e-06, + "loss": 1.1191, + "step": 8847 + }, + { + "epoch": 0.27, + "learning_rate": 4.301543241018228e-06, + "loss": 1.1412, + "step": 8848 + }, + { + "epoch": 0.27, + "learning_rate": 4.3013741146136406e-06, + "loss": 1.266, + "step": 8849 + }, + { + "epoch": 0.27, + "learning_rate": 4.30120497106084e-06, + "loss": 1.1889, + "step": 8850 + }, + { + "epoch": 0.27, + "learning_rate": 4.301035810361433e-06, + "loss": 1.1819, + "step": 8851 + }, + { + "epoch": 0.27, + "learning_rate": 4.3008666325170355e-06, + "loss": 1.1592, + "step": 8852 + }, + { + "epoch": 0.27, + "learning_rate": 4.300697437529253e-06, + "loss": 1.1761, + "step": 8853 + }, + { + "epoch": 0.27, + "learning_rate": 4.3005282253996996e-06, + "loss": 1.2156, + "step": 8854 + }, + { + "epoch": 0.27, + "learning_rate": 4.300358996129984e-06, + "loss": 1.1392, + "step": 8855 + }, + { + "epoch": 0.27, + "learning_rate": 4.3001897497217186e-06, + "loss": 1.2167, + "step": 8856 + }, + { + "epoch": 0.27, + "learning_rate": 4.300020486176512e-06, + "loss": 1.1684, + "step": 8857 + }, + { + "epoch": 0.27, + "learning_rate": 4.2998512054959785e-06, + "loss": 1.1436, + "step": 8858 + }, + { + "epoch": 0.27, + "learning_rate": 4.299681907681728e-06, + "loss": 1.1144, + "step": 8859 + }, + { + "epoch": 0.27, + "learning_rate": 4.299512592735373e-06, + "loss": 1.1127, + "step": 8860 + }, + { + "epoch": 0.27, + "learning_rate": 4.2993432606585235e-06, + "loss": 1.2085, + "step": 8861 + }, + { + "epoch": 0.27, + "learning_rate": 4.299173911452794e-06, + "loss": 1.1202, + "step": 8862 + }, + { + "epoch": 0.27, + "learning_rate": 4.2990045451197956e-06, + "loss": 1.1672, + "step": 8863 + }, + { + "epoch": 0.27, + "learning_rate": 4.29883516166114e-06, + "loss": 1.151, + "step": 8864 + }, + { + "epoch": 0.27, + "learning_rate": 4.298665761078439e-06, + "loss": 1.1138, + "step": 8865 + }, + { + "epoch": 0.27, + "learning_rate": 4.298496343373307e-06, + "loss": 1.0929, + "step": 8866 + }, + { + "epoch": 0.27, + "learning_rate": 4.298326908547357e-06, + "loss": 1.1553, + "step": 8867 + }, + { + "epoch": 0.27, + "learning_rate": 4.2981574566022e-06, + "loss": 1.0873, + "step": 8868 + }, + { + "epoch": 0.27, + "learning_rate": 4.29798798753945e-06, + "loss": 1.1889, + "step": 8869 + }, + { + "epoch": 0.27, + "learning_rate": 4.29781850136072e-06, + "loss": 1.1727, + "step": 8870 + }, + { + "epoch": 0.27, + "learning_rate": 4.297648998067624e-06, + "loss": 1.1829, + "step": 8871 + }, + { + "epoch": 0.27, + "learning_rate": 4.297479477661775e-06, + "loss": 1.1821, + "step": 8872 + }, + { + "epoch": 0.27, + "learning_rate": 4.297309940144788e-06, + "loss": 1.0759, + "step": 8873 + }, + { + "epoch": 0.27, + "learning_rate": 4.297140385518275e-06, + "loss": 1.2217, + "step": 8874 + }, + { + "epoch": 0.27, + "learning_rate": 4.2969708137838515e-06, + "loss": 1.1317, + "step": 8875 + }, + { + "epoch": 0.27, + "learning_rate": 4.296801224943131e-06, + "loss": 1.2098, + "step": 8876 + }, + { + "epoch": 0.27, + "learning_rate": 4.296631618997728e-06, + "loss": 1.1542, + "step": 8877 + }, + { + "epoch": 0.27, + "learning_rate": 4.2964619959492586e-06, + "loss": 1.072, + "step": 8878 + }, + { + "epoch": 0.27, + "learning_rate": 4.296292355799335e-06, + "loss": 1.0927, + "step": 8879 + }, + { + "epoch": 0.27, + "learning_rate": 4.296122698549574e-06, + "loss": 1.0845, + "step": 8880 + }, + { + "epoch": 0.27, + "learning_rate": 4.29595302420159e-06, + "loss": 1.2031, + "step": 8881 + }, + { + "epoch": 0.27, + "learning_rate": 4.295783332756997e-06, + "loss": 1.1674, + "step": 8882 + }, + { + "epoch": 0.27, + "learning_rate": 4.295613624217413e-06, + "loss": 1.1475, + "step": 8883 + }, + { + "epoch": 0.27, + "learning_rate": 4.295443898584451e-06, + "loss": 1.1178, + "step": 8884 + }, + { + "epoch": 0.27, + "learning_rate": 4.295274155859729e-06, + "loss": 1.2244, + "step": 8885 + }, + { + "epoch": 0.27, + "learning_rate": 4.295104396044861e-06, + "loss": 1.2239, + "step": 8886 + }, + { + "epoch": 0.27, + "learning_rate": 4.2949346191414635e-06, + "loss": 1.2347, + "step": 8887 + }, + { + "epoch": 0.27, + "learning_rate": 4.294764825151153e-06, + "loss": 1.1401, + "step": 8888 + }, + { + "epoch": 0.27, + "learning_rate": 4.2945950140755454e-06, + "loss": 1.1016, + "step": 8889 + }, + { + "epoch": 0.27, + "learning_rate": 4.294425185916258e-06, + "loss": 1.12, + "step": 8890 + }, + { + "epoch": 0.27, + "learning_rate": 4.2942553406749064e-06, + "loss": 1.0901, + "step": 8891 + }, + { + "epoch": 0.27, + "learning_rate": 4.2940854783531096e-06, + "loss": 1.1274, + "step": 8892 + }, + { + "epoch": 0.27, + "learning_rate": 4.2939155989524815e-06, + "loss": 1.0998, + "step": 8893 + }, + { + "epoch": 0.27, + "learning_rate": 4.293745702474642e-06, + "loss": 1.2095, + "step": 8894 + }, + { + "epoch": 0.27, + "learning_rate": 4.293575788921207e-06, + "loss": 1.2059, + "step": 8895 + }, + { + "epoch": 0.27, + "learning_rate": 4.293405858293794e-06, + "loss": 1.0933, + "step": 8896 + }, + { + "epoch": 0.27, + "learning_rate": 4.2932359105940215e-06, + "loss": 1.1818, + "step": 8897 + }, + { + "epoch": 0.27, + "learning_rate": 4.293065945823506e-06, + "loss": 1.1946, + "step": 8898 + }, + { + "epoch": 0.27, + "learning_rate": 4.292895963983866e-06, + "loss": 1.1222, + "step": 8899 + }, + { + "epoch": 0.27, + "learning_rate": 4.292725965076721e-06, + "loss": 1.1678, + "step": 8900 + }, + { + "epoch": 0.27, + "learning_rate": 4.292555949103688e-06, + "loss": 1.2596, + "step": 8901 + }, + { + "epoch": 0.27, + "learning_rate": 4.292385916066385e-06, + "loss": 1.1316, + "step": 8902 + }, + { + "epoch": 0.27, + "learning_rate": 4.292215865966433e-06, + "loss": 1.181, + "step": 8903 + }, + { + "epoch": 0.27, + "learning_rate": 4.292045798805448e-06, + "loss": 1.076, + "step": 8904 + }, + { + "epoch": 0.27, + "learning_rate": 4.29187571458505e-06, + "loss": 1.104, + "step": 8905 + }, + { + "epoch": 0.27, + "learning_rate": 4.291705613306858e-06, + "loss": 1.286, + "step": 8906 + }, + { + "epoch": 0.27, + "learning_rate": 4.291535494972491e-06, + "loss": 1.1431, + "step": 8907 + }, + { + "epoch": 0.27, + "learning_rate": 4.2913653595835705e-06, + "loss": 1.1295, + "step": 8908 + }, + { + "epoch": 0.27, + "learning_rate": 4.291195207141713e-06, + "loss": 1.1783, + "step": 8909 + }, + { + "epoch": 0.27, + "learning_rate": 4.291025037648541e-06, + "loss": 1.0871, + "step": 8910 + }, + { + "epoch": 0.27, + "learning_rate": 4.290854851105672e-06, + "loss": 1.0897, + "step": 8911 + }, + { + "epoch": 0.27, + "learning_rate": 4.290684647514728e-06, + "loss": 1.2651, + "step": 8912 + }, + { + "epoch": 0.27, + "learning_rate": 4.290514426877328e-06, + "loss": 1.0588, + "step": 8913 + }, + { + "epoch": 0.27, + "learning_rate": 4.290344189195094e-06, + "loss": 1.0923, + "step": 8914 + }, + { + "epoch": 0.27, + "learning_rate": 4.290173934469646e-06, + "loss": 1.1547, + "step": 8915 + }, + { + "epoch": 0.27, + "learning_rate": 4.290003662702603e-06, + "loss": 1.1174, + "step": 8916 + }, + { + "epoch": 0.27, + "learning_rate": 4.289833373895588e-06, + "loss": 1.1804, + "step": 8917 + }, + { + "epoch": 0.27, + "learning_rate": 4.289663068050221e-06, + "loss": 1.269, + "step": 8918 + }, + { + "epoch": 0.27, + "learning_rate": 4.289492745168124e-06, + "loss": 1.3033, + "step": 8919 + }, + { + "epoch": 0.27, + "learning_rate": 4.289322405250916e-06, + "loss": 1.0831, + "step": 8920 + }, + { + "epoch": 0.27, + "learning_rate": 4.2891520483002224e-06, + "loss": 1.1108, + "step": 8921 + }, + { + "epoch": 0.27, + "learning_rate": 4.288981674317663e-06, + "loss": 1.0806, + "step": 8922 + }, + { + "epoch": 0.27, + "learning_rate": 4.288811283304859e-06, + "loss": 1.2271, + "step": 8923 + }, + { + "epoch": 0.27, + "learning_rate": 4.288640875263433e-06, + "loss": 1.1255, + "step": 8924 + }, + { + "epoch": 0.27, + "learning_rate": 4.288470450195007e-06, + "loss": 1.1486, + "step": 8925 + }, + { + "epoch": 0.27, + "learning_rate": 4.288300008101205e-06, + "loss": 1.2958, + "step": 8926 + }, + { + "epoch": 0.27, + "learning_rate": 4.288129548983647e-06, + "loss": 1.2314, + "step": 8927 + }, + { + "epoch": 0.27, + "learning_rate": 4.287959072843957e-06, + "loss": 1.0612, + "step": 8928 + }, + { + "epoch": 0.27, + "learning_rate": 4.287788579683759e-06, + "loss": 1.0005, + "step": 8929 + }, + { + "epoch": 0.27, + "learning_rate": 4.287618069504673e-06, + "loss": 1.2623, + "step": 8930 + }, + { + "epoch": 0.27, + "learning_rate": 4.287447542308325e-06, + "loss": 1.1404, + "step": 8931 + }, + { + "epoch": 0.27, + "learning_rate": 4.287276998096337e-06, + "loss": 1.1201, + "step": 8932 + }, + { + "epoch": 0.27, + "learning_rate": 4.287106436870333e-06, + "loss": 1.1313, + "step": 8933 + }, + { + "epoch": 0.27, + "learning_rate": 4.2869358586319355e-06, + "loss": 1.2703, + "step": 8934 + }, + { + "epoch": 0.27, + "learning_rate": 4.286765263382771e-06, + "loss": 1.1149, + "step": 8935 + }, + { + "epoch": 0.27, + "learning_rate": 4.28659465112446e-06, + "loss": 1.1994, + "step": 8936 + }, + { + "epoch": 0.27, + "learning_rate": 4.286424021858629e-06, + "loss": 1.0842, + "step": 8937 + }, + { + "epoch": 0.27, + "learning_rate": 4.286253375586901e-06, + "loss": 1.0256, + "step": 8938 + }, + { + "epoch": 0.27, + "learning_rate": 4.286082712310903e-06, + "loss": 1.1284, + "step": 8939 + }, + { + "epoch": 0.27, + "learning_rate": 4.285912032032256e-06, + "loss": 1.1035, + "step": 8940 + }, + { + "epoch": 0.27, + "learning_rate": 4.285741334752588e-06, + "loss": 1.1863, + "step": 8941 + }, + { + "epoch": 0.27, + "learning_rate": 4.285570620473522e-06, + "loss": 1.1743, + "step": 8942 + }, + { + "epoch": 0.27, + "learning_rate": 4.285399889196683e-06, + "loss": 1.2101, + "step": 8943 + }, + { + "epoch": 0.27, + "learning_rate": 4.2852291409236965e-06, + "loss": 1.1922, + "step": 8944 + }, + { + "epoch": 0.27, + "learning_rate": 4.28505837565619e-06, + "loss": 1.1323, + "step": 8945 + }, + { + "epoch": 0.27, + "learning_rate": 4.284887593395787e-06, + "loss": 1.283, + "step": 8946 + }, + { + "epoch": 0.27, + "learning_rate": 4.284716794144113e-06, + "loss": 1.1819, + "step": 8947 + }, + { + "epoch": 0.27, + "learning_rate": 4.284545977902795e-06, + "loss": 1.196, + "step": 8948 + }, + { + "epoch": 0.27, + "learning_rate": 4.284375144673459e-06, + "loss": 1.3448, + "step": 8949 + }, + { + "epoch": 0.27, + "learning_rate": 4.284204294457731e-06, + "loss": 1.2335, + "step": 8950 + }, + { + "epoch": 0.27, + "learning_rate": 4.284033427257237e-06, + "loss": 1.2208, + "step": 8951 + }, + { + "epoch": 0.27, + "learning_rate": 4.2838625430736046e-06, + "loss": 1.1171, + "step": 8952 + }, + { + "epoch": 0.27, + "learning_rate": 4.28369164190846e-06, + "loss": 1.0951, + "step": 8953 + }, + { + "epoch": 0.27, + "learning_rate": 4.283520723763429e-06, + "loss": 1.1286, + "step": 8954 + }, + { + "epoch": 0.27, + "learning_rate": 4.28334978864014e-06, + "loss": 1.1654, + "step": 8955 + }, + { + "epoch": 0.27, + "learning_rate": 4.2831788365402205e-06, + "loss": 1.152, + "step": 8956 + }, + { + "epoch": 0.27, + "learning_rate": 4.2830078674652965e-06, + "loss": 1.0474, + "step": 8957 + }, + { + "epoch": 0.27, + "learning_rate": 4.282836881416997e-06, + "loss": 1.2014, + "step": 8958 + }, + { + "epoch": 0.27, + "learning_rate": 4.282665878396949e-06, + "loss": 1.1311, + "step": 8959 + }, + { + "epoch": 0.27, + "learning_rate": 4.282494858406781e-06, + "loss": 1.1298, + "step": 8960 + }, + { + "epoch": 0.27, + "learning_rate": 4.282323821448119e-06, + "loss": 1.1812, + "step": 8961 + }, + { + "epoch": 0.27, + "learning_rate": 4.282152767522594e-06, + "loss": 1.1141, + "step": 8962 + }, + { + "epoch": 0.27, + "learning_rate": 4.281981696631832e-06, + "loss": 1.128, + "step": 8963 + }, + { + "epoch": 0.27, + "learning_rate": 4.2818106087774625e-06, + "loss": 1.1251, + "step": 8964 + }, + { + "epoch": 0.27, + "learning_rate": 4.281639503961114e-06, + "loss": 1.1646, + "step": 8965 + }, + { + "epoch": 0.27, + "learning_rate": 4.281468382184416e-06, + "loss": 1.1241, + "step": 8966 + }, + { + "epoch": 0.27, + "learning_rate": 4.281297243448997e-06, + "loss": 1.1856, + "step": 8967 + }, + { + "epoch": 0.27, + "learning_rate": 4.281126087756487e-06, + "loss": 1.2209, + "step": 8968 + }, + { + "epoch": 0.27, + "learning_rate": 4.280954915108513e-06, + "loss": 1.2016, + "step": 8969 + }, + { + "epoch": 0.27, + "learning_rate": 4.280783725506706e-06, + "loss": 1.0934, + "step": 8970 + }, + { + "epoch": 0.27, + "learning_rate": 4.280612518952696e-06, + "loss": 1.0954, + "step": 8971 + }, + { + "epoch": 0.27, + "learning_rate": 4.280441295448112e-06, + "loss": 1.0681, + "step": 8972 + }, + { + "epoch": 0.27, + "learning_rate": 4.280270054994586e-06, + "loss": 1.28, + "step": 8973 + }, + { + "epoch": 0.27, + "learning_rate": 4.280098797593744e-06, + "loss": 1.1671, + "step": 8974 + }, + { + "epoch": 0.27, + "learning_rate": 4.27992752324722e-06, + "loss": 1.0878, + "step": 8975 + }, + { + "epoch": 0.27, + "learning_rate": 4.2797562319566435e-06, + "loss": 1.1813, + "step": 8976 + }, + { + "epoch": 0.27, + "learning_rate": 4.279584923723645e-06, + "loss": 0.9933, + "step": 8977 + }, + { + "epoch": 0.27, + "learning_rate": 4.2794135985498544e-06, + "loss": 1.1849, + "step": 8978 + }, + { + "epoch": 0.27, + "learning_rate": 4.279242256436904e-06, + "loss": 1.1835, + "step": 8979 + }, + { + "epoch": 0.27, + "learning_rate": 4.279070897386424e-06, + "loss": 1.1305, + "step": 8980 + }, + { + "epoch": 0.27, + "learning_rate": 4.278899521400045e-06, + "loss": 1.1035, + "step": 8981 + }, + { + "epoch": 0.27, + "learning_rate": 4.2787281284794e-06, + "loss": 1.0959, + "step": 8982 + }, + { + "epoch": 0.27, + "learning_rate": 4.27855671862612e-06, + "loss": 1.0795, + "step": 8983 + }, + { + "epoch": 0.27, + "learning_rate": 4.278385291841837e-06, + "loss": 1.0635, + "step": 8984 + }, + { + "epoch": 0.27, + "learning_rate": 4.278213848128182e-06, + "loss": 1.1336, + "step": 8985 + }, + { + "epoch": 0.27, + "learning_rate": 4.278042387486787e-06, + "loss": 1.0648, + "step": 8986 + }, + { + "epoch": 0.27, + "learning_rate": 4.277870909919286e-06, + "loss": 1.1083, + "step": 8987 + }, + { + "epoch": 0.27, + "learning_rate": 4.27769941542731e-06, + "loss": 1.0873, + "step": 8988 + }, + { + "epoch": 0.27, + "learning_rate": 4.277527904012491e-06, + "loss": 1.1492, + "step": 8989 + }, + { + "epoch": 0.27, + "learning_rate": 4.277356375676462e-06, + "loss": 1.1184, + "step": 8990 + }, + { + "epoch": 0.27, + "learning_rate": 4.277184830420858e-06, + "loss": 1.1379, + "step": 8991 + }, + { + "epoch": 0.27, + "learning_rate": 4.27701326824731e-06, + "loss": 1.134, + "step": 8992 + }, + { + "epoch": 0.27, + "learning_rate": 4.27684168915745e-06, + "loss": 1.1745, + "step": 8993 + }, + { + "epoch": 0.27, + "learning_rate": 4.276670093152915e-06, + "loss": 1.1367, + "step": 8994 + }, + { + "epoch": 0.27, + "learning_rate": 4.276498480235335e-06, + "loss": 1.1113, + "step": 8995 + }, + { + "epoch": 0.27, + "learning_rate": 4.276326850406345e-06, + "loss": 1.113, + "step": 8996 + }, + { + "epoch": 0.27, + "learning_rate": 4.276155203667579e-06, + "loss": 1.0485, + "step": 8997 + }, + { + "epoch": 0.27, + "learning_rate": 4.275983540020671e-06, + "loss": 1.149, + "step": 8998 + }, + { + "epoch": 0.27, + "learning_rate": 4.275811859467255e-06, + "loss": 1.1727, + "step": 8999 + }, + { + "epoch": 0.27, + "learning_rate": 4.275640162008966e-06, + "loss": 1.2222, + "step": 9000 + }, + { + "epoch": 0.27, + "learning_rate": 4.275468447647438e-06, + "loss": 1.1234, + "step": 9001 + }, + { + "epoch": 0.27, + "learning_rate": 4.275296716384304e-06, + "loss": 1.1953, + "step": 9002 + }, + { + "epoch": 0.27, + "learning_rate": 4.275124968221201e-06, + "loss": 1.093, + "step": 9003 + }, + { + "epoch": 0.27, + "learning_rate": 4.274953203159763e-06, + "loss": 1.1807, + "step": 9004 + }, + { + "epoch": 0.27, + "learning_rate": 4.274781421201626e-06, + "loss": 1.2792, + "step": 9005 + }, + { + "epoch": 0.27, + "learning_rate": 4.2746096223484245e-06, + "loss": 1.1591, + "step": 9006 + }, + { + "epoch": 0.27, + "learning_rate": 4.274437806601794e-06, + "loss": 1.0891, + "step": 9007 + }, + { + "epoch": 0.27, + "learning_rate": 4.2742659739633695e-06, + "loss": 1.058, + "step": 9008 + }, + { + "epoch": 0.27, + "learning_rate": 4.274094124434788e-06, + "loss": 1.0943, + "step": 9009 + }, + { + "epoch": 0.27, + "learning_rate": 4.273922258017685e-06, + "loss": 1.0828, + "step": 9010 + }, + { + "epoch": 0.27, + "learning_rate": 4.273750374713697e-06, + "loss": 1.0988, + "step": 9011 + }, + { + "epoch": 0.27, + "learning_rate": 4.273578474524459e-06, + "loss": 1.2403, + "step": 9012 + }, + { + "epoch": 0.27, + "learning_rate": 4.273406557451608e-06, + "loss": 1.088, + "step": 9013 + }, + { + "epoch": 0.27, + "learning_rate": 4.2732346234967805e-06, + "loss": 1.2229, + "step": 9014 + }, + { + "epoch": 0.27, + "learning_rate": 4.273062672661613e-06, + "loss": 1.1648, + "step": 9015 + }, + { + "epoch": 0.27, + "learning_rate": 4.272890704947744e-06, + "loss": 1.0144, + "step": 9016 + }, + { + "epoch": 0.27, + "learning_rate": 4.272718720356809e-06, + "loss": 1.1093, + "step": 9017 + }, + { + "epoch": 0.27, + "learning_rate": 4.2725467188904455e-06, + "loss": 1.187, + "step": 9018 + }, + { + "epoch": 0.27, + "learning_rate": 4.27237470055029e-06, + "loss": 1.1527, + "step": 9019 + }, + { + "epoch": 0.27, + "learning_rate": 4.2722026653379824e-06, + "loss": 1.1018, + "step": 9020 + }, + { + "epoch": 0.27, + "learning_rate": 4.272030613255158e-06, + "loss": 1.1902, + "step": 9021 + }, + { + "epoch": 0.27, + "learning_rate": 4.2718585443034564e-06, + "loss": 1.142, + "step": 9022 + }, + { + "epoch": 0.27, + "learning_rate": 4.271686458484514e-06, + "loss": 1.0395, + "step": 9023 + }, + { + "epoch": 0.27, + "learning_rate": 4.27151435579997e-06, + "loss": 1.064, + "step": 9024 + }, + { + "epoch": 0.27, + "learning_rate": 4.2713422362514625e-06, + "loss": 1.1859, + "step": 9025 + }, + { + "epoch": 0.27, + "learning_rate": 4.27117009984063e-06, + "loss": 1.1697, + "step": 9026 + }, + { + "epoch": 0.27, + "learning_rate": 4.270997946569112e-06, + "loss": 1.2428, + "step": 9027 + }, + { + "epoch": 0.27, + "learning_rate": 4.2708257764385455e-06, + "loss": 1.1973, + "step": 9028 + }, + { + "epoch": 0.27, + "learning_rate": 4.27065358945057e-06, + "loss": 1.1345, + "step": 9029 + }, + { + "epoch": 0.27, + "learning_rate": 4.270481385606827e-06, + "loss": 1.1445, + "step": 9030 + }, + { + "epoch": 0.27, + "learning_rate": 4.270309164908952e-06, + "loss": 1.1616, + "step": 9031 + }, + { + "epoch": 0.27, + "learning_rate": 4.270136927358588e-06, + "loss": 1.1387, + "step": 9032 + }, + { + "epoch": 0.27, + "learning_rate": 4.269964672957372e-06, + "loss": 1.2211, + "step": 9033 + }, + { + "epoch": 0.27, + "learning_rate": 4.269792401706945e-06, + "loss": 1.0892, + "step": 9034 + }, + { + "epoch": 0.27, + "learning_rate": 4.2696201136089466e-06, + "loss": 1.0938, + "step": 9035 + }, + { + "epoch": 0.27, + "learning_rate": 4.269447808665017e-06, + "loss": 1.1801, + "step": 9036 + }, + { + "epoch": 0.27, + "learning_rate": 4.269275486876796e-06, + "loss": 1.0659, + "step": 9037 + }, + { + "epoch": 0.27, + "learning_rate": 4.269103148245925e-06, + "loss": 1.1445, + "step": 9038 + }, + { + "epoch": 0.27, + "learning_rate": 4.268930792774044e-06, + "loss": 1.0942, + "step": 9039 + }, + { + "epoch": 0.27, + "learning_rate": 4.268758420462794e-06, + "loss": 1.0779, + "step": 9040 + }, + { + "epoch": 0.27, + "learning_rate": 4.2685860313138155e-06, + "loss": 1.0579, + "step": 9041 + }, + { + "epoch": 0.27, + "learning_rate": 4.26841362532875e-06, + "loss": 1.0479, + "step": 9042 + }, + { + "epoch": 0.27, + "learning_rate": 4.268241202509238e-06, + "loss": 1.2421, + "step": 9043 + }, + { + "epoch": 0.27, + "learning_rate": 4.268068762856922e-06, + "loss": 1.1439, + "step": 9044 + }, + { + "epoch": 0.27, + "learning_rate": 4.267896306373442e-06, + "loss": 1.1202, + "step": 9045 + }, + { + "epoch": 0.27, + "learning_rate": 4.267723833060441e-06, + "loss": 1.1416, + "step": 9046 + }, + { + "epoch": 0.27, + "learning_rate": 4.2675513429195605e-06, + "loss": 1.2198, + "step": 9047 + }, + { + "epoch": 0.27, + "learning_rate": 4.267378835952442e-06, + "loss": 1.2384, + "step": 9048 + }, + { + "epoch": 0.27, + "learning_rate": 4.26720631216073e-06, + "loss": 1.119, + "step": 9049 + }, + { + "epoch": 0.27, + "learning_rate": 4.267033771546063e-06, + "loss": 1.0582, + "step": 9050 + }, + { + "epoch": 0.27, + "learning_rate": 4.266861214110086e-06, + "loss": 1.2094, + "step": 9051 + }, + { + "epoch": 0.27, + "learning_rate": 4.266688639854442e-06, + "loss": 1.2684, + "step": 9052 + }, + { + "epoch": 0.27, + "learning_rate": 4.2665160487807724e-06, + "loss": 1.2584, + "step": 9053 + }, + { + "epoch": 0.27, + "learning_rate": 4.266343440890721e-06, + "loss": 1.0854, + "step": 9054 + }, + { + "epoch": 0.27, + "learning_rate": 4.2661708161859304e-06, + "loss": 1.2458, + "step": 9055 + }, + { + "epoch": 0.27, + "learning_rate": 4.265998174668045e-06, + "loss": 1.0647, + "step": 9056 + }, + { + "epoch": 0.27, + "learning_rate": 4.265825516338707e-06, + "loss": 1.1754, + "step": 9057 + }, + { + "epoch": 0.27, + "learning_rate": 4.265652841199561e-06, + "loss": 1.1512, + "step": 9058 + }, + { + "epoch": 0.27, + "learning_rate": 4.265480149252249e-06, + "loss": 1.1954, + "step": 9059 + }, + { + "epoch": 0.27, + "learning_rate": 4.265307440498418e-06, + "loss": 1.1539, + "step": 9060 + }, + { + "epoch": 0.27, + "learning_rate": 4.265134714939709e-06, + "loss": 1.2629, + "step": 9061 + }, + { + "epoch": 0.27, + "learning_rate": 4.264961972577768e-06, + "loss": 1.2589, + "step": 9062 + }, + { + "epoch": 0.27, + "learning_rate": 4.26478921341424e-06, + "loss": 1.1626, + "step": 9063 + }, + { + "epoch": 0.27, + "learning_rate": 4.264616437450767e-06, + "loss": 1.0897, + "step": 9064 + }, + { + "epoch": 0.27, + "learning_rate": 4.264443644688997e-06, + "loss": 1.04, + "step": 9065 + }, + { + "epoch": 0.27, + "learning_rate": 4.264270835130572e-06, + "loss": 1.3087, + "step": 9066 + }, + { + "epoch": 0.27, + "learning_rate": 4.264098008777139e-06, + "loss": 1.1443, + "step": 9067 + }, + { + "epoch": 0.27, + "learning_rate": 4.263925165630343e-06, + "loss": 1.0821, + "step": 9068 + }, + { + "epoch": 0.27, + "learning_rate": 4.2637523056918275e-06, + "loss": 1.3202, + "step": 9069 + }, + { + "epoch": 0.27, + "learning_rate": 4.26357942896324e-06, + "loss": 1.1521, + "step": 9070 + }, + { + "epoch": 0.27, + "learning_rate": 4.2634065354462265e-06, + "loss": 1.1404, + "step": 9071 + }, + { + "epoch": 0.27, + "learning_rate": 4.263233625142432e-06, + "loss": 1.0673, + "step": 9072 + }, + { + "epoch": 0.27, + "learning_rate": 4.263060698053503e-06, + "loss": 1.0665, + "step": 9073 + }, + { + "epoch": 0.27, + "learning_rate": 4.2628877541810835e-06, + "loss": 1.1838, + "step": 9074 + }, + { + "epoch": 0.27, + "learning_rate": 4.262714793526823e-06, + "loss": 1.1625, + "step": 9075 + }, + { + "epoch": 0.27, + "learning_rate": 4.262541816092366e-06, + "loss": 1.2363, + "step": 9076 + }, + { + "epoch": 0.27, + "learning_rate": 4.26236882187936e-06, + "loss": 1.1642, + "step": 9077 + }, + { + "epoch": 0.27, + "learning_rate": 4.262195810889452e-06, + "loss": 1.0432, + "step": 9078 + }, + { + "epoch": 0.27, + "learning_rate": 4.262022783124288e-06, + "loss": 1.2277, + "step": 9079 + }, + { + "epoch": 0.27, + "learning_rate": 4.261849738585516e-06, + "loss": 1.2099, + "step": 9080 + }, + { + "epoch": 0.27, + "learning_rate": 4.261676677274783e-06, + "loss": 1.1777, + "step": 9081 + }, + { + "epoch": 0.27, + "learning_rate": 4.261503599193737e-06, + "loss": 1.1218, + "step": 9082 + }, + { + "epoch": 0.27, + "learning_rate": 4.261330504344024e-06, + "loss": 1.0921, + "step": 9083 + }, + { + "epoch": 0.27, + "learning_rate": 4.261157392727293e-06, + "loss": 1.1009, + "step": 9084 + }, + { + "epoch": 0.27, + "learning_rate": 4.260984264345192e-06, + "loss": 1.0857, + "step": 9085 + }, + { + "epoch": 0.27, + "learning_rate": 4.26081111919937e-06, + "loss": 1.2063, + "step": 9086 + }, + { + "epoch": 0.27, + "learning_rate": 4.260637957291473e-06, + "loss": 1.1998, + "step": 9087 + }, + { + "epoch": 0.27, + "learning_rate": 4.260464778623151e-06, + "loss": 1.1154, + "step": 9088 + }, + { + "epoch": 0.27, + "learning_rate": 4.260291583196052e-06, + "loss": 1.0812, + "step": 9089 + }, + { + "epoch": 0.27, + "learning_rate": 4.260118371011825e-06, + "loss": 1.1352, + "step": 9090 + }, + { + "epoch": 0.27, + "learning_rate": 4.259945142072119e-06, + "loss": 1.0485, + "step": 9091 + }, + { + "epoch": 0.27, + "learning_rate": 4.259771896378583e-06, + "loss": 1.2093, + "step": 9092 + }, + { + "epoch": 0.27, + "learning_rate": 4.259598633932866e-06, + "loss": 1.2193, + "step": 9093 + }, + { + "epoch": 0.27, + "learning_rate": 4.259425354736617e-06, + "loss": 1.1121, + "step": 9094 + }, + { + "epoch": 0.27, + "learning_rate": 4.259252058791487e-06, + "loss": 1.0425, + "step": 9095 + }, + { + "epoch": 0.27, + "learning_rate": 4.259078746099123e-06, + "loss": 1.1191, + "step": 9096 + }, + { + "epoch": 0.27, + "learning_rate": 4.258905416661178e-06, + "loss": 1.0747, + "step": 9097 + }, + { + "epoch": 0.27, + "learning_rate": 4.2587320704793004e-06, + "loss": 1.1581, + "step": 9098 + }, + { + "epoch": 0.27, + "learning_rate": 4.258558707555141e-06, + "loss": 1.1127, + "step": 9099 + }, + { + "epoch": 0.27, + "learning_rate": 4.258385327890347e-06, + "loss": 1.1089, + "step": 9100 + }, + { + "epoch": 0.27, + "learning_rate": 4.258211931486574e-06, + "loss": 1.0906, + "step": 9101 + }, + { + "epoch": 0.27, + "learning_rate": 4.25803851834547e-06, + "loss": 1.1379, + "step": 9102 + }, + { + "epoch": 0.27, + "learning_rate": 4.257865088468685e-06, + "loss": 1.1351, + "step": 9103 + }, + { + "epoch": 0.27, + "learning_rate": 4.257691641857872e-06, + "loss": 1.3016, + "step": 9104 + }, + { + "epoch": 0.27, + "learning_rate": 4.25751817851468e-06, + "loss": 1.132, + "step": 9105 + }, + { + "epoch": 0.27, + "learning_rate": 4.257344698440763e-06, + "loss": 1.3187, + "step": 9106 + }, + { + "epoch": 0.27, + "learning_rate": 4.257171201637769e-06, + "loss": 1.1719, + "step": 9107 + }, + { + "epoch": 0.27, + "learning_rate": 4.256997688107353e-06, + "loss": 1.0947, + "step": 9108 + }, + { + "epoch": 0.27, + "learning_rate": 4.256824157851165e-06, + "loss": 1.16, + "step": 9109 + }, + { + "epoch": 0.27, + "learning_rate": 4.256650610870856e-06, + "loss": 1.1783, + "step": 9110 + }, + { + "epoch": 0.27, + "learning_rate": 4.25647704716808e-06, + "loss": 1.1891, + "step": 9111 + }, + { + "epoch": 0.27, + "learning_rate": 4.256303466744488e-06, + "loss": 1.1434, + "step": 9112 + }, + { + "epoch": 0.27, + "learning_rate": 4.2561298696017335e-06, + "loss": 1.0225, + "step": 9113 + }, + { + "epoch": 0.27, + "learning_rate": 4.255956255741468e-06, + "loss": 1.1446, + "step": 9114 + }, + { + "epoch": 0.27, + "learning_rate": 4.255782625165344e-06, + "loss": 1.0974, + "step": 9115 + }, + { + "epoch": 0.27, + "learning_rate": 4.255608977875017e-06, + "loss": 1.1227, + "step": 9116 + }, + { + "epoch": 0.27, + "learning_rate": 4.255435313872137e-06, + "loss": 1.1554, + "step": 9117 + }, + { + "epoch": 0.27, + "learning_rate": 4.255261633158358e-06, + "loss": 1.2535, + "step": 9118 + }, + { + "epoch": 0.27, + "learning_rate": 4.255087935735334e-06, + "loss": 1.1719, + "step": 9119 + }, + { + "epoch": 0.27, + "learning_rate": 4.254914221604717e-06, + "loss": 1.1747, + "step": 9120 + }, + { + "epoch": 0.27, + "learning_rate": 4.254740490768163e-06, + "loss": 1.1855, + "step": 9121 + }, + { + "epoch": 0.27, + "learning_rate": 4.254566743227324e-06, + "loss": 1.1934, + "step": 9122 + }, + { + "epoch": 0.27, + "learning_rate": 4.254392978983856e-06, + "loss": 1.1425, + "step": 9123 + }, + { + "epoch": 0.27, + "learning_rate": 4.25421919803941e-06, + "loss": 1.1441, + "step": 9124 + }, + { + "epoch": 0.27, + "learning_rate": 4.254045400395643e-06, + "loss": 1.2937, + "step": 9125 + }, + { + "epoch": 0.27, + "learning_rate": 4.253871586054208e-06, + "loss": 1.1622, + "step": 9126 + }, + { + "epoch": 0.27, + "learning_rate": 4.253697755016761e-06, + "loss": 1.0698, + "step": 9127 + }, + { + "epoch": 0.27, + "learning_rate": 4.253523907284955e-06, + "loss": 1.1245, + "step": 9128 + }, + { + "epoch": 0.28, + "learning_rate": 4.253350042860447e-06, + "loss": 1.1266, + "step": 9129 + }, + { + "epoch": 0.28, + "learning_rate": 4.2531761617448905e-06, + "loss": 1.1508, + "step": 9130 + }, + { + "epoch": 0.28, + "learning_rate": 4.253002263939941e-06, + "loss": 1.0375, + "step": 9131 + }, + { + "epoch": 0.28, + "learning_rate": 4.252828349447254e-06, + "loss": 1.0809, + "step": 9132 + }, + { + "epoch": 0.28, + "learning_rate": 4.252654418268486e-06, + "loss": 1.1693, + "step": 9133 + }, + { + "epoch": 0.28, + "learning_rate": 4.252480470405293e-06, + "loss": 1.1314, + "step": 9134 + }, + { + "epoch": 0.28, + "learning_rate": 4.252306505859329e-06, + "loss": 1.1212, + "step": 9135 + }, + { + "epoch": 0.28, + "learning_rate": 4.25213252463225e-06, + "loss": 1.1931, + "step": 9136 + }, + { + "epoch": 0.28, + "learning_rate": 4.251958526725714e-06, + "loss": 1.2158, + "step": 9137 + }, + { + "epoch": 0.28, + "learning_rate": 4.251784512141377e-06, + "loss": 1.0739, + "step": 9138 + }, + { + "epoch": 0.28, + "learning_rate": 4.251610480880895e-06, + "loss": 1.0658, + "step": 9139 + }, + { + "epoch": 0.28, + "learning_rate": 4.2514364329459246e-06, + "loss": 1.2128, + "step": 9140 + }, + { + "epoch": 0.28, + "learning_rate": 4.251262368338123e-06, + "loss": 1.1531, + "step": 9141 + }, + { + "epoch": 0.28, + "learning_rate": 4.251088287059146e-06, + "loss": 1.1635, + "step": 9142 + }, + { + "epoch": 0.28, + "learning_rate": 4.250914189110653e-06, + "loss": 1.1857, + "step": 9143 + }, + { + "epoch": 0.28, + "learning_rate": 4.250740074494301e-06, + "loss": 1.121, + "step": 9144 + }, + { + "epoch": 0.28, + "learning_rate": 4.250565943211745e-06, + "loss": 1.1317, + "step": 9145 + }, + { + "epoch": 0.28, + "learning_rate": 4.250391795264645e-06, + "loss": 1.1208, + "step": 9146 + }, + { + "epoch": 0.28, + "learning_rate": 4.250217630654658e-06, + "loss": 1.0257, + "step": 9147 + }, + { + "epoch": 0.28, + "learning_rate": 4.250043449383443e-06, + "loss": 1.204, + "step": 9148 + }, + { + "epoch": 0.28, + "learning_rate": 4.249869251452656e-06, + "loss": 1.0646, + "step": 9149 + }, + { + "epoch": 0.28, + "learning_rate": 4.249695036863957e-06, + "loss": 1.13, + "step": 9150 + }, + { + "epoch": 0.28, + "learning_rate": 4.249520805619004e-06, + "loss": 1.173, + "step": 9151 + }, + { + "epoch": 0.28, + "learning_rate": 4.249346557719456e-06, + "loss": 1.1979, + "step": 9152 + }, + { + "epoch": 0.28, + "learning_rate": 4.24917229316697e-06, + "loss": 1.0582, + "step": 9153 + }, + { + "epoch": 0.28, + "learning_rate": 4.248998011963207e-06, + "loss": 1.1412, + "step": 9154 + }, + { + "epoch": 0.28, + "learning_rate": 4.248823714109826e-06, + "loss": 1.2095, + "step": 9155 + }, + { + "epoch": 0.28, + "learning_rate": 4.2486493996084835e-06, + "loss": 1.187, + "step": 9156 + }, + { + "epoch": 0.28, + "learning_rate": 4.2484750684608425e-06, + "loss": 1.1734, + "step": 9157 + }, + { + "epoch": 0.28, + "learning_rate": 4.24830072066856e-06, + "loss": 1.226, + "step": 9158 + }, + { + "epoch": 0.28, + "learning_rate": 4.248126356233298e-06, + "loss": 1.082, + "step": 9159 + }, + { + "epoch": 0.28, + "learning_rate": 4.247951975156714e-06, + "loss": 1.2894, + "step": 9160 + }, + { + "epoch": 0.28, + "learning_rate": 4.247777577440469e-06, + "loss": 1.1021, + "step": 9161 + }, + { + "epoch": 0.28, + "learning_rate": 4.247603163086223e-06, + "loss": 1.3279, + "step": 9162 + }, + { + "epoch": 0.28, + "learning_rate": 4.2474287320956375e-06, + "loss": 1.0712, + "step": 9163 + }, + { + "epoch": 0.28, + "learning_rate": 4.2472542844703715e-06, + "loss": 1.1142, + "step": 9164 + }, + { + "epoch": 0.28, + "learning_rate": 4.2470798202120865e-06, + "loss": 1.1107, + "step": 9165 + }, + { + "epoch": 0.28, + "learning_rate": 4.2469053393224425e-06, + "loss": 1.1257, + "step": 9166 + }, + { + "epoch": 0.28, + "learning_rate": 4.2467308418031015e-06, + "loss": 1.2107, + "step": 9167 + }, + { + "epoch": 0.28, + "learning_rate": 4.246556327655724e-06, + "loss": 1.2349, + "step": 9168 + }, + { + "epoch": 0.28, + "learning_rate": 4.246381796881971e-06, + "loss": 1.1436, + "step": 9169 + }, + { + "epoch": 0.28, + "learning_rate": 4.246207249483505e-06, + "loss": 1.1736, + "step": 9170 + }, + { + "epoch": 0.28, + "learning_rate": 4.246032685461987e-06, + "loss": 1.1826, + "step": 9171 + }, + { + "epoch": 0.28, + "learning_rate": 4.245858104819078e-06, + "loss": 1.2527, + "step": 9172 + }, + { + "epoch": 0.28, + "learning_rate": 4.245683507556442e-06, + "loss": 1.2059, + "step": 9173 + }, + { + "epoch": 0.28, + "learning_rate": 4.2455088936757386e-06, + "loss": 1.2365, + "step": 9174 + }, + { + "epoch": 0.28, + "learning_rate": 4.245334263178632e-06, + "loss": 1.0474, + "step": 9175 + }, + { + "epoch": 0.28, + "learning_rate": 4.245159616066783e-06, + "loss": 1.1465, + "step": 9176 + }, + { + "epoch": 0.28, + "learning_rate": 4.244984952341855e-06, + "loss": 1.1327, + "step": 9177 + }, + { + "epoch": 0.28, + "learning_rate": 4.24481027200551e-06, + "loss": 1.1014, + "step": 9178 + }, + { + "epoch": 0.28, + "learning_rate": 4.244635575059413e-06, + "loss": 1.239, + "step": 9179 + }, + { + "epoch": 0.28, + "learning_rate": 4.2444608615052255e-06, + "loss": 1.124, + "step": 9180 + }, + { + "epoch": 0.28, + "learning_rate": 4.24428613134461e-06, + "loss": 1.1716, + "step": 9181 + }, + { + "epoch": 0.28, + "learning_rate": 4.244111384579231e-06, + "loss": 1.0927, + "step": 9182 + }, + { + "epoch": 0.28, + "learning_rate": 4.243936621210751e-06, + "loss": 1.2324, + "step": 9183 + }, + { + "epoch": 0.28, + "learning_rate": 4.243761841240835e-06, + "loss": 1.2161, + "step": 9184 + }, + { + "epoch": 0.28, + "learning_rate": 4.243587044671147e-06, + "loss": 1.1884, + "step": 9185 + }, + { + "epoch": 0.28, + "learning_rate": 4.243412231503348e-06, + "loss": 1.2113, + "step": 9186 + }, + { + "epoch": 0.28, + "learning_rate": 4.243237401739106e-06, + "loss": 1.2427, + "step": 9187 + }, + { + "epoch": 0.28, + "learning_rate": 4.243062555380082e-06, + "loss": 1.0549, + "step": 9188 + }, + { + "epoch": 0.28, + "learning_rate": 4.2428876924279425e-06, + "loss": 1.0718, + "step": 9189 + }, + { + "epoch": 0.28, + "learning_rate": 4.242712812884353e-06, + "loss": 1.0838, + "step": 9190 + }, + { + "epoch": 0.28, + "learning_rate": 4.242537916750975e-06, + "loss": 1.1429, + "step": 9191 + }, + { + "epoch": 0.28, + "learning_rate": 4.242363004029476e-06, + "loss": 1.1209, + "step": 9192 + }, + { + "epoch": 0.28, + "learning_rate": 4.242188074721521e-06, + "loss": 1.2086, + "step": 9193 + }, + { + "epoch": 0.28, + "learning_rate": 4.242013128828773e-06, + "loss": 1.1818, + "step": 9194 + }, + { + "epoch": 0.28, + "learning_rate": 4.2418381663529e-06, + "loss": 1.1882, + "step": 9195 + }, + { + "epoch": 0.28, + "learning_rate": 4.241663187295566e-06, + "loss": 1.1119, + "step": 9196 + }, + { + "epoch": 0.28, + "learning_rate": 4.241488191658438e-06, + "loss": 1.2108, + "step": 9197 + }, + { + "epoch": 0.28, + "learning_rate": 4.24131317944318e-06, + "loss": 1.1526, + "step": 9198 + }, + { + "epoch": 0.28, + "learning_rate": 4.24113815065146e-06, + "loss": 1.0762, + "step": 9199 + }, + { + "epoch": 0.28, + "learning_rate": 4.240963105284944e-06, + "loss": 1.1628, + "step": 9200 + }, + { + "epoch": 0.28, + "learning_rate": 4.240788043345297e-06, + "loss": 1.1305, + "step": 9201 + }, + { + "epoch": 0.28, + "learning_rate": 4.240612964834186e-06, + "loss": 1.1107, + "step": 9202 + }, + { + "epoch": 0.28, + "learning_rate": 4.240437869753278e-06, + "loss": 1.1479, + "step": 9203 + }, + { + "epoch": 0.28, + "learning_rate": 4.24026275810424e-06, + "loss": 1.1901, + "step": 9204 + }, + { + "epoch": 0.28, + "learning_rate": 4.2400876298887385e-06, + "loss": 1.2133, + "step": 9205 + }, + { + "epoch": 0.28, + "learning_rate": 4.239912485108441e-06, + "loss": 1.2867, + "step": 9206 + }, + { + "epoch": 0.28, + "learning_rate": 4.239737323765014e-06, + "loss": 1.1246, + "step": 9207 + }, + { + "epoch": 0.28, + "learning_rate": 4.239562145860127e-06, + "loss": 1.1573, + "step": 9208 + }, + { + "epoch": 0.28, + "learning_rate": 4.239386951395444e-06, + "loss": 1.0364, + "step": 9209 + }, + { + "epoch": 0.28, + "learning_rate": 4.239211740372637e-06, + "loss": 1.1082, + "step": 9210 + }, + { + "epoch": 0.28, + "learning_rate": 4.239036512793371e-06, + "loss": 1.1174, + "step": 9211 + }, + { + "epoch": 0.28, + "learning_rate": 4.238861268659314e-06, + "loss": 1.1163, + "step": 9212 + }, + { + "epoch": 0.28, + "learning_rate": 4.238686007972137e-06, + "loss": 1.0699, + "step": 9213 + }, + { + "epoch": 0.28, + "learning_rate": 4.238510730733506e-06, + "loss": 1.121, + "step": 9214 + }, + { + "epoch": 0.28, + "learning_rate": 4.238335436945089e-06, + "loss": 1.0043, + "step": 9215 + }, + { + "epoch": 0.28, + "learning_rate": 4.238160126608557e-06, + "loss": 1.1876, + "step": 9216 + }, + { + "epoch": 0.28, + "learning_rate": 4.237984799725577e-06, + "loss": 1.1567, + "step": 9217 + }, + { + "epoch": 0.28, + "learning_rate": 4.23780945629782e-06, + "loss": 1.2299, + "step": 9218 + }, + { + "epoch": 0.28, + "learning_rate": 4.237634096326952e-06, + "loss": 1.0941, + "step": 9219 + }, + { + "epoch": 0.28, + "learning_rate": 4.237458719814646e-06, + "loss": 1.111, + "step": 9220 + }, + { + "epoch": 0.28, + "learning_rate": 4.237283326762569e-06, + "loss": 1.116, + "step": 9221 + }, + { + "epoch": 0.28, + "learning_rate": 4.237107917172392e-06, + "loss": 1.0543, + "step": 9222 + }, + { + "epoch": 0.28, + "learning_rate": 4.236932491045784e-06, + "loss": 1.1297, + "step": 9223 + }, + { + "epoch": 0.28, + "learning_rate": 4.236757048384415e-06, + "loss": 1.134, + "step": 9224 + }, + { + "epoch": 0.28, + "learning_rate": 4.236581589189955e-06, + "loss": 1.0781, + "step": 9225 + }, + { + "epoch": 0.28, + "learning_rate": 4.236406113464075e-06, + "loss": 1.1074, + "step": 9226 + }, + { + "epoch": 0.28, + "learning_rate": 4.236230621208446e-06, + "loss": 1.0931, + "step": 9227 + }, + { + "epoch": 0.28, + "learning_rate": 4.236055112424736e-06, + "loss": 1.1113, + "step": 9228 + }, + { + "epoch": 0.28, + "learning_rate": 4.235879587114619e-06, + "loss": 1.2054, + "step": 9229 + }, + { + "epoch": 0.28, + "learning_rate": 4.235704045279762e-06, + "loss": 1.1447, + "step": 9230 + }, + { + "epoch": 0.28, + "learning_rate": 4.235528486921842e-06, + "loss": 1.082, + "step": 9231 + }, + { + "epoch": 0.28, + "learning_rate": 4.235352912042524e-06, + "loss": 1.0418, + "step": 9232 + }, + { + "epoch": 0.28, + "learning_rate": 4.235177320643483e-06, + "loss": 1.1235, + "step": 9233 + }, + { + "epoch": 0.28, + "learning_rate": 4.235001712726389e-06, + "loss": 1.0194, + "step": 9234 + }, + { + "epoch": 0.28, + "learning_rate": 4.2348260882929144e-06, + "loss": 1.2351, + "step": 9235 + }, + { + "epoch": 0.28, + "learning_rate": 4.234650447344731e-06, + "loss": 1.2191, + "step": 9236 + }, + { + "epoch": 0.28, + "learning_rate": 4.234474789883511e-06, + "loss": 1.2135, + "step": 9237 + }, + { + "epoch": 0.28, + "learning_rate": 4.234299115910927e-06, + "loss": 1.0994, + "step": 9238 + }, + { + "epoch": 0.28, + "learning_rate": 4.23412342542865e-06, + "loss": 1.0598, + "step": 9239 + }, + { + "epoch": 0.28, + "learning_rate": 4.233947718438353e-06, + "loss": 1.0932, + "step": 9240 + }, + { + "epoch": 0.28, + "learning_rate": 4.233771994941709e-06, + "loss": 1.064, + "step": 9241 + }, + { + "epoch": 0.28, + "learning_rate": 4.233596254940391e-06, + "loss": 1.1763, + "step": 9242 + }, + { + "epoch": 0.28, + "learning_rate": 4.233420498436071e-06, + "loss": 0.9941, + "step": 9243 + }, + { + "epoch": 0.28, + "learning_rate": 4.233244725430423e-06, + "loss": 1.0939, + "step": 9244 + }, + { + "epoch": 0.28, + "learning_rate": 4.23306893592512e-06, + "loss": 1.2003, + "step": 9245 + }, + { + "epoch": 0.28, + "learning_rate": 4.232893129921835e-06, + "loss": 1.1528, + "step": 9246 + }, + { + "epoch": 0.28, + "learning_rate": 4.232717307422243e-06, + "loss": 1.1725, + "step": 9247 + }, + { + "epoch": 0.28, + "learning_rate": 4.232541468428016e-06, + "loss": 1.0854, + "step": 9248 + }, + { + "epoch": 0.28, + "learning_rate": 4.232365612940828e-06, + "loss": 1.0851, + "step": 9249 + }, + { + "epoch": 0.28, + "learning_rate": 4.232189740962354e-06, + "loss": 1.1356, + "step": 9250 + }, + { + "epoch": 0.28, + "learning_rate": 4.232013852494269e-06, + "loss": 1.1495, + "step": 9251 + }, + { + "epoch": 0.28, + "learning_rate": 4.231837947538246e-06, + "loss": 1.1627, + "step": 9252 + }, + { + "epoch": 0.28, + "learning_rate": 4.231662026095958e-06, + "loss": 1.2831, + "step": 9253 + }, + { + "epoch": 0.28, + "learning_rate": 4.2314860881690834e-06, + "loss": 1.0365, + "step": 9254 + }, + { + "epoch": 0.28, + "learning_rate": 4.231310133759295e-06, + "loss": 1.231, + "step": 9255 + }, + { + "epoch": 0.28, + "learning_rate": 4.231134162868267e-06, + "loss": 1.1218, + "step": 9256 + }, + { + "epoch": 0.28, + "learning_rate": 4.230958175497677e-06, + "loss": 1.1967, + "step": 9257 + }, + { + "epoch": 0.28, + "learning_rate": 4.230782171649197e-06, + "loss": 1.032, + "step": 9258 + }, + { + "epoch": 0.28, + "learning_rate": 4.2306061513245065e-06, + "loss": 1.1338, + "step": 9259 + }, + { + "epoch": 0.28, + "learning_rate": 4.230430114525277e-06, + "loss": 1.0325, + "step": 9260 + }, + { + "epoch": 0.28, + "learning_rate": 4.2302540612531876e-06, + "loss": 1.2405, + "step": 9261 + }, + { + "epoch": 0.28, + "learning_rate": 4.230077991509911e-06, + "loss": 1.1255, + "step": 9262 + }, + { + "epoch": 0.28, + "learning_rate": 4.229901905297127e-06, + "loss": 1.1481, + "step": 9263 + }, + { + "epoch": 0.28, + "learning_rate": 4.229725802616509e-06, + "loss": 1.1282, + "step": 9264 + }, + { + "epoch": 0.28, + "learning_rate": 4.229549683469735e-06, + "loss": 1.1775, + "step": 9265 + }, + { + "epoch": 0.28, + "learning_rate": 4.229373547858481e-06, + "loss": 1.2146, + "step": 9266 + }, + { + "epoch": 0.28, + "learning_rate": 4.229197395784424e-06, + "loss": 1.1249, + "step": 9267 + }, + { + "epoch": 0.28, + "learning_rate": 4.229021227249239e-06, + "loss": 1.2414, + "step": 9268 + }, + { + "epoch": 0.28, + "learning_rate": 4.228845042254606e-06, + "loss": 1.1911, + "step": 9269 + }, + { + "epoch": 0.28, + "learning_rate": 4.228668840802201e-06, + "loss": 1.2068, + "step": 9270 + }, + { + "epoch": 0.28, + "learning_rate": 4.2284926228937e-06, + "loss": 1.0913, + "step": 9271 + }, + { + "epoch": 0.28, + "learning_rate": 4.228316388530783e-06, + "loss": 1.1805, + "step": 9272 + }, + { + "epoch": 0.28, + "learning_rate": 4.228140137715126e-06, + "loss": 1.0383, + "step": 9273 + }, + { + "epoch": 0.28, + "learning_rate": 4.227963870448406e-06, + "loss": 1.0829, + "step": 9274 + }, + { + "epoch": 0.28, + "learning_rate": 4.227787586732304e-06, + "loss": 1.1855, + "step": 9275 + }, + { + "epoch": 0.28, + "learning_rate": 4.227611286568495e-06, + "loss": 1.1298, + "step": 9276 + }, + { + "epoch": 0.28, + "learning_rate": 4.227434969958659e-06, + "loss": 1.0814, + "step": 9277 + }, + { + "epoch": 0.28, + "learning_rate": 4.227258636904474e-06, + "loss": 1.113, + "step": 9278 + }, + { + "epoch": 0.28, + "learning_rate": 4.227082287407619e-06, + "loss": 1.2649, + "step": 9279 + }, + { + "epoch": 0.28, + "learning_rate": 4.226905921469772e-06, + "loss": 1.1146, + "step": 9280 + }, + { + "epoch": 0.28, + "learning_rate": 4.226729539092613e-06, + "loss": 1.1687, + "step": 9281 + }, + { + "epoch": 0.28, + "learning_rate": 4.226553140277819e-06, + "loss": 1.0172, + "step": 9282 + }, + { + "epoch": 0.28, + "learning_rate": 4.226376725027072e-06, + "loss": 1.1956, + "step": 9283 + }, + { + "epoch": 0.28, + "learning_rate": 4.22620029334205e-06, + "loss": 1.1105, + "step": 9284 + }, + { + "epoch": 0.28, + "learning_rate": 4.226023845224431e-06, + "loss": 1.1999, + "step": 9285 + }, + { + "epoch": 0.28, + "learning_rate": 4.225847380675898e-06, + "loss": 1.1483, + "step": 9286 + }, + { + "epoch": 0.28, + "learning_rate": 4.225670899698128e-06, + "loss": 1.2228, + "step": 9287 + }, + { + "epoch": 0.28, + "learning_rate": 4.2254944022928035e-06, + "loss": 1.1511, + "step": 9288 + }, + { + "epoch": 0.28, + "learning_rate": 4.225317888461602e-06, + "loss": 1.2206, + "step": 9289 + }, + { + "epoch": 0.28, + "learning_rate": 4.225141358206206e-06, + "loss": 1.1255, + "step": 9290 + }, + { + "epoch": 0.28, + "learning_rate": 4.224964811528295e-06, + "loss": 1.1154, + "step": 9291 + }, + { + "epoch": 0.28, + "learning_rate": 4.22478824842955e-06, + "loss": 1.0958, + "step": 9292 + }, + { + "epoch": 0.28, + "learning_rate": 4.22461166891165e-06, + "loss": 1.1422, + "step": 9293 + }, + { + "epoch": 0.28, + "learning_rate": 4.22443507297628e-06, + "loss": 1.0963, + "step": 9294 + }, + { + "epoch": 0.28, + "learning_rate": 4.224258460625117e-06, + "loss": 1.3002, + "step": 9295 + }, + { + "epoch": 0.28, + "learning_rate": 4.224081831859844e-06, + "loss": 1.0966, + "step": 9296 + }, + { + "epoch": 0.28, + "learning_rate": 4.223905186682142e-06, + "loss": 1.1785, + "step": 9297 + }, + { + "epoch": 0.28, + "learning_rate": 4.223728525093694e-06, + "loss": 1.1704, + "step": 9298 + }, + { + "epoch": 0.28, + "learning_rate": 4.22355184709618e-06, + "loss": 1.131, + "step": 9299 + }, + { + "epoch": 0.28, + "learning_rate": 4.223375152691283e-06, + "loss": 1.178, + "step": 9300 + }, + { + "epoch": 0.28, + "learning_rate": 4.223198441880683e-06, + "loss": 1.078, + "step": 9301 + }, + { + "epoch": 0.28, + "learning_rate": 4.223021714666064e-06, + "loss": 1.1912, + "step": 9302 + }, + { + "epoch": 0.28, + "learning_rate": 4.2228449710491095e-06, + "loss": 1.0383, + "step": 9303 + }, + { + "epoch": 0.28, + "learning_rate": 4.2226682110315e-06, + "loss": 1.1554, + "step": 9304 + }, + { + "epoch": 0.28, + "learning_rate": 4.2224914346149195e-06, + "loss": 1.2576, + "step": 9305 + }, + { + "epoch": 0.28, + "learning_rate": 4.2223146418010495e-06, + "loss": 1.1466, + "step": 9306 + }, + { + "epoch": 0.28, + "learning_rate": 4.222137832591573e-06, + "loss": 1.0541, + "step": 9307 + }, + { + "epoch": 0.28, + "learning_rate": 4.221961006988175e-06, + "loss": 1.1116, + "step": 9308 + }, + { + "epoch": 0.28, + "learning_rate": 4.221784164992536e-06, + "loss": 0.9911, + "step": 9309 + }, + { + "epoch": 0.28, + "learning_rate": 4.221607306606342e-06, + "loss": 1.0479, + "step": 9310 + }, + { + "epoch": 0.28, + "learning_rate": 4.221430431831276e-06, + "loss": 1.2207, + "step": 9311 + }, + { + "epoch": 0.28, + "learning_rate": 4.221253540669021e-06, + "loss": 1.1879, + "step": 9312 + }, + { + "epoch": 0.28, + "learning_rate": 4.221076633121261e-06, + "loss": 1.1925, + "step": 9313 + }, + { + "epoch": 0.28, + "learning_rate": 4.22089970918968e-06, + "loss": 1.1411, + "step": 9314 + }, + { + "epoch": 0.28, + "learning_rate": 4.220722768875962e-06, + "loss": 0.9876, + "step": 9315 + }, + { + "epoch": 0.28, + "learning_rate": 4.220545812181794e-06, + "loss": 1.1955, + "step": 9316 + }, + { + "epoch": 0.28, + "learning_rate": 4.220368839108857e-06, + "loss": 1.1343, + "step": 9317 + }, + { + "epoch": 0.28, + "learning_rate": 4.220191849658838e-06, + "loss": 1.2232, + "step": 9318 + }, + { + "epoch": 0.28, + "learning_rate": 4.22001484383342e-06, + "loss": 1.1001, + "step": 9319 + }, + { + "epoch": 0.28, + "learning_rate": 4.21983782163429e-06, + "loss": 1.0305, + "step": 9320 + }, + { + "epoch": 0.28, + "learning_rate": 4.219660783063132e-06, + "loss": 1.1042, + "step": 9321 + }, + { + "epoch": 0.28, + "learning_rate": 4.2194837281216325e-06, + "loss": 1.0952, + "step": 9322 + }, + { + "epoch": 0.28, + "learning_rate": 4.2193066568114745e-06, + "loss": 1.1996, + "step": 9323 + }, + { + "epoch": 0.28, + "learning_rate": 4.219129569134346e-06, + "loss": 1.1866, + "step": 9324 + }, + { + "epoch": 0.28, + "learning_rate": 4.2189524650919315e-06, + "loss": 1.1452, + "step": 9325 + }, + { + "epoch": 0.28, + "learning_rate": 4.2187753446859185e-06, + "loss": 1.1379, + "step": 9326 + }, + { + "epoch": 0.28, + "learning_rate": 4.218598207917991e-06, + "loss": 1.2549, + "step": 9327 + }, + { + "epoch": 0.28, + "learning_rate": 4.218421054789837e-06, + "loss": 1.1848, + "step": 9328 + }, + { + "epoch": 0.28, + "learning_rate": 4.218243885303141e-06, + "loss": 1.172, + "step": 9329 + }, + { + "epoch": 0.28, + "learning_rate": 4.218066699459591e-06, + "loss": 1.3326, + "step": 9330 + }, + { + "epoch": 0.28, + "learning_rate": 4.2178894972608745e-06, + "loss": 1.2382, + "step": 9331 + }, + { + "epoch": 0.28, + "learning_rate": 4.217712278708676e-06, + "loss": 1.1544, + "step": 9332 + }, + { + "epoch": 0.28, + "learning_rate": 4.217535043804685e-06, + "loss": 1.1927, + "step": 9333 + }, + { + "epoch": 0.28, + "learning_rate": 4.217357792550587e-06, + "loss": 1.0485, + "step": 9334 + }, + { + "epoch": 0.28, + "learning_rate": 4.2171805249480705e-06, + "loss": 1.0505, + "step": 9335 + }, + { + "epoch": 0.28, + "learning_rate": 4.217003240998822e-06, + "loss": 1.162, + "step": 9336 + }, + { + "epoch": 0.28, + "learning_rate": 4.2168259407045295e-06, + "loss": 1.2578, + "step": 9337 + }, + { + "epoch": 0.28, + "learning_rate": 4.216648624066881e-06, + "loss": 1.1629, + "step": 9338 + }, + { + "epoch": 0.28, + "learning_rate": 4.216471291087564e-06, + "loss": 1.0748, + "step": 9339 + }, + { + "epoch": 0.28, + "learning_rate": 4.216293941768267e-06, + "loss": 1.1076, + "step": 9340 + }, + { + "epoch": 0.28, + "learning_rate": 4.216116576110679e-06, + "loss": 1.1149, + "step": 9341 + }, + { + "epoch": 0.28, + "learning_rate": 4.215939194116488e-06, + "loss": 1.0906, + "step": 9342 + }, + { + "epoch": 0.28, + "learning_rate": 4.215761795787381e-06, + "loss": 1.129, + "step": 9343 + }, + { + "epoch": 0.28, + "learning_rate": 4.215584381125048e-06, + "loss": 1.1742, + "step": 9344 + }, + { + "epoch": 0.28, + "learning_rate": 4.215406950131179e-06, + "loss": 1.1781, + "step": 9345 + }, + { + "epoch": 0.28, + "learning_rate": 4.215229502807462e-06, + "loss": 1.1214, + "step": 9346 + }, + { + "epoch": 0.28, + "learning_rate": 4.215052039155586e-06, + "loss": 1.2596, + "step": 9347 + }, + { + "epoch": 0.28, + "learning_rate": 4.21487455917724e-06, + "loss": 1.204, + "step": 9348 + }, + { + "epoch": 0.28, + "learning_rate": 4.2146970628741145e-06, + "loss": 1.1741, + "step": 9349 + }, + { + "epoch": 0.28, + "learning_rate": 4.2145195502478995e-06, + "loss": 1.0093, + "step": 9350 + }, + { + "epoch": 0.28, + "learning_rate": 4.214342021300283e-06, + "loss": 1.1036, + "step": 9351 + }, + { + "epoch": 0.28, + "learning_rate": 4.214164476032957e-06, + "loss": 1.2675, + "step": 9352 + }, + { + "epoch": 0.28, + "learning_rate": 4.21398691444761e-06, + "loss": 1.2101, + "step": 9353 + }, + { + "epoch": 0.28, + "learning_rate": 4.213809336545933e-06, + "loss": 1.1755, + "step": 9354 + }, + { + "epoch": 0.28, + "learning_rate": 4.213631742329617e-06, + "loss": 1.1916, + "step": 9355 + }, + { + "epoch": 0.28, + "learning_rate": 4.213454131800352e-06, + "loss": 1.1865, + "step": 9356 + }, + { + "epoch": 0.28, + "learning_rate": 4.213276504959829e-06, + "loss": 1.0928, + "step": 9357 + }, + { + "epoch": 0.28, + "learning_rate": 4.213098861809739e-06, + "loss": 1.1315, + "step": 9358 + }, + { + "epoch": 0.28, + "learning_rate": 4.212921202351772e-06, + "loss": 1.1472, + "step": 9359 + }, + { + "epoch": 0.28, + "learning_rate": 4.212743526587621e-06, + "loss": 1.1476, + "step": 9360 + }, + { + "epoch": 0.28, + "learning_rate": 4.212565834518977e-06, + "loss": 1.1639, + "step": 9361 + }, + { + "epoch": 0.28, + "learning_rate": 4.2123881261475294e-06, + "loss": 1.3049, + "step": 9362 + }, + { + "epoch": 0.28, + "learning_rate": 4.212210401474973e-06, + "loss": 1.113, + "step": 9363 + }, + { + "epoch": 0.28, + "learning_rate": 4.212032660502997e-06, + "loss": 1.1938, + "step": 9364 + }, + { + "epoch": 0.28, + "learning_rate": 4.211854903233296e-06, + "loss": 1.1043, + "step": 9365 + }, + { + "epoch": 0.28, + "learning_rate": 4.2116771296675596e-06, + "loss": 1.1241, + "step": 9366 + }, + { + "epoch": 0.28, + "learning_rate": 4.211499339807482e-06, + "loss": 1.1664, + "step": 9367 + }, + { + "epoch": 0.28, + "learning_rate": 4.211321533654755e-06, + "loss": 1.1418, + "step": 9368 + }, + { + "epoch": 0.28, + "learning_rate": 4.2111437112110705e-06, + "loss": 1.0926, + "step": 9369 + }, + { + "epoch": 0.28, + "learning_rate": 4.210965872478122e-06, + "loss": 1.0731, + "step": 9370 + }, + { + "epoch": 0.28, + "learning_rate": 4.210788017457603e-06, + "loss": 1.1329, + "step": 9371 + }, + { + "epoch": 0.28, + "learning_rate": 4.2106101461512065e-06, + "loss": 1.131, + "step": 9372 + }, + { + "epoch": 0.28, + "learning_rate": 4.210432258560624e-06, + "loss": 1.0995, + "step": 9373 + }, + { + "epoch": 0.28, + "learning_rate": 4.210254354687551e-06, + "loss": 1.1938, + "step": 9374 + }, + { + "epoch": 0.28, + "learning_rate": 4.2100764345336795e-06, + "loss": 1.0823, + "step": 9375 + }, + { + "epoch": 0.28, + "learning_rate": 4.209898498100705e-06, + "loss": 1.1559, + "step": 9376 + }, + { + "epoch": 0.28, + "learning_rate": 4.20972054539032e-06, + "loss": 1.0825, + "step": 9377 + }, + { + "epoch": 0.28, + "learning_rate": 4.209542576404219e-06, + "loss": 1.1638, + "step": 9378 + }, + { + "epoch": 0.28, + "learning_rate": 4.209364591144095e-06, + "loss": 1.2162, + "step": 9379 + }, + { + "epoch": 0.28, + "learning_rate": 4.209186589611644e-06, + "loss": 1.2809, + "step": 9380 + }, + { + "epoch": 0.28, + "learning_rate": 4.2090085718085596e-06, + "loss": 1.0204, + "step": 9381 + }, + { + "epoch": 0.28, + "learning_rate": 4.208830537736537e-06, + "loss": 1.2515, + "step": 9382 + }, + { + "epoch": 0.28, + "learning_rate": 4.208652487397271e-06, + "loss": 1.1735, + "step": 9383 + }, + { + "epoch": 0.28, + "learning_rate": 4.208474420792456e-06, + "loss": 1.1054, + "step": 9384 + }, + { + "epoch": 0.28, + "learning_rate": 4.208296337923787e-06, + "loss": 1.1937, + "step": 9385 + }, + { + "epoch": 0.28, + "learning_rate": 4.208118238792959e-06, + "loss": 1.1417, + "step": 9386 + }, + { + "epoch": 0.28, + "learning_rate": 4.207940123401669e-06, + "loss": 1.2353, + "step": 9387 + }, + { + "epoch": 0.28, + "learning_rate": 4.207761991751612e-06, + "loss": 1.1452, + "step": 9388 + }, + { + "epoch": 0.28, + "learning_rate": 4.207583843844483e-06, + "loss": 1.1753, + "step": 9389 + }, + { + "epoch": 0.28, + "learning_rate": 4.207405679681977e-06, + "loss": 1.0776, + "step": 9390 + }, + { + "epoch": 0.28, + "learning_rate": 4.207227499265792e-06, + "loss": 1.2309, + "step": 9391 + }, + { + "epoch": 0.28, + "learning_rate": 4.207049302597624e-06, + "loss": 1.1735, + "step": 9392 + }, + { + "epoch": 0.28, + "learning_rate": 4.206871089679169e-06, + "loss": 1.2926, + "step": 9393 + }, + { + "epoch": 0.28, + "learning_rate": 4.206692860512122e-06, + "loss": 1.1183, + "step": 9394 + }, + { + "epoch": 0.28, + "learning_rate": 4.206514615098182e-06, + "loss": 1.1786, + "step": 9395 + }, + { + "epoch": 0.28, + "learning_rate": 4.206336353439044e-06, + "loss": 1.0602, + "step": 9396 + }, + { + "epoch": 0.28, + "learning_rate": 4.206158075536407e-06, + "loss": 1.1582, + "step": 9397 + }, + { + "epoch": 0.28, + "learning_rate": 4.205979781391965e-06, + "loss": 1.1841, + "step": 9398 + }, + { + "epoch": 0.28, + "learning_rate": 4.205801471007418e-06, + "loss": 1.2051, + "step": 9399 + }, + { + "epoch": 0.28, + "learning_rate": 4.205623144384463e-06, + "loss": 1.0283, + "step": 9400 + }, + { + "epoch": 0.28, + "learning_rate": 4.205444801524796e-06, + "loss": 1.1307, + "step": 9401 + }, + { + "epoch": 0.28, + "learning_rate": 4.205266442430117e-06, + "loss": 1.145, + "step": 9402 + }, + { + "epoch": 0.28, + "learning_rate": 4.205088067102122e-06, + "loss": 1.0811, + "step": 9403 + }, + { + "epoch": 0.28, + "learning_rate": 4.204909675542511e-06, + "loss": 1.0684, + "step": 9404 + }, + { + "epoch": 0.28, + "learning_rate": 4.20473126775298e-06, + "loss": 1.1929, + "step": 9405 + }, + { + "epoch": 0.28, + "learning_rate": 4.204552843735228e-06, + "loss": 1.2535, + "step": 9406 + }, + { + "epoch": 0.28, + "learning_rate": 4.204374403490954e-06, + "loss": 1.0959, + "step": 9407 + }, + { + "epoch": 0.28, + "learning_rate": 4.204195947021857e-06, + "loss": 1.2095, + "step": 9408 + }, + { + "epoch": 0.28, + "learning_rate": 4.204017474329635e-06, + "loss": 1.043, + "step": 9409 + }, + { + "epoch": 0.28, + "learning_rate": 4.203838985415988e-06, + "loss": 1.2493, + "step": 9410 + }, + { + "epoch": 0.28, + "learning_rate": 4.203660480282614e-06, + "loss": 1.1151, + "step": 9411 + }, + { + "epoch": 0.28, + "learning_rate": 4.203481958931212e-06, + "loss": 1.1368, + "step": 9412 + }, + { + "epoch": 0.28, + "learning_rate": 4.2033034213634835e-06, + "loss": 1.3265, + "step": 9413 + }, + { + "epoch": 0.28, + "learning_rate": 4.203124867581126e-06, + "loss": 1.1797, + "step": 9414 + }, + { + "epoch": 0.28, + "learning_rate": 4.202946297585841e-06, + "loss": 1.0826, + "step": 9415 + }, + { + "epoch": 0.28, + "learning_rate": 4.202767711379326e-06, + "loss": 1.1241, + "step": 9416 + }, + { + "epoch": 0.28, + "learning_rate": 4.202589108963283e-06, + "loss": 1.2066, + "step": 9417 + }, + { + "epoch": 0.28, + "learning_rate": 4.2024104903394115e-06, + "loss": 1.1207, + "step": 9418 + }, + { + "epoch": 0.28, + "learning_rate": 4.202231855509413e-06, + "loss": 1.1179, + "step": 9419 + }, + { + "epoch": 0.28, + "learning_rate": 4.202053204474986e-06, + "loss": 1.1418, + "step": 9420 + }, + { + "epoch": 0.28, + "learning_rate": 4.201874537237832e-06, + "loss": 1.1542, + "step": 9421 + }, + { + "epoch": 0.28, + "learning_rate": 4.201695853799653e-06, + "loss": 1.1761, + "step": 9422 + }, + { + "epoch": 0.28, + "learning_rate": 4.201517154162149e-06, + "loss": 1.093, + "step": 9423 + }, + { + "epoch": 0.28, + "learning_rate": 4.201338438327021e-06, + "loss": 1.1858, + "step": 9424 + }, + { + "epoch": 0.28, + "learning_rate": 4.20115970629597e-06, + "loss": 1.1263, + "step": 9425 + }, + { + "epoch": 0.28, + "learning_rate": 4.200980958070698e-06, + "loss": 1.1528, + "step": 9426 + }, + { + "epoch": 0.28, + "learning_rate": 4.200802193652906e-06, + "loss": 1.0629, + "step": 9427 + }, + { + "epoch": 0.28, + "learning_rate": 4.200623413044298e-06, + "loss": 1.1146, + "step": 9428 + }, + { + "epoch": 0.28, + "learning_rate": 4.200444616246573e-06, + "loss": 1.1406, + "step": 9429 + }, + { + "epoch": 0.28, + "learning_rate": 4.200265803261434e-06, + "loss": 1.2198, + "step": 9430 + }, + { + "epoch": 0.28, + "learning_rate": 4.200086974090584e-06, + "loss": 1.0417, + "step": 9431 + }, + { + "epoch": 0.28, + "learning_rate": 4.199908128735724e-06, + "loss": 1.1625, + "step": 9432 + }, + { + "epoch": 0.28, + "learning_rate": 4.199729267198558e-06, + "loss": 1.1258, + "step": 9433 + }, + { + "epoch": 0.28, + "learning_rate": 4.1995503894807885e-06, + "loss": 1.0349, + "step": 9434 + }, + { + "epoch": 0.28, + "learning_rate": 4.199371495584117e-06, + "loss": 1.1698, + "step": 9435 + }, + { + "epoch": 0.28, + "learning_rate": 4.199192585510248e-06, + "loss": 1.1289, + "step": 9436 + }, + { + "epoch": 0.28, + "learning_rate": 4.199013659260883e-06, + "loss": 1.1688, + "step": 9437 + }, + { + "epoch": 0.28, + "learning_rate": 4.198834716837726e-06, + "loss": 1.1608, + "step": 9438 + }, + { + "epoch": 0.28, + "learning_rate": 4.198655758242482e-06, + "loss": 1.1514, + "step": 9439 + }, + { + "epoch": 0.28, + "learning_rate": 4.198476783476852e-06, + "loss": 1.1687, + "step": 9440 + }, + { + "epoch": 0.28, + "learning_rate": 4.198297792542542e-06, + "loss": 1.0858, + "step": 9441 + }, + { + "epoch": 0.28, + "learning_rate": 4.1981187854412546e-06, + "loss": 1.1406, + "step": 9442 + }, + { + "epoch": 0.28, + "learning_rate": 4.197939762174694e-06, + "loss": 1.0507, + "step": 9443 + }, + { + "epoch": 0.28, + "learning_rate": 4.197760722744565e-06, + "loss": 1.0811, + "step": 9444 + }, + { + "epoch": 0.28, + "learning_rate": 4.197581667152572e-06, + "loss": 1.0782, + "step": 9445 + }, + { + "epoch": 0.28, + "learning_rate": 4.197402595400418e-06, + "loss": 1.1497, + "step": 9446 + }, + { + "epoch": 0.28, + "learning_rate": 4.1972235074898096e-06, + "loss": 1.1617, + "step": 9447 + }, + { + "epoch": 0.28, + "learning_rate": 4.197044403422451e-06, + "loss": 1.0606, + "step": 9448 + }, + { + "epoch": 0.28, + "learning_rate": 4.196865283200045e-06, + "loss": 1.2279, + "step": 9449 + }, + { + "epoch": 0.28, + "learning_rate": 4.1966861468243015e-06, + "loss": 1.0059, + "step": 9450 + }, + { + "epoch": 0.28, + "learning_rate": 4.196506994296922e-06, + "loss": 1.1204, + "step": 9451 + }, + { + "epoch": 0.28, + "learning_rate": 4.196327825619613e-06, + "loss": 1.1208, + "step": 9452 + }, + { + "epoch": 0.28, + "learning_rate": 4.19614864079408e-06, + "loss": 1.2125, + "step": 9453 + }, + { + "epoch": 0.28, + "learning_rate": 4.1959694398220285e-06, + "loss": 1.1949, + "step": 9454 + }, + { + "epoch": 0.28, + "learning_rate": 4.195790222705165e-06, + "loss": 1.1937, + "step": 9455 + }, + { + "epoch": 0.28, + "learning_rate": 4.1956109894451955e-06, + "loss": 1.1432, + "step": 9456 + }, + { + "epoch": 0.28, + "learning_rate": 4.195431740043825e-06, + "loss": 1.0774, + "step": 9457 + }, + { + "epoch": 0.28, + "learning_rate": 4.195252474502762e-06, + "loss": 1.2306, + "step": 9458 + }, + { + "epoch": 0.28, + "learning_rate": 4.195073192823712e-06, + "loss": 1.0118, + "step": 9459 + }, + { + "epoch": 0.28, + "learning_rate": 4.19489389500838e-06, + "loss": 1.1194, + "step": 9460 + }, + { + "epoch": 0.29, + "learning_rate": 4.194714581058476e-06, + "loss": 1.1392, + "step": 9461 + }, + { + "epoch": 0.29, + "learning_rate": 4.194535250975706e-06, + "loss": 1.0731, + "step": 9462 + }, + { + "epoch": 0.29, + "learning_rate": 4.194355904761774e-06, + "loss": 1.1678, + "step": 9463 + }, + { + "epoch": 0.29, + "learning_rate": 4.194176542418392e-06, + "loss": 1.1537, + "step": 9464 + }, + { + "epoch": 0.29, + "learning_rate": 4.193997163947264e-06, + "loss": 1.1704, + "step": 9465 + }, + { + "epoch": 0.29, + "learning_rate": 4.1938177693501e-06, + "loss": 1.2239, + "step": 9466 + }, + { + "epoch": 0.29, + "learning_rate": 4.193638358628606e-06, + "loss": 1.1154, + "step": 9467 + }, + { + "epoch": 0.29, + "learning_rate": 4.1934589317844905e-06, + "loss": 1.1178, + "step": 9468 + }, + { + "epoch": 0.29, + "learning_rate": 4.1932794888194615e-06, + "loss": 1.0642, + "step": 9469 + }, + { + "epoch": 0.29, + "learning_rate": 4.193100029735228e-06, + "loss": 1.1411, + "step": 9470 + }, + { + "epoch": 0.29, + "learning_rate": 4.192920554533497e-06, + "loss": 1.1266, + "step": 9471 + }, + { + "epoch": 0.29, + "learning_rate": 4.192741063215977e-06, + "loss": 1.1064, + "step": 9472 + }, + { + "epoch": 0.29, + "learning_rate": 4.192561555784378e-06, + "loss": 1.2555, + "step": 9473 + }, + { + "epoch": 0.29, + "learning_rate": 4.192382032240408e-06, + "loss": 1.1526, + "step": 9474 + }, + { + "epoch": 0.29, + "learning_rate": 4.192202492585776e-06, + "loss": 1.1285, + "step": 9475 + }, + { + "epoch": 0.29, + "learning_rate": 4.192022936822192e-06, + "loss": 1.1467, + "step": 9476 + }, + { + "epoch": 0.29, + "learning_rate": 4.191843364951364e-06, + "loss": 1.0939, + "step": 9477 + }, + { + "epoch": 0.29, + "learning_rate": 4.191663776975003e-06, + "loss": 1.1002, + "step": 9478 + }, + { + "epoch": 0.29, + "learning_rate": 4.191484172894816e-06, + "loss": 1.1748, + "step": 9479 + }, + { + "epoch": 0.29, + "learning_rate": 4.191304552712515e-06, + "loss": 1.1797, + "step": 9480 + }, + { + "epoch": 0.29, + "learning_rate": 4.19112491642981e-06, + "loss": 1.0906, + "step": 9481 + }, + { + "epoch": 0.29, + "learning_rate": 4.190945264048409e-06, + "loss": 1.2166, + "step": 9482 + }, + { + "epoch": 0.29, + "learning_rate": 4.190765595570023e-06, + "loss": 1.1394, + "step": 9483 + }, + { + "epoch": 0.29, + "learning_rate": 4.190585910996364e-06, + "loss": 1.1016, + "step": 9484 + }, + { + "epoch": 0.29, + "learning_rate": 4.190406210329142e-06, + "loss": 1.0838, + "step": 9485 + }, + { + "epoch": 0.29, + "learning_rate": 4.1902264935700654e-06, + "loss": 1.2679, + "step": 9486 + }, + { + "epoch": 0.29, + "learning_rate": 4.190046760720847e-06, + "loss": 1.2755, + "step": 9487 + }, + { + "epoch": 0.29, + "learning_rate": 4.189867011783198e-06, + "loss": 1.212, + "step": 9488 + }, + { + "epoch": 0.29, + "learning_rate": 4.189687246758829e-06, + "loss": 1.1346, + "step": 9489 + }, + { + "epoch": 0.29, + "learning_rate": 4.18950746564945e-06, + "loss": 1.1402, + "step": 9490 + }, + { + "epoch": 0.29, + "learning_rate": 4.189327668456775e-06, + "loss": 1.1199, + "step": 9491 + }, + { + "epoch": 0.29, + "learning_rate": 4.1891478551825135e-06, + "loss": 1.2639, + "step": 9492 + }, + { + "epoch": 0.29, + "learning_rate": 4.188968025828379e-06, + "loss": 1.2617, + "step": 9493 + }, + { + "epoch": 0.29, + "learning_rate": 4.188788180396081e-06, + "loss": 1.1759, + "step": 9494 + }, + { + "epoch": 0.29, + "learning_rate": 4.188608318887333e-06, + "loss": 1.1495, + "step": 9495 + }, + { + "epoch": 0.29, + "learning_rate": 4.188428441303848e-06, + "loss": 1.138, + "step": 9496 + }, + { + "epoch": 0.29, + "learning_rate": 4.1882485476473365e-06, + "loss": 1.1138, + "step": 9497 + }, + { + "epoch": 0.29, + "learning_rate": 4.188068637919512e-06, + "loss": 1.2137, + "step": 9498 + }, + { + "epoch": 0.29, + "learning_rate": 4.187888712122088e-06, + "loss": 1.2172, + "step": 9499 + }, + { + "epoch": 0.29, + "learning_rate": 4.1877087702567755e-06, + "loss": 1.1246, + "step": 9500 + }, + { + "epoch": 0.29, + "learning_rate": 4.187528812325288e-06, + "loss": 1.1843, + "step": 9501 + }, + { + "epoch": 0.29, + "learning_rate": 4.187348838329339e-06, + "loss": 1.1258, + "step": 9502 + }, + { + "epoch": 0.29, + "learning_rate": 4.187168848270642e-06, + "loss": 1.0752, + "step": 9503 + }, + { + "epoch": 0.29, + "learning_rate": 4.186988842150911e-06, + "loss": 1.198, + "step": 9504 + }, + { + "epoch": 0.29, + "learning_rate": 4.186808819971858e-06, + "loss": 1.2917, + "step": 9505 + }, + { + "epoch": 0.29, + "learning_rate": 4.1866287817351975e-06, + "loss": 1.105, + "step": 9506 + }, + { + "epoch": 0.29, + "learning_rate": 4.186448727442643e-06, + "loss": 1.0679, + "step": 9507 + }, + { + "epoch": 0.29, + "learning_rate": 4.186268657095909e-06, + "loss": 1.1721, + "step": 9508 + }, + { + "epoch": 0.29, + "learning_rate": 4.1860885706967095e-06, + "loss": 1.1388, + "step": 9509 + }, + { + "epoch": 0.29, + "learning_rate": 4.185908468246759e-06, + "loss": 1.0605, + "step": 9510 + }, + { + "epoch": 0.29, + "learning_rate": 4.1857283497477715e-06, + "loss": 1.0897, + "step": 9511 + }, + { + "epoch": 0.29, + "learning_rate": 4.185548215201463e-06, + "loss": 1.1776, + "step": 9512 + }, + { + "epoch": 0.29, + "learning_rate": 4.185368064609546e-06, + "loss": 1.1985, + "step": 9513 + }, + { + "epoch": 0.29, + "learning_rate": 4.185187897973738e-06, + "loss": 1.0872, + "step": 9514 + }, + { + "epoch": 0.29, + "learning_rate": 4.185007715295752e-06, + "loss": 1.0969, + "step": 9515 + }, + { + "epoch": 0.29, + "learning_rate": 4.184827516577303e-06, + "loss": 1.1403, + "step": 9516 + }, + { + "epoch": 0.29, + "learning_rate": 4.184647301820109e-06, + "loss": 1.1327, + "step": 9517 + }, + { + "epoch": 0.29, + "learning_rate": 4.184467071025884e-06, + "loss": 1.1823, + "step": 9518 + }, + { + "epoch": 0.29, + "learning_rate": 4.1842868241963435e-06, + "loss": 1.1401, + "step": 9519 + }, + { + "epoch": 0.29, + "learning_rate": 4.184106561333203e-06, + "loss": 1.1782, + "step": 9520 + }, + { + "epoch": 0.29, + "learning_rate": 4.18392628243818e-06, + "loss": 1.1351, + "step": 9521 + }, + { + "epoch": 0.29, + "learning_rate": 4.18374598751299e-06, + "loss": 1.0831, + "step": 9522 + }, + { + "epoch": 0.29, + "learning_rate": 4.183565676559349e-06, + "loss": 1.1055, + "step": 9523 + }, + { + "epoch": 0.29, + "learning_rate": 4.183385349578972e-06, + "loss": 1.149, + "step": 9524 + }, + { + "epoch": 0.29, + "learning_rate": 4.183205006573579e-06, + "loss": 1.1682, + "step": 9525 + }, + { + "epoch": 0.29, + "learning_rate": 4.183024647544884e-06, + "loss": 1.1064, + "step": 9526 + }, + { + "epoch": 0.29, + "learning_rate": 4.182844272494606e-06, + "loss": 1.1085, + "step": 9527 + }, + { + "epoch": 0.29, + "learning_rate": 4.1826638814244604e-06, + "loss": 1.1107, + "step": 9528 + }, + { + "epoch": 0.29, + "learning_rate": 4.182483474336164e-06, + "loss": 1.1259, + "step": 9529 + }, + { + "epoch": 0.29, + "learning_rate": 4.182303051231436e-06, + "loss": 1.1759, + "step": 9530 + }, + { + "epoch": 0.29, + "learning_rate": 4.182122612111994e-06, + "loss": 1.1368, + "step": 9531 + }, + { + "epoch": 0.29, + "learning_rate": 4.181942156979555e-06, + "loss": 1.1359, + "step": 9532 + }, + { + "epoch": 0.29, + "learning_rate": 4.181761685835835e-06, + "loss": 1.2273, + "step": 9533 + }, + { + "epoch": 0.29, + "learning_rate": 4.181581198682556e-06, + "loss": 1.1318, + "step": 9534 + }, + { + "epoch": 0.29, + "learning_rate": 4.181400695521432e-06, + "loss": 1.1262, + "step": 9535 + }, + { + "epoch": 0.29, + "learning_rate": 4.181220176354184e-06, + "loss": 1.1763, + "step": 9536 + }, + { + "epoch": 0.29, + "learning_rate": 4.181039641182528e-06, + "loss": 1.316, + "step": 9537 + }, + { + "epoch": 0.29, + "learning_rate": 4.180859090008187e-06, + "loss": 1.167, + "step": 9538 + }, + { + "epoch": 0.29, + "learning_rate": 4.180678522832875e-06, + "loss": 1.1822, + "step": 9539 + }, + { + "epoch": 0.29, + "learning_rate": 4.180497939658314e-06, + "loss": 1.1786, + "step": 9540 + }, + { + "epoch": 0.29, + "learning_rate": 4.180317340486221e-06, + "loss": 1.2173, + "step": 9541 + }, + { + "epoch": 0.29, + "learning_rate": 4.180136725318317e-06, + "loss": 1.1357, + "step": 9542 + }, + { + "epoch": 0.29, + "learning_rate": 4.17995609415632e-06, + "loss": 1.1013, + "step": 9543 + }, + { + "epoch": 0.29, + "learning_rate": 4.1797754470019505e-06, + "loss": 1.2029, + "step": 9544 + }, + { + "epoch": 0.29, + "learning_rate": 4.179594783856927e-06, + "loss": 1.1138, + "step": 9545 + }, + { + "epoch": 0.29, + "learning_rate": 4.179414104722971e-06, + "loss": 1.1283, + "step": 9546 + }, + { + "epoch": 0.29, + "learning_rate": 4.179233409601802e-06, + "loss": 1.0884, + "step": 9547 + }, + { + "epoch": 0.29, + "learning_rate": 4.179052698495138e-06, + "loss": 1.1743, + "step": 9548 + }, + { + "epoch": 0.29, + "learning_rate": 4.178871971404702e-06, + "loss": 1.363, + "step": 9549 + }, + { + "epoch": 0.29, + "learning_rate": 4.178691228332213e-06, + "loss": 1.1027, + "step": 9550 + }, + { + "epoch": 0.29, + "learning_rate": 4.178510469279392e-06, + "loss": 1.0914, + "step": 9551 + }, + { + "epoch": 0.29, + "learning_rate": 4.17832969424796e-06, + "loss": 1.1279, + "step": 9552 + }, + { + "epoch": 0.29, + "learning_rate": 4.178148903239638e-06, + "loss": 1.1829, + "step": 9553 + }, + { + "epoch": 0.29, + "learning_rate": 4.177968096256146e-06, + "loss": 1.2865, + "step": 9554 + }, + { + "epoch": 0.29, + "learning_rate": 4.177787273299207e-06, + "loss": 1.1765, + "step": 9555 + }, + { + "epoch": 0.29, + "learning_rate": 4.1776064343705395e-06, + "loss": 1.2158, + "step": 9556 + }, + { + "epoch": 0.29, + "learning_rate": 4.177425579471867e-06, + "loss": 1.1722, + "step": 9557 + }, + { + "epoch": 0.29, + "learning_rate": 4.1772447086049115e-06, + "loss": 1.193, + "step": 9558 + }, + { + "epoch": 0.29, + "learning_rate": 4.177063821771395e-06, + "loss": 1.172, + "step": 9559 + }, + { + "epoch": 0.29, + "learning_rate": 4.176882918973037e-06, + "loss": 1.1126, + "step": 9560 + }, + { + "epoch": 0.29, + "learning_rate": 4.176702000211562e-06, + "loss": 1.1846, + "step": 9561 + }, + { + "epoch": 0.29, + "learning_rate": 4.176521065488691e-06, + "loss": 1.1702, + "step": 9562 + }, + { + "epoch": 0.29, + "learning_rate": 4.176340114806148e-06, + "loss": 1.2922, + "step": 9563 + }, + { + "epoch": 0.29, + "learning_rate": 4.176159148165654e-06, + "loss": 1.1052, + "step": 9564 + }, + { + "epoch": 0.29, + "learning_rate": 4.1759781655689315e-06, + "loss": 1.1022, + "step": 9565 + }, + { + "epoch": 0.29, + "learning_rate": 4.175797167017704e-06, + "loss": 1.1513, + "step": 9566 + }, + { + "epoch": 0.29, + "learning_rate": 4.1756161525136954e-06, + "loss": 1.1721, + "step": 9567 + }, + { + "epoch": 0.29, + "learning_rate": 4.175435122058627e-06, + "loss": 1.1328, + "step": 9568 + }, + { + "epoch": 0.29, + "learning_rate": 4.1752540756542246e-06, + "loss": 1.152, + "step": 9569 + }, + { + "epoch": 0.29, + "learning_rate": 4.175073013302209e-06, + "loss": 1.1282, + "step": 9570 + }, + { + "epoch": 0.29, + "learning_rate": 4.174891935004306e-06, + "loss": 1.2135, + "step": 9571 + }, + { + "epoch": 0.29, + "learning_rate": 4.174710840762237e-06, + "loss": 1.1877, + "step": 9572 + }, + { + "epoch": 0.29, + "learning_rate": 4.174529730577729e-06, + "loss": 1.2438, + "step": 9573 + }, + { + "epoch": 0.29, + "learning_rate": 4.174348604452504e-06, + "loss": 1.1089, + "step": 9574 + }, + { + "epoch": 0.29, + "learning_rate": 4.174167462388286e-06, + "loss": 0.9628, + "step": 9575 + }, + { + "epoch": 0.29, + "learning_rate": 4.173986304386801e-06, + "loss": 1.2133, + "step": 9576 + }, + { + "epoch": 0.29, + "learning_rate": 4.1738051304497715e-06, + "loss": 1.0756, + "step": 9577 + }, + { + "epoch": 0.29, + "learning_rate": 4.173623940578924e-06, + "loss": 1.1319, + "step": 9578 + }, + { + "epoch": 0.29, + "learning_rate": 4.173442734775983e-06, + "loss": 1.16, + "step": 9579 + }, + { + "epoch": 0.29, + "learning_rate": 4.173261513042673e-06, + "loss": 1.0016, + "step": 9580 + }, + { + "epoch": 0.29, + "learning_rate": 4.173080275380718e-06, + "loss": 1.0426, + "step": 9581 + }, + { + "epoch": 0.29, + "learning_rate": 4.172899021791845e-06, + "loss": 1.1366, + "step": 9582 + }, + { + "epoch": 0.29, + "learning_rate": 4.17271775227778e-06, + "loss": 1.0723, + "step": 9583 + }, + { + "epoch": 0.29, + "learning_rate": 4.172536466840247e-06, + "loss": 1.1069, + "step": 9584 + }, + { + "epoch": 0.29, + "learning_rate": 4.172355165480972e-06, + "loss": 1.1569, + "step": 9585 + }, + { + "epoch": 0.29, + "learning_rate": 4.172173848201682e-06, + "loss": 1.1234, + "step": 9586 + }, + { + "epoch": 0.29, + "learning_rate": 4.1719925150041014e-06, + "loss": 1.2743, + "step": 9587 + }, + { + "epoch": 0.29, + "learning_rate": 4.171811165889959e-06, + "loss": 1.1417, + "step": 9588 + }, + { + "epoch": 0.29, + "learning_rate": 4.171629800860978e-06, + "loss": 1.136, + "step": 9589 + }, + { + "epoch": 0.29, + "learning_rate": 4.171448419918887e-06, + "loss": 1.114, + "step": 9590 + }, + { + "epoch": 0.29, + "learning_rate": 4.171267023065412e-06, + "loss": 1.0451, + "step": 9591 + }, + { + "epoch": 0.29, + "learning_rate": 4.17108561030228e-06, + "loss": 1.0865, + "step": 9592 + }, + { + "epoch": 0.29, + "learning_rate": 4.1709041816312166e-06, + "loss": 1.2806, + "step": 9593 + }, + { + "epoch": 0.29, + "learning_rate": 4.170722737053951e-06, + "loss": 1.1603, + "step": 9594 + }, + { + "epoch": 0.29, + "learning_rate": 4.17054127657221e-06, + "loss": 1.1169, + "step": 9595 + }, + { + "epoch": 0.29, + "learning_rate": 4.17035980018772e-06, + "loss": 1.1422, + "step": 9596 + }, + { + "epoch": 0.29, + "learning_rate": 4.170178307902209e-06, + "loss": 1.0699, + "step": 9597 + }, + { + "epoch": 0.29, + "learning_rate": 4.169996799717405e-06, + "loss": 1.0821, + "step": 9598 + }, + { + "epoch": 0.29, + "learning_rate": 4.169815275635037e-06, + "loss": 1.1057, + "step": 9599 + }, + { + "epoch": 0.29, + "learning_rate": 4.169633735656831e-06, + "loss": 1.2035, + "step": 9600 + }, + { + "epoch": 0.29, + "learning_rate": 4.169452179784516e-06, + "loss": 1.1392, + "step": 9601 + }, + { + "epoch": 0.29, + "learning_rate": 4.169270608019819e-06, + "loss": 1.08, + "step": 9602 + }, + { + "epoch": 0.29, + "learning_rate": 4.1690890203644715e-06, + "loss": 1.1685, + "step": 9603 + }, + { + "epoch": 0.29, + "learning_rate": 4.1689074168202e-06, + "loss": 1.2422, + "step": 9604 + }, + { + "epoch": 0.29, + "learning_rate": 4.168725797388733e-06, + "loss": 1.0953, + "step": 9605 + }, + { + "epoch": 0.29, + "learning_rate": 4.1685441620718e-06, + "loss": 1.3172, + "step": 9606 + }, + { + "epoch": 0.29, + "learning_rate": 4.168362510871131e-06, + "loss": 1.0676, + "step": 9607 + }, + { + "epoch": 0.29, + "learning_rate": 4.168180843788454e-06, + "loss": 1.2297, + "step": 9608 + }, + { + "epoch": 0.29, + "learning_rate": 4.167999160825499e-06, + "loss": 1.1009, + "step": 9609 + }, + { + "epoch": 0.29, + "learning_rate": 4.1678174619839955e-06, + "loss": 1.2348, + "step": 9610 + }, + { + "epoch": 0.29, + "learning_rate": 4.167635747265672e-06, + "loss": 1.1794, + "step": 9611 + }, + { + "epoch": 0.29, + "learning_rate": 4.16745401667226e-06, + "loss": 1.0886, + "step": 9612 + }, + { + "epoch": 0.29, + "learning_rate": 4.167272270205489e-06, + "loss": 1.1249, + "step": 9613 + }, + { + "epoch": 0.29, + "learning_rate": 4.167090507867089e-06, + "loss": 1.1749, + "step": 9614 + }, + { + "epoch": 0.29, + "learning_rate": 4.16690872965879e-06, + "loss": 1.1409, + "step": 9615 + }, + { + "epoch": 0.29, + "learning_rate": 4.166726935582323e-06, + "loss": 1.1743, + "step": 9616 + }, + { + "epoch": 0.29, + "learning_rate": 4.1665451256394175e-06, + "loss": 1.0893, + "step": 9617 + }, + { + "epoch": 0.29, + "learning_rate": 4.166363299831806e-06, + "loss": 1.0935, + "step": 9618 + }, + { + "epoch": 0.29, + "learning_rate": 4.166181458161218e-06, + "loss": 1.0496, + "step": 9619 + }, + { + "epoch": 0.29, + "learning_rate": 4.165999600629385e-06, + "loss": 1.1134, + "step": 9620 + }, + { + "epoch": 0.29, + "learning_rate": 4.165817727238039e-06, + "loss": 1.1317, + "step": 9621 + }, + { + "epoch": 0.29, + "learning_rate": 4.165635837988909e-06, + "loss": 1.0972, + "step": 9622 + }, + { + "epoch": 0.29, + "learning_rate": 4.1654539328837285e-06, + "loss": 1.2238, + "step": 9623 + }, + { + "epoch": 0.29, + "learning_rate": 4.165272011924229e-06, + "loss": 1.2177, + "step": 9624 + }, + { + "epoch": 0.29, + "learning_rate": 4.165090075112142e-06, + "loss": 1.1663, + "step": 9625 + }, + { + "epoch": 0.29, + "learning_rate": 4.1649081224491995e-06, + "loss": 1.2571, + "step": 9626 + }, + { + "epoch": 0.29, + "learning_rate": 4.164726153937133e-06, + "loss": 1.1713, + "step": 9627 + }, + { + "epoch": 0.29, + "learning_rate": 4.164544169577676e-06, + "loss": 1.2252, + "step": 9628 + }, + { + "epoch": 0.29, + "learning_rate": 4.16436216937256e-06, + "loss": 1.0745, + "step": 9629 + }, + { + "epoch": 0.29, + "learning_rate": 4.164180153323517e-06, + "loss": 1.079, + "step": 9630 + }, + { + "epoch": 0.29, + "learning_rate": 4.163998121432281e-06, + "loss": 1.0889, + "step": 9631 + }, + { + "epoch": 0.29, + "learning_rate": 4.163816073700584e-06, + "loss": 1.158, + "step": 9632 + }, + { + "epoch": 0.29, + "learning_rate": 4.16363401013016e-06, + "loss": 1.1964, + "step": 9633 + }, + { + "epoch": 0.29, + "learning_rate": 4.163451930722741e-06, + "loss": 1.2223, + "step": 9634 + }, + { + "epoch": 0.29, + "learning_rate": 4.1632698354800605e-06, + "loss": 1.3336, + "step": 9635 + }, + { + "epoch": 0.29, + "learning_rate": 4.1630877244038525e-06, + "loss": 1.2394, + "step": 9636 + }, + { + "epoch": 0.29, + "learning_rate": 4.162905597495851e-06, + "loss": 1.2026, + "step": 9637 + }, + { + "epoch": 0.29, + "learning_rate": 4.1627234547577876e-06, + "loss": 1.1453, + "step": 9638 + }, + { + "epoch": 0.29, + "learning_rate": 4.162541296191398e-06, + "loss": 1.0596, + "step": 9639 + }, + { + "epoch": 0.29, + "learning_rate": 4.162359121798417e-06, + "loss": 1.0998, + "step": 9640 + }, + { + "epoch": 0.29, + "learning_rate": 4.1621769315805776e-06, + "loss": 1.1863, + "step": 9641 + }, + { + "epoch": 0.29, + "learning_rate": 4.1619947255396146e-06, + "loss": 1.1848, + "step": 9642 + }, + { + "epoch": 0.29, + "learning_rate": 4.161812503677261e-06, + "loss": 1.1863, + "step": 9643 + }, + { + "epoch": 0.29, + "learning_rate": 4.161630265995254e-06, + "loss": 1.1361, + "step": 9644 + }, + { + "epoch": 0.29, + "learning_rate": 4.161448012495326e-06, + "loss": 1.1376, + "step": 9645 + }, + { + "epoch": 0.29, + "learning_rate": 4.161265743179214e-06, + "loss": 1.08, + "step": 9646 + }, + { + "epoch": 0.29, + "learning_rate": 4.161083458048652e-06, + "loss": 1.1837, + "step": 9647 + }, + { + "epoch": 0.29, + "learning_rate": 4.160901157105374e-06, + "loss": 1.1358, + "step": 9648 + }, + { + "epoch": 0.29, + "learning_rate": 4.160718840351119e-06, + "loss": 1.1329, + "step": 9649 + }, + { + "epoch": 0.29, + "learning_rate": 4.16053650778762e-06, + "loss": 1.2667, + "step": 9650 + }, + { + "epoch": 0.29, + "learning_rate": 4.1603541594166134e-06, + "loss": 1.2214, + "step": 9651 + }, + { + "epoch": 0.29, + "learning_rate": 4.160171795239834e-06, + "loss": 1.1671, + "step": 9652 + }, + { + "epoch": 0.29, + "learning_rate": 4.1599894152590195e-06, + "loss": 1.157, + "step": 9653 + }, + { + "epoch": 0.29, + "learning_rate": 4.159807019475904e-06, + "loss": 1.3354, + "step": 9654 + }, + { + "epoch": 0.29, + "learning_rate": 4.159624607892226e-06, + "loss": 1.1206, + "step": 9655 + }, + { + "epoch": 0.29, + "learning_rate": 4.15944218050972e-06, + "loss": 1.223, + "step": 9656 + }, + { + "epoch": 0.29, + "learning_rate": 4.159259737330126e-06, + "loss": 1.1197, + "step": 9657 + }, + { + "epoch": 0.29, + "learning_rate": 4.159077278355177e-06, + "loss": 1.1111, + "step": 9658 + }, + { + "epoch": 0.29, + "learning_rate": 4.158894803586611e-06, + "loss": 1.1804, + "step": 9659 + }, + { + "epoch": 0.29, + "learning_rate": 4.1587123130261655e-06, + "loss": 1.1395, + "step": 9660 + }, + { + "epoch": 0.29, + "learning_rate": 4.158529806675577e-06, + "loss": 1.1776, + "step": 9661 + }, + { + "epoch": 0.29, + "learning_rate": 4.158347284536585e-06, + "loss": 1.1694, + "step": 9662 + }, + { + "epoch": 0.29, + "learning_rate": 4.158164746610925e-06, + "loss": 1.1665, + "step": 9663 + }, + { + "epoch": 0.29, + "learning_rate": 4.157982192900335e-06, + "loss": 1.1953, + "step": 9664 + }, + { + "epoch": 0.29, + "learning_rate": 4.157799623406553e-06, + "loss": 1.0346, + "step": 9665 + }, + { + "epoch": 0.29, + "learning_rate": 4.157617038131317e-06, + "loss": 1.0632, + "step": 9666 + }, + { + "epoch": 0.29, + "learning_rate": 4.157434437076366e-06, + "loss": 1.2751, + "step": 9667 + }, + { + "epoch": 0.29, + "learning_rate": 4.1572518202434366e-06, + "loss": 1.079, + "step": 9668 + }, + { + "epoch": 0.29, + "learning_rate": 4.157069187634268e-06, + "loss": 1.0463, + "step": 9669 + }, + { + "epoch": 0.29, + "learning_rate": 4.156886539250599e-06, + "loss": 1.0957, + "step": 9670 + }, + { + "epoch": 0.29, + "learning_rate": 4.156703875094168e-06, + "loss": 1.2181, + "step": 9671 + }, + { + "epoch": 0.29, + "learning_rate": 4.1565211951667146e-06, + "loss": 1.1816, + "step": 9672 + }, + { + "epoch": 0.29, + "learning_rate": 4.1563384994699766e-06, + "loss": 1.1617, + "step": 9673 + }, + { + "epoch": 0.29, + "learning_rate": 4.156155788005693e-06, + "loss": 1.1229, + "step": 9674 + }, + { + "epoch": 0.29, + "learning_rate": 4.155973060775606e-06, + "loss": 1.2529, + "step": 9675 + }, + { + "epoch": 0.29, + "learning_rate": 4.155790317781452e-06, + "loss": 1.0475, + "step": 9676 + }, + { + "epoch": 0.29, + "learning_rate": 4.155607559024971e-06, + "loss": 1.0893, + "step": 9677 + }, + { + "epoch": 0.29, + "learning_rate": 4.155424784507904e-06, + "loss": 1.1538, + "step": 9678 + }, + { + "epoch": 0.29, + "learning_rate": 4.15524199423199e-06, + "loss": 1.1436, + "step": 9679 + }, + { + "epoch": 0.29, + "learning_rate": 4.15505918819897e-06, + "loss": 1.2129, + "step": 9680 + }, + { + "epoch": 0.29, + "learning_rate": 4.154876366410583e-06, + "loss": 1.1234, + "step": 9681 + }, + { + "epoch": 0.29, + "learning_rate": 4.154693528868571e-06, + "loss": 1.2509, + "step": 9682 + }, + { + "epoch": 0.29, + "learning_rate": 4.1545106755746725e-06, + "loss": 1.0709, + "step": 9683 + }, + { + "epoch": 0.29, + "learning_rate": 4.154327806530629e-06, + "loss": 1.1382, + "step": 9684 + }, + { + "epoch": 0.29, + "learning_rate": 4.154144921738182e-06, + "loss": 1.1365, + "step": 9685 + }, + { + "epoch": 0.29, + "learning_rate": 4.153962021199073e-06, + "loss": 1.1061, + "step": 9686 + }, + { + "epoch": 0.29, + "learning_rate": 4.153779104915041e-06, + "loss": 1.2584, + "step": 9687 + }, + { + "epoch": 0.29, + "learning_rate": 4.153596172887828e-06, + "loss": 1.1842, + "step": 9688 + }, + { + "epoch": 0.29, + "learning_rate": 4.153413225119177e-06, + "loss": 1.1666, + "step": 9689 + }, + { + "epoch": 0.29, + "learning_rate": 4.1532302616108275e-06, + "loss": 1.154, + "step": 9690 + }, + { + "epoch": 0.29, + "learning_rate": 4.153047282364522e-06, + "loss": 1.1003, + "step": 9691 + }, + { + "epoch": 0.29, + "learning_rate": 4.152864287382004e-06, + "loss": 1.1698, + "step": 9692 + }, + { + "epoch": 0.29, + "learning_rate": 4.152681276665013e-06, + "loss": 0.9037, + "step": 9693 + }, + { + "epoch": 0.29, + "learning_rate": 4.152498250215292e-06, + "loss": 1.192, + "step": 9694 + }, + { + "epoch": 0.29, + "learning_rate": 4.152315208034584e-06, + "loss": 1.2195, + "step": 9695 + }, + { + "epoch": 0.29, + "learning_rate": 4.15213215012463e-06, + "loss": 1.0961, + "step": 9696 + }, + { + "epoch": 0.29, + "learning_rate": 4.151949076487175e-06, + "loss": 1.1879, + "step": 9697 + }, + { + "epoch": 0.29, + "learning_rate": 4.151765987123959e-06, + "loss": 1.1563, + "step": 9698 + }, + { + "epoch": 0.29, + "learning_rate": 4.151582882036728e-06, + "loss": 1.1219, + "step": 9699 + }, + { + "epoch": 0.29, + "learning_rate": 4.1513997612272226e-06, + "loss": 1.1359, + "step": 9700 + }, + { + "epoch": 0.29, + "learning_rate": 4.151216624697186e-06, + "loss": 1.1409, + "step": 9701 + }, + { + "epoch": 0.29, + "learning_rate": 4.151033472448363e-06, + "loss": 1.0704, + "step": 9702 + }, + { + "epoch": 0.29, + "learning_rate": 4.150850304482497e-06, + "loss": 1.0979, + "step": 9703 + }, + { + "epoch": 0.29, + "learning_rate": 4.1506671208013305e-06, + "loss": 1.1672, + "step": 9704 + }, + { + "epoch": 0.29, + "learning_rate": 4.150483921406609e-06, + "loss": 1.2411, + "step": 9705 + }, + { + "epoch": 0.29, + "learning_rate": 4.150300706300075e-06, + "loss": 1.0709, + "step": 9706 + }, + { + "epoch": 0.29, + "learning_rate": 4.150117475483472e-06, + "loss": 1.0923, + "step": 9707 + }, + { + "epoch": 0.29, + "learning_rate": 4.1499342289585465e-06, + "loss": 1.139, + "step": 9708 + }, + { + "epoch": 0.29, + "learning_rate": 4.149750966727041e-06, + "loss": 0.9995, + "step": 9709 + }, + { + "epoch": 0.29, + "learning_rate": 4.149567688790702e-06, + "loss": 1.1995, + "step": 9710 + }, + { + "epoch": 0.29, + "learning_rate": 4.149384395151272e-06, + "loss": 1.0845, + "step": 9711 + }, + { + "epoch": 0.29, + "learning_rate": 4.149201085810497e-06, + "loss": 1.1806, + "step": 9712 + }, + { + "epoch": 0.29, + "learning_rate": 4.149017760770123e-06, + "loss": 1.2311, + "step": 9713 + }, + { + "epoch": 0.29, + "learning_rate": 4.148834420031893e-06, + "loss": 1.026, + "step": 9714 + }, + { + "epoch": 0.29, + "learning_rate": 4.148651063597553e-06, + "loss": 1.1995, + "step": 9715 + }, + { + "epoch": 0.29, + "learning_rate": 4.1484676914688505e-06, + "loss": 1.1344, + "step": 9716 + }, + { + "epoch": 0.29, + "learning_rate": 4.148284303647529e-06, + "loss": 1.1312, + "step": 9717 + }, + { + "epoch": 0.29, + "learning_rate": 4.148100900135334e-06, + "loss": 1.0802, + "step": 9718 + }, + { + "epoch": 0.29, + "learning_rate": 4.147917480934013e-06, + "loss": 1.1541, + "step": 9719 + }, + { + "epoch": 0.29, + "learning_rate": 4.1477340460453105e-06, + "loss": 1.1227, + "step": 9720 + }, + { + "epoch": 0.29, + "learning_rate": 4.1475505954709735e-06, + "loss": 1.0814, + "step": 9721 + }, + { + "epoch": 0.29, + "learning_rate": 4.147367129212749e-06, + "loss": 1.1588, + "step": 9722 + }, + { + "epoch": 0.29, + "learning_rate": 4.1471836472723824e-06, + "loss": 1.1249, + "step": 9723 + }, + { + "epoch": 0.29, + "learning_rate": 4.147000149651621e-06, + "loss": 1.1204, + "step": 9724 + }, + { + "epoch": 0.29, + "learning_rate": 4.146816636352211e-06, + "loss": 1.1452, + "step": 9725 + }, + { + "epoch": 0.29, + "learning_rate": 4.146633107375901e-06, + "loss": 1.0214, + "step": 9726 + }, + { + "epoch": 0.29, + "learning_rate": 4.146449562724435e-06, + "loss": 1.0713, + "step": 9727 + }, + { + "epoch": 0.29, + "learning_rate": 4.146266002399563e-06, + "loss": 1.1755, + "step": 9728 + }, + { + "epoch": 0.29, + "learning_rate": 4.146082426403032e-06, + "loss": 1.1697, + "step": 9729 + }, + { + "epoch": 0.29, + "learning_rate": 4.145898834736588e-06, + "loss": 1.231, + "step": 9730 + }, + { + "epoch": 0.29, + "learning_rate": 4.145715227401981e-06, + "loss": 1.2272, + "step": 9731 + }, + { + "epoch": 0.29, + "learning_rate": 4.145531604400956e-06, + "loss": 1.052, + "step": 9732 + }, + { + "epoch": 0.29, + "learning_rate": 4.145347965735265e-06, + "loss": 1.1611, + "step": 9733 + }, + { + "epoch": 0.29, + "learning_rate": 4.145164311406652e-06, + "loss": 1.1027, + "step": 9734 + }, + { + "epoch": 0.29, + "learning_rate": 4.144980641416868e-06, + "loss": 1.1946, + "step": 9735 + }, + { + "epoch": 0.29, + "learning_rate": 4.144796955767659e-06, + "loss": 1.1225, + "step": 9736 + }, + { + "epoch": 0.29, + "learning_rate": 4.144613254460777e-06, + "loss": 1.1417, + "step": 9737 + }, + { + "epoch": 0.29, + "learning_rate": 4.1444295374979685e-06, + "loss": 1.1085, + "step": 9738 + }, + { + "epoch": 0.29, + "learning_rate": 4.144245804880982e-06, + "loss": 1.1996, + "step": 9739 + }, + { + "epoch": 0.29, + "learning_rate": 4.144062056611568e-06, + "loss": 1.0983, + "step": 9740 + }, + { + "epoch": 0.29, + "learning_rate": 4.143878292691474e-06, + "loss": 1.1187, + "step": 9741 + }, + { + "epoch": 0.29, + "learning_rate": 4.143694513122452e-06, + "loss": 1.1061, + "step": 9742 + }, + { + "epoch": 0.29, + "learning_rate": 4.143510717906248e-06, + "loss": 1.2452, + "step": 9743 + }, + { + "epoch": 0.29, + "learning_rate": 4.143326907044616e-06, + "loss": 1.1524, + "step": 9744 + }, + { + "epoch": 0.29, + "learning_rate": 4.143143080539301e-06, + "loss": 1.103, + "step": 9745 + }, + { + "epoch": 0.29, + "learning_rate": 4.1429592383920565e-06, + "loss": 1.0723, + "step": 9746 + }, + { + "epoch": 0.29, + "learning_rate": 4.142775380604631e-06, + "loss": 0.9992, + "step": 9747 + }, + { + "epoch": 0.29, + "learning_rate": 4.1425915071787745e-06, + "loss": 1.1544, + "step": 9748 + }, + { + "epoch": 0.29, + "learning_rate": 4.142407618116239e-06, + "loss": 1.1565, + "step": 9749 + }, + { + "epoch": 0.29, + "learning_rate": 4.142223713418773e-06, + "loss": 1.2004, + "step": 9750 + }, + { + "epoch": 0.29, + "learning_rate": 4.142039793088129e-06, + "loss": 1.1879, + "step": 9751 + }, + { + "epoch": 0.29, + "learning_rate": 4.141855857126057e-06, + "loss": 1.1091, + "step": 9752 + }, + { + "epoch": 0.29, + "learning_rate": 4.141671905534307e-06, + "loss": 1.0287, + "step": 9753 + }, + { + "epoch": 0.29, + "learning_rate": 4.141487938314631e-06, + "loss": 1.2289, + "step": 9754 + }, + { + "epoch": 0.29, + "learning_rate": 4.141303955468782e-06, + "loss": 1.1629, + "step": 9755 + }, + { + "epoch": 0.29, + "learning_rate": 4.141119956998509e-06, + "loss": 1.2401, + "step": 9756 + }, + { + "epoch": 0.29, + "learning_rate": 4.140935942905564e-06, + "loss": 1.2805, + "step": 9757 + }, + { + "epoch": 0.29, + "learning_rate": 4.140751913191699e-06, + "loss": 1.1412, + "step": 9758 + }, + { + "epoch": 0.29, + "learning_rate": 4.140567867858667e-06, + "loss": 1.1589, + "step": 9759 + }, + { + "epoch": 0.29, + "learning_rate": 4.140383806908218e-06, + "loss": 1.0331, + "step": 9760 + }, + { + "epoch": 0.29, + "learning_rate": 4.140199730342106e-06, + "loss": 1.2545, + "step": 9761 + }, + { + "epoch": 0.29, + "learning_rate": 4.140015638162082e-06, + "loss": 1.2242, + "step": 9762 + }, + { + "epoch": 0.29, + "learning_rate": 4.139831530369899e-06, + "loss": 1.1175, + "step": 9763 + }, + { + "epoch": 0.29, + "learning_rate": 4.1396474069673095e-06, + "loss": 1.1933, + "step": 9764 + }, + { + "epoch": 0.29, + "learning_rate": 4.139463267956067e-06, + "loss": 1.1622, + "step": 9765 + }, + { + "epoch": 0.29, + "learning_rate": 4.139279113337923e-06, + "loss": 1.0541, + "step": 9766 + }, + { + "epoch": 0.29, + "learning_rate": 4.139094943114632e-06, + "loss": 1.0701, + "step": 9767 + }, + { + "epoch": 0.29, + "learning_rate": 4.138910757287946e-06, + "loss": 1.1436, + "step": 9768 + }, + { + "epoch": 0.29, + "learning_rate": 4.13872655585962e-06, + "loss": 1.2374, + "step": 9769 + }, + { + "epoch": 0.29, + "learning_rate": 4.138542338831405e-06, + "loss": 1.2314, + "step": 9770 + }, + { + "epoch": 0.29, + "learning_rate": 4.138358106205057e-06, + "loss": 0.9623, + "step": 9771 + }, + { + "epoch": 0.29, + "learning_rate": 4.138173857982329e-06, + "loss": 1.1353, + "step": 9772 + }, + { + "epoch": 0.29, + "learning_rate": 4.137989594164974e-06, + "loss": 1.1803, + "step": 9773 + }, + { + "epoch": 0.29, + "learning_rate": 4.137805314754747e-06, + "loss": 1.1564, + "step": 9774 + }, + { + "epoch": 0.29, + "learning_rate": 4.137621019753403e-06, + "loss": 1.144, + "step": 9775 + }, + { + "epoch": 0.29, + "learning_rate": 4.137436709162695e-06, + "loss": 1.1915, + "step": 9776 + }, + { + "epoch": 0.29, + "learning_rate": 4.137252382984378e-06, + "loss": 1.1621, + "step": 9777 + }, + { + "epoch": 0.29, + "learning_rate": 4.137068041220208e-06, + "loss": 1.1743, + "step": 9778 + }, + { + "epoch": 0.29, + "learning_rate": 4.136883683871937e-06, + "loss": 1.112, + "step": 9779 + }, + { + "epoch": 0.29, + "learning_rate": 4.136699310941324e-06, + "loss": 1.0723, + "step": 9780 + }, + { + "epoch": 0.29, + "learning_rate": 4.136514922430119e-06, + "loss": 1.1245, + "step": 9781 + }, + { + "epoch": 0.29, + "learning_rate": 4.136330518340082e-06, + "loss": 1.183, + "step": 9782 + }, + { + "epoch": 0.29, + "learning_rate": 4.136146098672966e-06, + "loss": 1.0154, + "step": 9783 + }, + { + "epoch": 0.29, + "learning_rate": 4.135961663430527e-06, + "loss": 1.1312, + "step": 9784 + }, + { + "epoch": 0.29, + "learning_rate": 4.135777212614521e-06, + "loss": 1.1436, + "step": 9785 + }, + { + "epoch": 0.29, + "learning_rate": 4.1355927462267046e-06, + "loss": 1.0731, + "step": 9786 + }, + { + "epoch": 0.29, + "learning_rate": 4.135408264268832e-06, + "loss": 1.2017, + "step": 9787 + }, + { + "epoch": 0.29, + "learning_rate": 4.13522376674266e-06, + "loss": 1.0895, + "step": 9788 + }, + { + "epoch": 0.29, + "learning_rate": 4.135039253649946e-06, + "loss": 1.1625, + "step": 9789 + }, + { + "epoch": 0.29, + "learning_rate": 4.134854724992445e-06, + "loss": 1.1297, + "step": 9790 + }, + { + "epoch": 0.29, + "learning_rate": 4.134670180771916e-06, + "loss": 1.1292, + "step": 9791 + }, + { + "epoch": 0.29, + "learning_rate": 4.134485620990113e-06, + "loss": 1.1373, + "step": 9792 + }, + { + "epoch": 0.3, + "learning_rate": 4.134301045648794e-06, + "loss": 1.272, + "step": 9793 + }, + { + "epoch": 0.3, + "learning_rate": 4.134116454749716e-06, + "loss": 1.0109, + "step": 9794 + }, + { + "epoch": 0.3, + "learning_rate": 4.133931848294637e-06, + "loss": 1.1709, + "step": 9795 + }, + { + "epoch": 0.3, + "learning_rate": 4.133747226285314e-06, + "loss": 1.1177, + "step": 9796 + }, + { + "epoch": 0.3, + "learning_rate": 4.133562588723503e-06, + "loss": 1.1746, + "step": 9797 + }, + { + "epoch": 0.3, + "learning_rate": 4.133377935610963e-06, + "loss": 1.2121, + "step": 9798 + }, + { + "epoch": 0.3, + "learning_rate": 4.133193266949453e-06, + "loss": 1.1845, + "step": 9799 + }, + { + "epoch": 0.3, + "learning_rate": 4.1330085827407295e-06, + "loss": 1.0733, + "step": 9800 + }, + { + "epoch": 0.3, + "learning_rate": 4.13282388298655e-06, + "loss": 1.1776, + "step": 9801 + }, + { + "epoch": 0.3, + "learning_rate": 4.132639167688674e-06, + "loss": 1.0918, + "step": 9802 + }, + { + "epoch": 0.3, + "learning_rate": 4.132454436848859e-06, + "loss": 1.1086, + "step": 9803 + }, + { + "epoch": 0.3, + "learning_rate": 4.132269690468865e-06, + "loss": 1.1901, + "step": 9804 + }, + { + "epoch": 0.3, + "learning_rate": 4.132084928550448e-06, + "loss": 1.1762, + "step": 9805 + }, + { + "epoch": 0.3, + "learning_rate": 4.1319001510953696e-06, + "loss": 1.1398, + "step": 9806 + }, + { + "epoch": 0.3, + "learning_rate": 4.1317153581053885e-06, + "loss": 1.229, + "step": 9807 + }, + { + "epoch": 0.3, + "learning_rate": 4.131530549582261e-06, + "loss": 1.1296, + "step": 9808 + }, + { + "epoch": 0.3, + "learning_rate": 4.13134572552775e-06, + "loss": 1.0405, + "step": 9809 + }, + { + "epoch": 0.3, + "learning_rate": 4.131160885943612e-06, + "loss": 1.0872, + "step": 9810 + }, + { + "epoch": 0.3, + "learning_rate": 4.13097603083161e-06, + "loss": 1.1234, + "step": 9811 + }, + { + "epoch": 0.3, + "learning_rate": 4.1307911601935e-06, + "loss": 1.1848, + "step": 9812 + }, + { + "epoch": 0.3, + "learning_rate": 4.130606274031045e-06, + "loss": 1.2623, + "step": 9813 + }, + { + "epoch": 0.3, + "learning_rate": 4.130421372346001e-06, + "loss": 1.1791, + "step": 9814 + }, + { + "epoch": 0.3, + "learning_rate": 4.130236455140134e-06, + "loss": 1.0479, + "step": 9815 + }, + { + "epoch": 0.3, + "learning_rate": 4.130051522415199e-06, + "loss": 0.9941, + "step": 9816 + }, + { + "epoch": 0.3, + "learning_rate": 4.129866574172959e-06, + "loss": 1.1747, + "step": 9817 + }, + { + "epoch": 0.3, + "learning_rate": 4.1296816104151745e-06, + "loss": 1.1959, + "step": 9818 + }, + { + "epoch": 0.3, + "learning_rate": 4.129496631143606e-06, + "loss": 1.0965, + "step": 9819 + }, + { + "epoch": 0.3, + "learning_rate": 4.129311636360014e-06, + "loss": 1.1382, + "step": 9820 + }, + { + "epoch": 0.3, + "learning_rate": 4.12912662606616e-06, + "loss": 1.0879, + "step": 9821 + }, + { + "epoch": 0.3, + "learning_rate": 4.1289416002638056e-06, + "loss": 1.1624, + "step": 9822 + }, + { + "epoch": 0.3, + "learning_rate": 4.1287565589547115e-06, + "loss": 1.194, + "step": 9823 + }, + { + "epoch": 0.3, + "learning_rate": 4.1285715021406396e-06, + "loss": 1.1599, + "step": 9824 + }, + { + "epoch": 0.3, + "learning_rate": 4.12838642982335e-06, + "loss": 1.1587, + "step": 9825 + }, + { + "epoch": 0.3, + "learning_rate": 4.1282013420046076e-06, + "loss": 1.0378, + "step": 9826 + }, + { + "epoch": 0.3, + "learning_rate": 4.128016238686171e-06, + "loss": 1.1061, + "step": 9827 + }, + { + "epoch": 0.3, + "learning_rate": 4.127831119869805e-06, + "loss": 1.1478, + "step": 9828 + }, + { + "epoch": 0.3, + "learning_rate": 4.12764598555727e-06, + "loss": 1.0007, + "step": 9829 + }, + { + "epoch": 0.3, + "learning_rate": 4.12746083575033e-06, + "loss": 1.2175, + "step": 9830 + }, + { + "epoch": 0.3, + "learning_rate": 4.127275670450746e-06, + "loss": 1.2434, + "step": 9831 + }, + { + "epoch": 0.3, + "learning_rate": 4.127090489660281e-06, + "loss": 1.1686, + "step": 9832 + }, + { + "epoch": 0.3, + "learning_rate": 4.1269052933807e-06, + "loss": 1.0873, + "step": 9833 + }, + { + "epoch": 0.3, + "learning_rate": 4.126720081613762e-06, + "loss": 1.1706, + "step": 9834 + }, + { + "epoch": 0.3, + "learning_rate": 4.126534854361234e-06, + "loss": 1.1287, + "step": 9835 + }, + { + "epoch": 0.3, + "learning_rate": 4.126349611624876e-06, + "loss": 1.211, + "step": 9836 + }, + { + "epoch": 0.3, + "learning_rate": 4.126164353406454e-06, + "loss": 1.1652, + "step": 9837 + }, + { + "epoch": 0.3, + "learning_rate": 4.12597907970773e-06, + "loss": 1.0503, + "step": 9838 + }, + { + "epoch": 0.3, + "learning_rate": 4.125793790530469e-06, + "loss": 1.1912, + "step": 9839 + }, + { + "epoch": 0.3, + "learning_rate": 4.125608485876433e-06, + "loss": 1.0571, + "step": 9840 + }, + { + "epoch": 0.3, + "learning_rate": 4.1254231657473876e-06, + "loss": 1.1249, + "step": 9841 + }, + { + "epoch": 0.3, + "learning_rate": 4.125237830145097e-06, + "loss": 1.1879, + "step": 9842 + }, + { + "epoch": 0.3, + "learning_rate": 4.125052479071324e-06, + "loss": 1.1505, + "step": 9843 + }, + { + "epoch": 0.3, + "learning_rate": 4.124867112527835e-06, + "loss": 1.2619, + "step": 9844 + }, + { + "epoch": 0.3, + "learning_rate": 4.124681730516394e-06, + "loss": 1.1738, + "step": 9845 + }, + { + "epoch": 0.3, + "learning_rate": 4.124496333038764e-06, + "loss": 1.0844, + "step": 9846 + }, + { + "epoch": 0.3, + "learning_rate": 4.124310920096712e-06, + "loss": 1.1323, + "step": 9847 + }, + { + "epoch": 0.3, + "learning_rate": 4.1241254916920025e-06, + "loss": 1.0178, + "step": 9848 + }, + { + "epoch": 0.3, + "learning_rate": 4.123940047826401e-06, + "loss": 1.2441, + "step": 9849 + }, + { + "epoch": 0.3, + "learning_rate": 4.123754588501671e-06, + "loss": 1.1227, + "step": 9850 + }, + { + "epoch": 0.3, + "learning_rate": 4.12356911371958e-06, + "loss": 1.1286, + "step": 9851 + }, + { + "epoch": 0.3, + "learning_rate": 4.123383623481893e-06, + "loss": 1.1221, + "step": 9852 + }, + { + "epoch": 0.3, + "learning_rate": 4.123198117790375e-06, + "loss": 1.1612, + "step": 9853 + }, + { + "epoch": 0.3, + "learning_rate": 4.123012596646795e-06, + "loss": 1.1901, + "step": 9854 + }, + { + "epoch": 0.3, + "learning_rate": 4.122827060052914e-06, + "loss": 1.1395, + "step": 9855 + }, + { + "epoch": 0.3, + "learning_rate": 4.122641508010503e-06, + "loss": 1.2546, + "step": 9856 + }, + { + "epoch": 0.3, + "learning_rate": 4.122455940521326e-06, + "loss": 1.0449, + "step": 9857 + }, + { + "epoch": 0.3, + "learning_rate": 4.122270357587148e-06, + "loss": 1.2397, + "step": 9858 + }, + { + "epoch": 0.3, + "learning_rate": 4.12208475920974e-06, + "loss": 1.2028, + "step": 9859 + }, + { + "epoch": 0.3, + "learning_rate": 4.121899145390864e-06, + "loss": 1.1909, + "step": 9860 + }, + { + "epoch": 0.3, + "learning_rate": 4.1217135161322915e-06, + "loss": 1.1641, + "step": 9861 + }, + { + "epoch": 0.3, + "learning_rate": 4.121527871435786e-06, + "loss": 1.2375, + "step": 9862 + }, + { + "epoch": 0.3, + "learning_rate": 4.121342211303116e-06, + "loss": 1.0848, + "step": 9863 + }, + { + "epoch": 0.3, + "learning_rate": 4.12115653573605e-06, + "loss": 1.1084, + "step": 9864 + }, + { + "epoch": 0.3, + "learning_rate": 4.120970844736354e-06, + "loss": 1.1794, + "step": 9865 + }, + { + "epoch": 0.3, + "learning_rate": 4.120785138305796e-06, + "loss": 1.15, + "step": 9866 + }, + { + "epoch": 0.3, + "learning_rate": 4.1205994164461445e-06, + "loss": 1.1822, + "step": 9867 + }, + { + "epoch": 0.3, + "learning_rate": 4.120413679159167e-06, + "loss": 1.0887, + "step": 9868 + }, + { + "epoch": 0.3, + "learning_rate": 4.120227926446632e-06, + "loss": 1.1868, + "step": 9869 + }, + { + "epoch": 0.3, + "learning_rate": 4.1200421583103065e-06, + "loss": 1.0864, + "step": 9870 + }, + { + "epoch": 0.3, + "learning_rate": 4.119856374751961e-06, + "loss": 1.229, + "step": 9871 + }, + { + "epoch": 0.3, + "learning_rate": 4.1196705757733625e-06, + "loss": 1.2103, + "step": 9872 + }, + { + "epoch": 0.3, + "learning_rate": 4.119484761376279e-06, + "loss": 1.1919, + "step": 9873 + }, + { + "epoch": 0.3, + "learning_rate": 4.119298931562482e-06, + "loss": 1.0676, + "step": 9874 + }, + { + "epoch": 0.3, + "learning_rate": 4.119113086333739e-06, + "loss": 1.1521, + "step": 9875 + }, + { + "epoch": 0.3, + "learning_rate": 4.118927225691819e-06, + "loss": 1.1499, + "step": 9876 + }, + { + "epoch": 0.3, + "learning_rate": 4.118741349638492e-06, + "loss": 1.1293, + "step": 9877 + }, + { + "epoch": 0.3, + "learning_rate": 4.118555458175526e-06, + "loss": 1.0995, + "step": 9878 + }, + { + "epoch": 0.3, + "learning_rate": 4.118369551304692e-06, + "loss": 0.9854, + "step": 9879 + }, + { + "epoch": 0.3, + "learning_rate": 4.1181836290277586e-06, + "loss": 1.1115, + "step": 9880 + }, + { + "epoch": 0.3, + "learning_rate": 4.117997691346498e-06, + "loss": 1.2133, + "step": 9881 + }, + { + "epoch": 0.3, + "learning_rate": 4.117811738262677e-06, + "loss": 1.1517, + "step": 9882 + }, + { + "epoch": 0.3, + "learning_rate": 4.117625769778068e-06, + "loss": 1.1006, + "step": 9883 + }, + { + "epoch": 0.3, + "learning_rate": 4.117439785894442e-06, + "loss": 1.2326, + "step": 9884 + }, + { + "epoch": 0.3, + "learning_rate": 4.117253786613566e-06, + "loss": 1.1127, + "step": 9885 + }, + { + "epoch": 0.3, + "learning_rate": 4.117067771937214e-06, + "loss": 1.0957, + "step": 9886 + }, + { + "epoch": 0.3, + "learning_rate": 4.116881741867156e-06, + "loss": 1.278, + "step": 9887 + }, + { + "epoch": 0.3, + "learning_rate": 4.116695696405162e-06, + "loss": 1.152, + "step": 9888 + }, + { + "epoch": 0.3, + "learning_rate": 4.116509635553003e-06, + "loss": 1.1487, + "step": 9889 + }, + { + "epoch": 0.3, + "learning_rate": 4.116323559312452e-06, + "loss": 1.1134, + "step": 9890 + }, + { + "epoch": 0.3, + "learning_rate": 4.116137467685278e-06, + "loss": 1.1039, + "step": 9891 + }, + { + "epoch": 0.3, + "learning_rate": 4.115951360673255e-06, + "loss": 1.228, + "step": 9892 + }, + { + "epoch": 0.3, + "learning_rate": 4.115765238278153e-06, + "loss": 1.244, + "step": 9893 + }, + { + "epoch": 0.3, + "learning_rate": 4.115579100501743e-06, + "loss": 1.2045, + "step": 9894 + }, + { + "epoch": 0.3, + "learning_rate": 4.115392947345799e-06, + "loss": 1.1718, + "step": 9895 + }, + { + "epoch": 0.3, + "learning_rate": 4.115206778812092e-06, + "loss": 0.9818, + "step": 9896 + }, + { + "epoch": 0.3, + "learning_rate": 4.1150205949023945e-06, + "loss": 1.1551, + "step": 9897 + }, + { + "epoch": 0.3, + "learning_rate": 4.114834395618478e-06, + "loss": 1.1331, + "step": 9898 + }, + { + "epoch": 0.3, + "learning_rate": 4.114648180962116e-06, + "loss": 1.0781, + "step": 9899 + }, + { + "epoch": 0.3, + "learning_rate": 4.114461950935082e-06, + "loss": 1.0768, + "step": 9900 + }, + { + "epoch": 0.3, + "learning_rate": 4.114275705539147e-06, + "loss": 1.2082, + "step": 9901 + }, + { + "epoch": 0.3, + "learning_rate": 4.114089444776085e-06, + "loss": 1.1804, + "step": 9902 + }, + { + "epoch": 0.3, + "learning_rate": 4.113903168647669e-06, + "loss": 1.1207, + "step": 9903 + }, + { + "epoch": 0.3, + "learning_rate": 4.113716877155671e-06, + "loss": 1.1506, + "step": 9904 + }, + { + "epoch": 0.3, + "learning_rate": 4.113530570301867e-06, + "loss": 1.1027, + "step": 9905 + }, + { + "epoch": 0.3, + "learning_rate": 4.113344248088028e-06, + "loss": 1.1887, + "step": 9906 + }, + { + "epoch": 0.3, + "learning_rate": 4.113157910515929e-06, + "loss": 1.1719, + "step": 9907 + }, + { + "epoch": 0.3, + "learning_rate": 4.112971557587344e-06, + "loss": 1.1108, + "step": 9908 + }, + { + "epoch": 0.3, + "learning_rate": 4.112785189304046e-06, + "loss": 1.0629, + "step": 9909 + }, + { + "epoch": 0.3, + "learning_rate": 4.112598805667811e-06, + "loss": 1.2697, + "step": 9910 + }, + { + "epoch": 0.3, + "learning_rate": 4.112412406680411e-06, + "loss": 1.3131, + "step": 9911 + }, + { + "epoch": 0.3, + "learning_rate": 4.112225992343621e-06, + "loss": 1.1946, + "step": 9912 + }, + { + "epoch": 0.3, + "learning_rate": 4.112039562659217e-06, + "loss": 1.0739, + "step": 9913 + }, + { + "epoch": 0.3, + "learning_rate": 4.111853117628972e-06, + "loss": 1.1919, + "step": 9914 + }, + { + "epoch": 0.3, + "learning_rate": 4.111666657254663e-06, + "loss": 1.1151, + "step": 9915 + }, + { + "epoch": 0.3, + "learning_rate": 4.111480181538062e-06, + "loss": 1.1309, + "step": 9916 + }, + { + "epoch": 0.3, + "learning_rate": 4.111293690480947e-06, + "loss": 1.1885, + "step": 9917 + }, + { + "epoch": 0.3, + "learning_rate": 4.1111071840850905e-06, + "loss": 1.2582, + "step": 9918 + }, + { + "epoch": 0.3, + "learning_rate": 4.110920662352271e-06, + "loss": 1.2014, + "step": 9919 + }, + { + "epoch": 0.3, + "learning_rate": 4.110734125284262e-06, + "loss": 1.2196, + "step": 9920 + }, + { + "epoch": 0.3, + "learning_rate": 4.1105475728828405e-06, + "loss": 1.1223, + "step": 9921 + }, + { + "epoch": 0.3, + "learning_rate": 4.110361005149781e-06, + "loss": 1.161, + "step": 9922 + }, + { + "epoch": 0.3, + "learning_rate": 4.110174422086861e-06, + "loss": 1.2574, + "step": 9923 + }, + { + "epoch": 0.3, + "learning_rate": 4.109987823695855e-06, + "loss": 1.2155, + "step": 9924 + }, + { + "epoch": 0.3, + "learning_rate": 4.109801209978541e-06, + "loss": 1.1965, + "step": 9925 + }, + { + "epoch": 0.3, + "learning_rate": 4.109614580936695e-06, + "loss": 1.1501, + "step": 9926 + }, + { + "epoch": 0.3, + "learning_rate": 4.1094279365720925e-06, + "loss": 1.1118, + "step": 9927 + }, + { + "epoch": 0.3, + "learning_rate": 4.109241276886513e-06, + "loss": 1.058, + "step": 9928 + }, + { + "epoch": 0.3, + "learning_rate": 4.10905460188173e-06, + "loss": 1.2595, + "step": 9929 + }, + { + "epoch": 0.3, + "learning_rate": 4.108867911559523e-06, + "loss": 1.1948, + "step": 9930 + }, + { + "epoch": 0.3, + "learning_rate": 4.108681205921667e-06, + "loss": 1.2026, + "step": 9931 + }, + { + "epoch": 0.3, + "learning_rate": 4.108494484969942e-06, + "loss": 1.0459, + "step": 9932 + }, + { + "epoch": 0.3, + "learning_rate": 4.108307748706124e-06, + "loss": 1.0341, + "step": 9933 + }, + { + "epoch": 0.3, + "learning_rate": 4.10812099713199e-06, + "loss": 1.0862, + "step": 9934 + }, + { + "epoch": 0.3, + "learning_rate": 4.10793423024932e-06, + "loss": 1.0978, + "step": 9935 + }, + { + "epoch": 0.3, + "learning_rate": 4.107747448059889e-06, + "loss": 1.2947, + "step": 9936 + }, + { + "epoch": 0.3, + "learning_rate": 4.107560650565477e-06, + "loss": 1.2062, + "step": 9937 + }, + { + "epoch": 0.3, + "learning_rate": 4.107373837767863e-06, + "loss": 1.0739, + "step": 9938 + }, + { + "epoch": 0.3, + "learning_rate": 4.107187009668823e-06, + "loss": 1.1517, + "step": 9939 + }, + { + "epoch": 0.3, + "learning_rate": 4.107000166270137e-06, + "loss": 1.1888, + "step": 9940 + }, + { + "epoch": 0.3, + "learning_rate": 4.106813307573584e-06, + "loss": 1.1345, + "step": 9941 + }, + { + "epoch": 0.3, + "learning_rate": 4.106626433580941e-06, + "loss": 1.0248, + "step": 9942 + }, + { + "epoch": 0.3, + "learning_rate": 4.106439544293989e-06, + "loss": 1.2134, + "step": 9943 + }, + { + "epoch": 0.3, + "learning_rate": 4.106252639714506e-06, + "loss": 1.1412, + "step": 9944 + }, + { + "epoch": 0.3, + "learning_rate": 4.106065719844272e-06, + "loss": 1.1289, + "step": 9945 + }, + { + "epoch": 0.3, + "learning_rate": 4.105878784685064e-06, + "loss": 1.152, + "step": 9946 + }, + { + "epoch": 0.3, + "learning_rate": 4.105691834238665e-06, + "loss": 1.1224, + "step": 9947 + }, + { + "epoch": 0.3, + "learning_rate": 4.105504868506853e-06, + "loss": 1.1908, + "step": 9948 + }, + { + "epoch": 0.3, + "learning_rate": 4.1053178874914075e-06, + "loss": 1.0343, + "step": 9949 + }, + { + "epoch": 0.3, + "learning_rate": 4.105130891194109e-06, + "loss": 1.0865, + "step": 9950 + }, + { + "epoch": 0.3, + "learning_rate": 4.104943879616738e-06, + "loss": 1.1331, + "step": 9951 + }, + { + "epoch": 0.3, + "learning_rate": 4.104756852761073e-06, + "loss": 1.1252, + "step": 9952 + }, + { + "epoch": 0.3, + "learning_rate": 4.1045698106288966e-06, + "loss": 1.1588, + "step": 9953 + }, + { + "epoch": 0.3, + "learning_rate": 4.104382753221988e-06, + "loss": 1.0928, + "step": 9954 + }, + { + "epoch": 0.3, + "learning_rate": 4.104195680542129e-06, + "loss": 1.144, + "step": 9955 + }, + { + "epoch": 0.3, + "learning_rate": 4.104008592591099e-06, + "loss": 1.2859, + "step": 9956 + }, + { + "epoch": 0.3, + "learning_rate": 4.103821489370679e-06, + "loss": 1.2067, + "step": 9957 + }, + { + "epoch": 0.3, + "learning_rate": 4.103634370882653e-06, + "loss": 1.1135, + "step": 9958 + }, + { + "epoch": 0.3, + "learning_rate": 4.103447237128798e-06, + "loss": 1.0145, + "step": 9959 + }, + { + "epoch": 0.3, + "learning_rate": 4.103260088110899e-06, + "loss": 1.132, + "step": 9960 + }, + { + "epoch": 0.3, + "learning_rate": 4.103072923830735e-06, + "loss": 1.0706, + "step": 9961 + }, + { + "epoch": 0.3, + "learning_rate": 4.10288574429009e-06, + "loss": 1.1431, + "step": 9962 + }, + { + "epoch": 0.3, + "learning_rate": 4.102698549490743e-06, + "loss": 1.1324, + "step": 9963 + }, + { + "epoch": 0.3, + "learning_rate": 4.1025113394344795e-06, + "loss": 1.1288, + "step": 9964 + }, + { + "epoch": 0.3, + "learning_rate": 4.102324114123079e-06, + "loss": 1.1053, + "step": 9965 + }, + { + "epoch": 0.3, + "learning_rate": 4.102136873558325e-06, + "loss": 1.1105, + "step": 9966 + }, + { + "epoch": 0.3, + "learning_rate": 4.1019496177419995e-06, + "loss": 1.0883, + "step": 9967 + }, + { + "epoch": 0.3, + "learning_rate": 4.101762346675885e-06, + "loss": 1.129, + "step": 9968 + }, + { + "epoch": 0.3, + "learning_rate": 4.101575060361764e-06, + "loss": 1.1165, + "step": 9969 + }, + { + "epoch": 0.3, + "learning_rate": 4.10138775880142e-06, + "loss": 1.0329, + "step": 9970 + }, + { + "epoch": 0.3, + "learning_rate": 4.101200441996636e-06, + "loss": 1.1515, + "step": 9971 + }, + { + "epoch": 0.3, + "learning_rate": 4.101013109949195e-06, + "loss": 1.1216, + "step": 9972 + }, + { + "epoch": 0.3, + "learning_rate": 4.10082576266088e-06, + "loss": 1.0887, + "step": 9973 + }, + { + "epoch": 0.3, + "learning_rate": 4.100638400133475e-06, + "loss": 1.1234, + "step": 9974 + }, + { + "epoch": 0.3, + "learning_rate": 4.100451022368763e-06, + "loss": 1.2047, + "step": 9975 + }, + { + "epoch": 0.3, + "learning_rate": 4.100263629368528e-06, + "loss": 1.1671, + "step": 9976 + }, + { + "epoch": 0.3, + "learning_rate": 4.1000762211345545e-06, + "loss": 1.0895, + "step": 9977 + }, + { + "epoch": 0.3, + "learning_rate": 4.099888797668626e-06, + "loss": 1.0972, + "step": 9978 + }, + { + "epoch": 0.3, + "learning_rate": 4.099701358972527e-06, + "loss": 1.0827, + "step": 9979 + }, + { + "epoch": 0.3, + "learning_rate": 4.0995139050480406e-06, + "loss": 1.0312, + "step": 9980 + }, + { + "epoch": 0.3, + "learning_rate": 4.099326435896952e-06, + "loss": 1.2051, + "step": 9981 + }, + { + "epoch": 0.3, + "learning_rate": 4.099138951521047e-06, + "loss": 1.0886, + "step": 9982 + }, + { + "epoch": 0.3, + "learning_rate": 4.098951451922108e-06, + "loss": 1.069, + "step": 9983 + }, + { + "epoch": 0.3, + "learning_rate": 4.098763937101923e-06, + "loss": 1.1318, + "step": 9984 + }, + { + "epoch": 0.3, + "learning_rate": 4.0985764070622735e-06, + "loss": 1.131, + "step": 9985 + }, + { + "epoch": 0.3, + "learning_rate": 4.098388861804948e-06, + "loss": 1.165, + "step": 9986 + }, + { + "epoch": 0.3, + "learning_rate": 4.09820130133173e-06, + "loss": 1.0767, + "step": 9987 + }, + { + "epoch": 0.3, + "learning_rate": 4.098013725644405e-06, + "loss": 1.2391, + "step": 9988 + }, + { + "epoch": 0.3, + "learning_rate": 4.097826134744758e-06, + "loss": 1.152, + "step": 9989 + }, + { + "epoch": 0.3, + "learning_rate": 4.097638528634578e-06, + "loss": 1.1578, + "step": 9990 + }, + { + "epoch": 0.3, + "learning_rate": 4.097450907315647e-06, + "loss": 1.1172, + "step": 9991 + }, + { + "epoch": 0.3, + "learning_rate": 4.097263270789753e-06, + "loss": 1.1099, + "step": 9992 + }, + { + "epoch": 0.3, + "learning_rate": 4.097075619058682e-06, + "loss": 1.1518, + "step": 9993 + }, + { + "epoch": 0.3, + "learning_rate": 4.09688795212422e-06, + "loss": 1.0294, + "step": 9994 + }, + { + "epoch": 0.3, + "learning_rate": 4.096700269988154e-06, + "loss": 1.0969, + "step": 9995 + }, + { + "epoch": 0.3, + "learning_rate": 4.096512572652271e-06, + "loss": 1.1898, + "step": 9996 + }, + { + "epoch": 0.3, + "learning_rate": 4.096324860118357e-06, + "loss": 1.1284, + "step": 9997 + }, + { + "epoch": 0.3, + "learning_rate": 4.096137132388199e-06, + "loss": 1.1827, + "step": 9998 + }, + { + "epoch": 0.3, + "learning_rate": 4.095949389463584e-06, + "loss": 1.2163, + "step": 9999 + }, + { + "epoch": 0.3, + "learning_rate": 4.0957616313463e-06, + "loss": 1.0914, + "step": 10000 + }, + { + "epoch": 0.3, + "learning_rate": 4.0955738580381335e-06, + "loss": 1.1614, + "step": 10001 + }, + { + "epoch": 0.3, + "learning_rate": 4.095386069540872e-06, + "loss": 1.0653, + "step": 10002 + }, + { + "epoch": 0.3, + "learning_rate": 4.095198265856304e-06, + "loss": 1.1837, + "step": 10003 + }, + { + "epoch": 0.3, + "learning_rate": 4.095010446986216e-06, + "loss": 1.1422, + "step": 10004 + }, + { + "epoch": 0.3, + "learning_rate": 4.094822612932397e-06, + "loss": 1.2029, + "step": 10005 + }, + { + "epoch": 0.3, + "learning_rate": 4.094634763696635e-06, + "loss": 1.1937, + "step": 10006 + }, + { + "epoch": 0.3, + "learning_rate": 4.094446899280719e-06, + "loss": 1.2389, + "step": 10007 + }, + { + "epoch": 0.3, + "learning_rate": 4.094259019686435e-06, + "loss": 1.105, + "step": 10008 + }, + { + "epoch": 0.3, + "learning_rate": 4.094071124915573e-06, + "loss": 1.0355, + "step": 10009 + }, + { + "epoch": 0.3, + "learning_rate": 4.093883214969922e-06, + "loss": 1.0706, + "step": 10010 + }, + { + "epoch": 0.3, + "learning_rate": 4.093695289851271e-06, + "loss": 1.2085, + "step": 10011 + }, + { + "epoch": 0.3, + "learning_rate": 4.0935073495614085e-06, + "loss": 1.3231, + "step": 10012 + }, + { + "epoch": 0.3, + "learning_rate": 4.093319394102123e-06, + "loss": 1.129, + "step": 10013 + }, + { + "epoch": 0.3, + "learning_rate": 4.093131423475204e-06, + "loss": 1.1317, + "step": 10014 + }, + { + "epoch": 0.3, + "learning_rate": 4.092943437682441e-06, + "loss": 1.1503, + "step": 10015 + }, + { + "epoch": 0.3, + "learning_rate": 4.092755436725624e-06, + "loss": 1.1278, + "step": 10016 + }, + { + "epoch": 0.3, + "learning_rate": 4.092567420606542e-06, + "loss": 1.1334, + "step": 10017 + }, + { + "epoch": 0.3, + "learning_rate": 4.092379389326986e-06, + "loss": 1.2568, + "step": 10018 + }, + { + "epoch": 0.3, + "learning_rate": 4.092191342888745e-06, + "loss": 0.9924, + "step": 10019 + }, + { + "epoch": 0.3, + "learning_rate": 4.092003281293608e-06, + "loss": 1.116, + "step": 10020 + }, + { + "epoch": 0.3, + "learning_rate": 4.091815204543368e-06, + "loss": 1.1427, + "step": 10021 + }, + { + "epoch": 0.3, + "learning_rate": 4.091627112639813e-06, + "loss": 1.0361, + "step": 10022 + }, + { + "epoch": 0.3, + "learning_rate": 4.091439005584735e-06, + "loss": 1.1656, + "step": 10023 + }, + { + "epoch": 0.3, + "learning_rate": 4.091250883379924e-06, + "loss": 1.0895, + "step": 10024 + }, + { + "epoch": 0.3, + "learning_rate": 4.09106274602717e-06, + "loss": 1.1416, + "step": 10025 + }, + { + "epoch": 0.3, + "learning_rate": 4.090874593528265e-06, + "loss": 1.1525, + "step": 10026 + }, + { + "epoch": 0.3, + "learning_rate": 4.090686425885002e-06, + "loss": 1.2397, + "step": 10027 + }, + { + "epoch": 0.3, + "learning_rate": 4.0904982430991695e-06, + "loss": 1.0984, + "step": 10028 + }, + { + "epoch": 0.3, + "learning_rate": 4.090310045172559e-06, + "loss": 1.1357, + "step": 10029 + }, + { + "epoch": 0.3, + "learning_rate": 4.090121832106962e-06, + "loss": 1.1328, + "step": 10030 + }, + { + "epoch": 0.3, + "learning_rate": 4.089933603904173e-06, + "loss": 1.074, + "step": 10031 + }, + { + "epoch": 0.3, + "learning_rate": 4.089745360565981e-06, + "loss": 1.1788, + "step": 10032 + }, + { + "epoch": 0.3, + "learning_rate": 4.0895571020941784e-06, + "loss": 1.1847, + "step": 10033 + }, + { + "epoch": 0.3, + "learning_rate": 4.0893688284905585e-06, + "loss": 1.2043, + "step": 10034 + }, + { + "epoch": 0.3, + "learning_rate": 4.0891805397569124e-06, + "loss": 1.1945, + "step": 10035 + }, + { + "epoch": 0.3, + "learning_rate": 4.088992235895033e-06, + "loss": 1.1995, + "step": 10036 + }, + { + "epoch": 0.3, + "learning_rate": 4.088803916906712e-06, + "loss": 1.1744, + "step": 10037 + }, + { + "epoch": 0.3, + "learning_rate": 4.0886155827937445e-06, + "loss": 1.0411, + "step": 10038 + }, + { + "epoch": 0.3, + "learning_rate": 4.088427233557921e-06, + "loss": 1.0939, + "step": 10039 + }, + { + "epoch": 0.3, + "learning_rate": 4.088238869201035e-06, + "loss": 1.1204, + "step": 10040 + }, + { + "epoch": 0.3, + "learning_rate": 4.08805048972488e-06, + "loss": 1.2311, + "step": 10041 + }, + { + "epoch": 0.3, + "learning_rate": 4.087862095131249e-06, + "loss": 1.1502, + "step": 10042 + }, + { + "epoch": 0.3, + "learning_rate": 4.087673685421936e-06, + "loss": 1.1774, + "step": 10043 + }, + { + "epoch": 0.3, + "learning_rate": 4.087485260598734e-06, + "loss": 1.124, + "step": 10044 + }, + { + "epoch": 0.3, + "learning_rate": 4.0872968206634366e-06, + "loss": 1.1833, + "step": 10045 + }, + { + "epoch": 0.3, + "learning_rate": 4.087108365617838e-06, + "loss": 1.1857, + "step": 10046 + }, + { + "epoch": 0.3, + "learning_rate": 4.086919895463733e-06, + "loss": 0.9757, + "step": 10047 + }, + { + "epoch": 0.3, + "learning_rate": 4.086731410202914e-06, + "loss": 1.1901, + "step": 10048 + }, + { + "epoch": 0.3, + "learning_rate": 4.086542909837176e-06, + "loss": 1.1264, + "step": 10049 + }, + { + "epoch": 0.3, + "learning_rate": 4.086354394368314e-06, + "loss": 1.2325, + "step": 10050 + }, + { + "epoch": 0.3, + "learning_rate": 4.086165863798123e-06, + "loss": 1.1382, + "step": 10051 + }, + { + "epoch": 0.3, + "learning_rate": 4.085977318128395e-06, + "loss": 1.0564, + "step": 10052 + }, + { + "epoch": 0.3, + "learning_rate": 4.085788757360929e-06, + "loss": 1.0932, + "step": 10053 + }, + { + "epoch": 0.3, + "learning_rate": 4.085600181497516e-06, + "loss": 1.1896, + "step": 10054 + }, + { + "epoch": 0.3, + "learning_rate": 4.085411590539954e-06, + "loss": 1.1016, + "step": 10055 + }, + { + "epoch": 0.3, + "learning_rate": 4.085222984490036e-06, + "loss": 1.2921, + "step": 10056 + }, + { + "epoch": 0.3, + "learning_rate": 4.08503436334956e-06, + "loss": 1.2048, + "step": 10057 + }, + { + "epoch": 0.3, + "learning_rate": 4.084845727120319e-06, + "loss": 1.1332, + "step": 10058 + }, + { + "epoch": 0.3, + "learning_rate": 4.0846570758041115e-06, + "loss": 1.0916, + "step": 10059 + }, + { + "epoch": 0.3, + "learning_rate": 4.08446840940273e-06, + "loss": 1.2599, + "step": 10060 + }, + { + "epoch": 0.3, + "learning_rate": 4.0842797279179735e-06, + "loss": 1.04, + "step": 10061 + }, + { + "epoch": 0.3, + "learning_rate": 4.084091031351637e-06, + "loss": 1.2423, + "step": 10062 + }, + { + "epoch": 0.3, + "learning_rate": 4.083902319705517e-06, + "loss": 1.1963, + "step": 10063 + }, + { + "epoch": 0.3, + "learning_rate": 4.0837135929814085e-06, + "loss": 1.1412, + "step": 10064 + }, + { + "epoch": 0.3, + "learning_rate": 4.083524851181111e-06, + "loss": 1.197, + "step": 10065 + }, + { + "epoch": 0.3, + "learning_rate": 4.083336094306419e-06, + "loss": 1.215, + "step": 10066 + }, + { + "epoch": 0.3, + "learning_rate": 4.083147322359129e-06, + "loss": 1.0853, + "step": 10067 + }, + { + "epoch": 0.3, + "learning_rate": 4.08295853534104e-06, + "loss": 1.254, + "step": 10068 + }, + { + "epoch": 0.3, + "learning_rate": 4.082769733253948e-06, + "loss": 1.2221, + "step": 10069 + }, + { + "epoch": 0.3, + "learning_rate": 4.0825809160996495e-06, + "loss": 1.1762, + "step": 10070 + }, + { + "epoch": 0.3, + "learning_rate": 4.082392083879944e-06, + "loss": 1.0903, + "step": 10071 + }, + { + "epoch": 0.3, + "learning_rate": 4.082203236596628e-06, + "loss": 1.0743, + "step": 10072 + }, + { + "epoch": 0.3, + "learning_rate": 4.082014374251498e-06, + "loss": 1.2034, + "step": 10073 + }, + { + "epoch": 0.3, + "learning_rate": 4.081825496846354e-06, + "loss": 1.2487, + "step": 10074 + }, + { + "epoch": 0.3, + "learning_rate": 4.081636604382994e-06, + "loss": 1.2573, + "step": 10075 + }, + { + "epoch": 0.3, + "learning_rate": 4.081447696863214e-06, + "loss": 1.1698, + "step": 10076 + }, + { + "epoch": 0.3, + "learning_rate": 4.081258774288814e-06, + "loss": 1.1201, + "step": 10077 + }, + { + "epoch": 0.3, + "learning_rate": 4.081069836661591e-06, + "loss": 1.1195, + "step": 10078 + }, + { + "epoch": 0.3, + "learning_rate": 4.0808808839833455e-06, + "loss": 1.1664, + "step": 10079 + }, + { + "epoch": 0.3, + "learning_rate": 4.080691916255875e-06, + "loss": 1.1678, + "step": 10080 + }, + { + "epoch": 0.3, + "learning_rate": 4.08050293348098e-06, + "loss": 1.0999, + "step": 10081 + }, + { + "epoch": 0.3, + "learning_rate": 4.080313935660456e-06, + "loss": 1.1555, + "step": 10082 + }, + { + "epoch": 0.3, + "learning_rate": 4.0801249227961065e-06, + "loss": 1.1567, + "step": 10083 + }, + { + "epoch": 0.3, + "learning_rate": 4.079935894889728e-06, + "loss": 1.1218, + "step": 10084 + }, + { + "epoch": 0.3, + "learning_rate": 4.07974685194312e-06, + "loss": 1.1613, + "step": 10085 + }, + { + "epoch": 0.3, + "learning_rate": 4.0795577939580844e-06, + "loss": 0.9985, + "step": 10086 + }, + { + "epoch": 0.3, + "learning_rate": 4.079368720936418e-06, + "loss": 1.1166, + "step": 10087 + }, + { + "epoch": 0.3, + "learning_rate": 4.079179632879923e-06, + "loss": 1.1261, + "step": 10088 + }, + { + "epoch": 0.3, + "learning_rate": 4.078990529790398e-06, + "loss": 1.1124, + "step": 10089 + }, + { + "epoch": 0.3, + "learning_rate": 4.078801411669643e-06, + "loss": 1.0189, + "step": 10090 + }, + { + "epoch": 0.3, + "learning_rate": 4.078612278519459e-06, + "loss": 1.1625, + "step": 10091 + }, + { + "epoch": 0.3, + "learning_rate": 4.078423130341648e-06, + "loss": 1.1736, + "step": 10092 + }, + { + "epoch": 0.3, + "learning_rate": 4.078233967138007e-06, + "loss": 1.2054, + "step": 10093 + }, + { + "epoch": 0.3, + "learning_rate": 4.07804478891034e-06, + "loss": 1.163, + "step": 10094 + }, + { + "epoch": 0.3, + "learning_rate": 4.077855595660446e-06, + "loss": 1.1141, + "step": 10095 + }, + { + "epoch": 0.3, + "learning_rate": 4.077666387390127e-06, + "loss": 1.085, + "step": 10096 + }, + { + "epoch": 0.3, + "learning_rate": 4.077477164101183e-06, + "loss": 1.0945, + "step": 10097 + }, + { + "epoch": 0.3, + "learning_rate": 4.077287925795418e-06, + "loss": 1.141, + "step": 10098 + }, + { + "epoch": 0.3, + "learning_rate": 4.07709867247463e-06, + "loss": 1.002, + "step": 10099 + }, + { + "epoch": 0.3, + "learning_rate": 4.076909404140622e-06, + "loss": 1.0905, + "step": 10100 + }, + { + "epoch": 0.3, + "learning_rate": 4.0767201207951975e-06, + "loss": 1.2178, + "step": 10101 + }, + { + "epoch": 0.3, + "learning_rate": 4.076530822440156e-06, + "loss": 1.1934, + "step": 10102 + }, + { + "epoch": 0.3, + "learning_rate": 4.0763415090773e-06, + "loss": 1.0613, + "step": 10103 + }, + { + "epoch": 0.3, + "learning_rate": 4.076152180708433e-06, + "loss": 1.1722, + "step": 10104 + }, + { + "epoch": 0.3, + "learning_rate": 4.075962837335356e-06, + "loss": 1.2038, + "step": 10105 + }, + { + "epoch": 0.3, + "learning_rate": 4.07577347895987e-06, + "loss": 1.305, + "step": 10106 + }, + { + "epoch": 0.3, + "learning_rate": 4.075584105583782e-06, + "loss": 1.1104, + "step": 10107 + }, + { + "epoch": 0.3, + "learning_rate": 4.07539471720889e-06, + "loss": 1.1353, + "step": 10108 + }, + { + "epoch": 0.3, + "learning_rate": 4.075205313837e-06, + "loss": 1.2454, + "step": 10109 + }, + { + "epoch": 0.3, + "learning_rate": 4.075015895469915e-06, + "loss": 1.1125, + "step": 10110 + }, + { + "epoch": 0.3, + "learning_rate": 4.074826462109436e-06, + "loss": 1.1473, + "step": 10111 + }, + { + "epoch": 0.3, + "learning_rate": 4.074637013757368e-06, + "loss": 1.2164, + "step": 10112 + }, + { + "epoch": 0.3, + "learning_rate": 4.074447550415513e-06, + "loss": 1.1144, + "step": 10113 + }, + { + "epoch": 0.3, + "learning_rate": 4.074258072085677e-06, + "loss": 1.0328, + "step": 10114 + }, + { + "epoch": 0.3, + "learning_rate": 4.074068578769661e-06, + "loss": 1.2117, + "step": 10115 + }, + { + "epoch": 0.3, + "learning_rate": 4.073879070469271e-06, + "loss": 1.1312, + "step": 10116 + }, + { + "epoch": 0.3, + "learning_rate": 4.073689547186311e-06, + "loss": 1.0637, + "step": 10117 + }, + { + "epoch": 0.3, + "learning_rate": 4.073500008922583e-06, + "loss": 1.0377, + "step": 10118 + }, + { + "epoch": 0.3, + "learning_rate": 4.073310455679894e-06, + "loss": 1.1194, + "step": 10119 + }, + { + "epoch": 0.3, + "learning_rate": 4.073120887460047e-06, + "loss": 1.1047, + "step": 10120 + }, + { + "epoch": 0.3, + "learning_rate": 4.072931304264846e-06, + "loss": 1.0847, + "step": 10121 + }, + { + "epoch": 0.3, + "learning_rate": 4.072741706096097e-06, + "loss": 1.2738, + "step": 10122 + }, + { + "epoch": 0.3, + "learning_rate": 4.072552092955604e-06, + "loss": 1.1864, + "step": 10123 + }, + { + "epoch": 0.3, + "learning_rate": 4.072362464845173e-06, + "loss": 1.2369, + "step": 10124 + }, + { + "epoch": 0.31, + "learning_rate": 4.072172821766608e-06, + "loss": 1.1143, + "step": 10125 + }, + { + "epoch": 0.31, + "learning_rate": 4.0719831637217154e-06, + "loss": 1.1852, + "step": 10126 + }, + { + "epoch": 0.31, + "learning_rate": 4.0717934907123e-06, + "loss": 1.0833, + "step": 10127 + }, + { + "epoch": 0.31, + "learning_rate": 4.071603802740168e-06, + "loss": 1.1497, + "step": 10128 + }, + { + "epoch": 0.31, + "learning_rate": 4.071414099807125e-06, + "loss": 1.1605, + "step": 10129 + }, + { + "epoch": 0.31, + "learning_rate": 4.0712243819149755e-06, + "loss": 1.098, + "step": 10130 + }, + { + "epoch": 0.31, + "learning_rate": 4.071034649065528e-06, + "loss": 1.122, + "step": 10131 + }, + { + "epoch": 0.31, + "learning_rate": 4.070844901260586e-06, + "loss": 1.1776, + "step": 10132 + }, + { + "epoch": 0.31, + "learning_rate": 4.070655138501956e-06, + "loss": 1.1677, + "step": 10133 + }, + { + "epoch": 0.31, + "learning_rate": 4.070465360791448e-06, + "loss": 1.1572, + "step": 10134 + }, + { + "epoch": 0.31, + "learning_rate": 4.070275568130865e-06, + "loss": 1.1218, + "step": 10135 + }, + { + "epoch": 0.31, + "learning_rate": 4.070085760522015e-06, + "loss": 1.2822, + "step": 10136 + }, + { + "epoch": 0.31, + "learning_rate": 4.069895937966705e-06, + "loss": 1.2728, + "step": 10137 + }, + { + "epoch": 0.31, + "learning_rate": 4.069706100466741e-06, + "loss": 1.0971, + "step": 10138 + }, + { + "epoch": 0.31, + "learning_rate": 4.0695162480239315e-06, + "loss": 1.101, + "step": 10139 + }, + { + "epoch": 0.31, + "learning_rate": 4.069326380640083e-06, + "loss": 1.1124, + "step": 10140 + }, + { + "epoch": 0.31, + "learning_rate": 4.0691364983170035e-06, + "loss": 1.2338, + "step": 10141 + }, + { + "epoch": 0.31, + "learning_rate": 4.0689466010565006e-06, + "loss": 1.1014, + "step": 10142 + }, + { + "epoch": 0.31, + "learning_rate": 4.06875668886038e-06, + "loss": 1.2367, + "step": 10143 + }, + { + "epoch": 0.31, + "learning_rate": 4.068566761730453e-06, + "loss": 1.0699, + "step": 10144 + }, + { + "epoch": 0.31, + "learning_rate": 4.068376819668525e-06, + "loss": 1.1138, + "step": 10145 + }, + { + "epoch": 0.31, + "learning_rate": 4.068186862676405e-06, + "loss": 1.1321, + "step": 10146 + }, + { + "epoch": 0.31, + "learning_rate": 4.067996890755902e-06, + "loss": 1.2275, + "step": 10147 + }, + { + "epoch": 0.31, + "learning_rate": 4.0678069039088236e-06, + "loss": 1.0549, + "step": 10148 + }, + { + "epoch": 0.31, + "learning_rate": 4.067616902136978e-06, + "loss": 1.2181, + "step": 10149 + }, + { + "epoch": 0.31, + "learning_rate": 4.067426885442175e-06, + "loss": 1.0813, + "step": 10150 + }, + { + "epoch": 0.31, + "learning_rate": 4.067236853826223e-06, + "loss": 1.1931, + "step": 10151 + }, + { + "epoch": 0.31, + "learning_rate": 4.067046807290931e-06, + "loss": 1.1769, + "step": 10152 + }, + { + "epoch": 0.31, + "learning_rate": 4.066856745838107e-06, + "loss": 1.2437, + "step": 10153 + }, + { + "epoch": 0.31, + "learning_rate": 4.0666666694695625e-06, + "loss": 1.234, + "step": 10154 + }, + { + "epoch": 0.31, + "learning_rate": 4.066476578187106e-06, + "loss": 1.2228, + "step": 10155 + }, + { + "epoch": 0.31, + "learning_rate": 4.0662864719925465e-06, + "loss": 1.1017, + "step": 10156 + }, + { + "epoch": 0.31, + "learning_rate": 4.0660963508876935e-06, + "loss": 0.9763, + "step": 10157 + }, + { + "epoch": 0.31, + "learning_rate": 4.065906214874359e-06, + "loss": 1.0759, + "step": 10158 + }, + { + "epoch": 0.31, + "learning_rate": 4.0657160639543506e-06, + "loss": 1.1483, + "step": 10159 + }, + { + "epoch": 0.31, + "learning_rate": 4.065525898129478e-06, + "loss": 1.1333, + "step": 10160 + }, + { + "epoch": 0.31, + "learning_rate": 4.065335717401555e-06, + "loss": 1.1536, + "step": 10161 + }, + { + "epoch": 0.31, + "learning_rate": 4.065145521772389e-06, + "loss": 1.1459, + "step": 10162 + }, + { + "epoch": 0.31, + "learning_rate": 4.064955311243792e-06, + "loss": 1.0714, + "step": 10163 + }, + { + "epoch": 0.31, + "learning_rate": 4.064765085817574e-06, + "loss": 1.1463, + "step": 10164 + }, + { + "epoch": 0.31, + "learning_rate": 4.064574845495545e-06, + "loss": 1.0656, + "step": 10165 + }, + { + "epoch": 0.31, + "learning_rate": 4.064384590279517e-06, + "loss": 1.2289, + "step": 10166 + }, + { + "epoch": 0.31, + "learning_rate": 4.064194320171303e-06, + "loss": 1.0198, + "step": 10167 + }, + { + "epoch": 0.31, + "learning_rate": 4.064004035172711e-06, + "loss": 1.1606, + "step": 10168 + }, + { + "epoch": 0.31, + "learning_rate": 4.063813735285554e-06, + "loss": 1.1411, + "step": 10169 + }, + { + "epoch": 0.31, + "learning_rate": 4.063623420511643e-06, + "loss": 1.0795, + "step": 10170 + }, + { + "epoch": 0.31, + "learning_rate": 4.0634330908527905e-06, + "loss": 1.1871, + "step": 10171 + }, + { + "epoch": 0.31, + "learning_rate": 4.063242746310808e-06, + "loss": 1.0734, + "step": 10172 + }, + { + "epoch": 0.31, + "learning_rate": 4.0630523868875075e-06, + "loss": 1.2523, + "step": 10173 + }, + { + "epoch": 0.31, + "learning_rate": 4.062862012584702e-06, + "loss": 1.0998, + "step": 10174 + }, + { + "epoch": 0.31, + "learning_rate": 4.062671623404201e-06, + "loss": 1.1341, + "step": 10175 + }, + { + "epoch": 0.31, + "learning_rate": 4.06248121934782e-06, + "loss": 1.1763, + "step": 10176 + }, + { + "epoch": 0.31, + "learning_rate": 4.06229080041737e-06, + "loss": 1.0812, + "step": 10177 + }, + { + "epoch": 0.31, + "learning_rate": 4.062100366614664e-06, + "loss": 1.1714, + "step": 10178 + }, + { + "epoch": 0.31, + "learning_rate": 4.061909917941515e-06, + "loss": 1.0039, + "step": 10179 + }, + { + "epoch": 0.31, + "learning_rate": 4.061719454399735e-06, + "loss": 1.1827, + "step": 10180 + }, + { + "epoch": 0.31, + "learning_rate": 4.061528975991138e-06, + "loss": 1.2041, + "step": 10181 + }, + { + "epoch": 0.31, + "learning_rate": 4.0613384827175386e-06, + "loss": 1.1453, + "step": 10182 + }, + { + "epoch": 0.31, + "learning_rate": 4.061147974580748e-06, + "loss": 1.0822, + "step": 10183 + }, + { + "epoch": 0.31, + "learning_rate": 4.0609574515825805e-06, + "loss": 1.1788, + "step": 10184 + }, + { + "epoch": 0.31, + "learning_rate": 4.060766913724849e-06, + "loss": 1.1097, + "step": 10185 + }, + { + "epoch": 0.31, + "learning_rate": 4.06057636100937e-06, + "loss": 1.0635, + "step": 10186 + }, + { + "epoch": 0.31, + "learning_rate": 4.060385793437954e-06, + "loss": 1.0522, + "step": 10187 + }, + { + "epoch": 0.31, + "learning_rate": 4.060195211012418e-06, + "loss": 1.1661, + "step": 10188 + }, + { + "epoch": 0.31, + "learning_rate": 4.060004613734574e-06, + "loss": 1.1008, + "step": 10189 + }, + { + "epoch": 0.31, + "learning_rate": 4.059814001606238e-06, + "loss": 1.2606, + "step": 10190 + }, + { + "epoch": 0.31, + "learning_rate": 4.059623374629224e-06, + "loss": 1.116, + "step": 10191 + }, + { + "epoch": 0.31, + "learning_rate": 4.059432732805346e-06, + "loss": 1.1479, + "step": 10192 + }, + { + "epoch": 0.31, + "learning_rate": 4.0592420761364195e-06, + "loss": 1.261, + "step": 10193 + }, + { + "epoch": 0.31, + "learning_rate": 4.05905140462426e-06, + "loss": 1.2662, + "step": 10194 + }, + { + "epoch": 0.31, + "learning_rate": 4.0588607182706815e-06, + "loss": 1.045, + "step": 10195 + }, + { + "epoch": 0.31, + "learning_rate": 4.0586700170775e-06, + "loss": 1.0954, + "step": 10196 + }, + { + "epoch": 0.31, + "learning_rate": 4.0584793010465304e-06, + "loss": 1.2181, + "step": 10197 + }, + { + "epoch": 0.31, + "learning_rate": 4.058288570179589e-06, + "loss": 1.2256, + "step": 10198 + }, + { + "epoch": 0.31, + "learning_rate": 4.0580978244784905e-06, + "loss": 1.2106, + "step": 10199 + }, + { + "epoch": 0.31, + "learning_rate": 4.057907063945051e-06, + "loss": 1.0932, + "step": 10200 + }, + { + "epoch": 0.31, + "learning_rate": 4.0577162885810865e-06, + "loss": 1.1363, + "step": 10201 + }, + { + "epoch": 0.31, + "learning_rate": 4.057525498388414e-06, + "loss": 1.0909, + "step": 10202 + }, + { + "epoch": 0.31, + "learning_rate": 4.057334693368848e-06, + "loss": 1.1407, + "step": 10203 + }, + { + "epoch": 0.31, + "learning_rate": 4.057143873524206e-06, + "loss": 1.2061, + "step": 10204 + }, + { + "epoch": 0.31, + "learning_rate": 4.056953038856304e-06, + "loss": 1.172, + "step": 10205 + }, + { + "epoch": 0.31, + "learning_rate": 4.056762189366959e-06, + "loss": 1.1124, + "step": 10206 + }, + { + "epoch": 0.31, + "learning_rate": 4.056571325057988e-06, + "loss": 1.2313, + "step": 10207 + }, + { + "epoch": 0.31, + "learning_rate": 4.056380445931208e-06, + "loss": 1.0823, + "step": 10208 + }, + { + "epoch": 0.31, + "learning_rate": 4.056189551988435e-06, + "loss": 1.1032, + "step": 10209 + }, + { + "epoch": 0.31, + "learning_rate": 4.0559986432314865e-06, + "loss": 1.109, + "step": 10210 + }, + { + "epoch": 0.31, + "learning_rate": 4.0558077196621815e-06, + "loss": 1.0253, + "step": 10211 + }, + { + "epoch": 0.31, + "learning_rate": 4.055616781282335e-06, + "loss": 1.2036, + "step": 10212 + }, + { + "epoch": 0.31, + "learning_rate": 4.055425828093768e-06, + "loss": 1.12, + "step": 10213 + }, + { + "epoch": 0.31, + "learning_rate": 4.055234860098295e-06, + "loss": 1.1929, + "step": 10214 + }, + { + "epoch": 0.31, + "learning_rate": 4.0550438772977354e-06, + "loss": 1.1744, + "step": 10215 + }, + { + "epoch": 0.31, + "learning_rate": 4.054852879693906e-06, + "loss": 1.1407, + "step": 10216 + }, + { + "epoch": 0.31, + "learning_rate": 4.0546618672886275e-06, + "loss": 1.2477, + "step": 10217 + }, + { + "epoch": 0.31, + "learning_rate": 4.0544708400837165e-06, + "loss": 1.1721, + "step": 10218 + }, + { + "epoch": 0.31, + "learning_rate": 4.054279798080991e-06, + "loss": 1.0205, + "step": 10219 + }, + { + "epoch": 0.31, + "learning_rate": 4.054088741282271e-06, + "loss": 1.1035, + "step": 10220 + }, + { + "epoch": 0.31, + "learning_rate": 4.053897669689374e-06, + "loss": 1.1109, + "step": 10221 + }, + { + "epoch": 0.31, + "learning_rate": 4.05370658330412e-06, + "loss": 1.1222, + "step": 10222 + }, + { + "epoch": 0.31, + "learning_rate": 4.0535154821283275e-06, + "loss": 1.0482, + "step": 10223 + }, + { + "epoch": 0.31, + "learning_rate": 4.0533243661638165e-06, + "loss": 1.2543, + "step": 10224 + }, + { + "epoch": 0.31, + "learning_rate": 4.053133235412404e-06, + "loss": 1.0768, + "step": 10225 + }, + { + "epoch": 0.31, + "learning_rate": 4.052942089875913e-06, + "loss": 1.2316, + "step": 10226 + }, + { + "epoch": 0.31, + "learning_rate": 4.05275092955616e-06, + "loss": 1.1245, + "step": 10227 + }, + { + "epoch": 0.31, + "learning_rate": 4.052559754454966e-06, + "loss": 1.1315, + "step": 10228 + }, + { + "epoch": 0.31, + "learning_rate": 4.052368564574151e-06, + "loss": 1.1902, + "step": 10229 + }, + { + "epoch": 0.31, + "learning_rate": 4.052177359915536e-06, + "loss": 1.1949, + "step": 10230 + }, + { + "epoch": 0.31, + "learning_rate": 4.051986140480939e-06, + "loss": 1.0196, + "step": 10231 + }, + { + "epoch": 0.31, + "learning_rate": 4.051794906272182e-06, + "loss": 1.1765, + "step": 10232 + }, + { + "epoch": 0.31, + "learning_rate": 4.051603657291084e-06, + "loss": 1.0203, + "step": 10233 + }, + { + "epoch": 0.31, + "learning_rate": 4.051412393539468e-06, + "loss": 1.1162, + "step": 10234 + }, + { + "epoch": 0.31, + "learning_rate": 4.051221115019151e-06, + "loss": 1.1208, + "step": 10235 + }, + { + "epoch": 0.31, + "learning_rate": 4.051029821731958e-06, + "loss": 1.1666, + "step": 10236 + }, + { + "epoch": 0.31, + "learning_rate": 4.050838513679707e-06, + "loss": 1.1889, + "step": 10237 + }, + { + "epoch": 0.31, + "learning_rate": 4.050647190864221e-06, + "loss": 1.0987, + "step": 10238 + }, + { + "epoch": 0.31, + "learning_rate": 4.050455853287321e-06, + "loss": 1.0685, + "step": 10239 + }, + { + "epoch": 0.31, + "learning_rate": 4.050264500950826e-06, + "loss": 1.118, + "step": 10240 + }, + { + "epoch": 0.31, + "learning_rate": 4.0500731338565615e-06, + "loss": 1.2034, + "step": 10241 + }, + { + "epoch": 0.31, + "learning_rate": 4.049881752006346e-06, + "loss": 1.1823, + "step": 10242 + }, + { + "epoch": 0.31, + "learning_rate": 4.049690355402004e-06, + "loss": 1.207, + "step": 10243 + }, + { + "epoch": 0.31, + "learning_rate": 4.049498944045355e-06, + "loss": 1.201, + "step": 10244 + }, + { + "epoch": 0.31, + "learning_rate": 4.049307517938223e-06, + "loss": 1.1763, + "step": 10245 + }, + { + "epoch": 0.31, + "learning_rate": 4.049116077082429e-06, + "loss": 1.1572, + "step": 10246 + }, + { + "epoch": 0.31, + "learning_rate": 4.0489246214797965e-06, + "loss": 1.173, + "step": 10247 + }, + { + "epoch": 0.31, + "learning_rate": 4.048733151132147e-06, + "loss": 1.2016, + "step": 10248 + }, + { + "epoch": 0.31, + "learning_rate": 4.048541666041304e-06, + "loss": 1.1501, + "step": 10249 + }, + { + "epoch": 0.31, + "learning_rate": 4.048350166209091e-06, + "loss": 1.1863, + "step": 10250 + }, + { + "epoch": 0.31, + "learning_rate": 4.048158651637329e-06, + "loss": 1.2219, + "step": 10251 + }, + { + "epoch": 0.31, + "learning_rate": 4.047967122327844e-06, + "loss": 1.1171, + "step": 10252 + }, + { + "epoch": 0.31, + "learning_rate": 4.0477755782824556e-06, + "loss": 1.1216, + "step": 10253 + }, + { + "epoch": 0.31, + "learning_rate": 4.04758401950299e-06, + "loss": 1.0707, + "step": 10254 + }, + { + "epoch": 0.31, + "learning_rate": 4.047392445991269e-06, + "loss": 1.0812, + "step": 10255 + }, + { + "epoch": 0.31, + "learning_rate": 4.0472008577491185e-06, + "loss": 1.1754, + "step": 10256 + }, + { + "epoch": 0.31, + "learning_rate": 4.04700925477836e-06, + "loss": 1.2228, + "step": 10257 + }, + { + "epoch": 0.31, + "learning_rate": 4.046817637080819e-06, + "loss": 1.0179, + "step": 10258 + }, + { + "epoch": 0.31, + "learning_rate": 4.046626004658319e-06, + "loss": 1.1217, + "step": 10259 + }, + { + "epoch": 0.31, + "learning_rate": 4.046434357512684e-06, + "loss": 1.1237, + "step": 10260 + }, + { + "epoch": 0.31, + "learning_rate": 4.046242695645739e-06, + "loss": 1.2048, + "step": 10261 + }, + { + "epoch": 0.31, + "learning_rate": 4.046051019059308e-06, + "loss": 1.2523, + "step": 10262 + }, + { + "epoch": 0.31, + "learning_rate": 4.045859327755216e-06, + "loss": 1.2537, + "step": 10263 + }, + { + "epoch": 0.31, + "learning_rate": 4.045667621735288e-06, + "loss": 1.0999, + "step": 10264 + }, + { + "epoch": 0.31, + "learning_rate": 4.045475901001349e-06, + "loss": 1.0597, + "step": 10265 + }, + { + "epoch": 0.31, + "learning_rate": 4.0452841655552226e-06, + "loss": 1.1774, + "step": 10266 + }, + { + "epoch": 0.31, + "learning_rate": 4.045092415398736e-06, + "loss": 1.0837, + "step": 10267 + }, + { + "epoch": 0.31, + "learning_rate": 4.0449006505337125e-06, + "loss": 1.1476, + "step": 10268 + }, + { + "epoch": 0.31, + "learning_rate": 4.044708870961981e-06, + "loss": 1.0966, + "step": 10269 + }, + { + "epoch": 0.31, + "learning_rate": 4.044517076685364e-06, + "loss": 1.1435, + "step": 10270 + }, + { + "epoch": 0.31, + "learning_rate": 4.0443252677056875e-06, + "loss": 1.1859, + "step": 10271 + }, + { + "epoch": 0.31, + "learning_rate": 4.04413344402478e-06, + "loss": 1.0615, + "step": 10272 + }, + { + "epoch": 0.31, + "learning_rate": 4.043941605644464e-06, + "loss": 1.1167, + "step": 10273 + }, + { + "epoch": 0.31, + "learning_rate": 4.0437497525665685e-06, + "loss": 1.1609, + "step": 10274 + }, + { + "epoch": 0.31, + "learning_rate": 4.043557884792918e-06, + "loss": 1.076, + "step": 10275 + }, + { + "epoch": 0.31, + "learning_rate": 4.0433660023253405e-06, + "loss": 1.081, + "step": 10276 + }, + { + "epoch": 0.31, + "learning_rate": 4.043174105165661e-06, + "loss": 1.0626, + "step": 10277 + }, + { + "epoch": 0.31, + "learning_rate": 4.042982193315709e-06, + "loss": 1.1754, + "step": 10278 + }, + { + "epoch": 0.31, + "learning_rate": 4.042790266777308e-06, + "loss": 1.2939, + "step": 10279 + }, + { + "epoch": 0.31, + "learning_rate": 4.042598325552288e-06, + "loss": 1.1716, + "step": 10280 + }, + { + "epoch": 0.31, + "learning_rate": 4.042406369642475e-06, + "loss": 1.1556, + "step": 10281 + }, + { + "epoch": 0.31, + "learning_rate": 4.042214399049695e-06, + "loss": 1.1774, + "step": 10282 + }, + { + "epoch": 0.31, + "learning_rate": 4.042022413775777e-06, + "loss": 1.1431, + "step": 10283 + }, + { + "epoch": 0.31, + "learning_rate": 4.041830413822549e-06, + "loss": 1.092, + "step": 10284 + }, + { + "epoch": 0.31, + "learning_rate": 4.0416383991918365e-06, + "loss": 1.1396, + "step": 10285 + }, + { + "epoch": 0.31, + "learning_rate": 4.04144636988547e-06, + "loss": 1.1299, + "step": 10286 + }, + { + "epoch": 0.31, + "learning_rate": 4.041254325905277e-06, + "loss": 1.2035, + "step": 10287 + }, + { + "epoch": 0.31, + "learning_rate": 4.041062267253084e-06, + "loss": 1.121, + "step": 10288 + }, + { + "epoch": 0.31, + "learning_rate": 4.04087019393072e-06, + "loss": 1.145, + "step": 10289 + }, + { + "epoch": 0.31, + "learning_rate": 4.040678105940016e-06, + "loss": 1.1034, + "step": 10290 + }, + { + "epoch": 0.31, + "learning_rate": 4.040486003282797e-06, + "loss": 1.153, + "step": 10291 + }, + { + "epoch": 0.31, + "learning_rate": 4.0402938859608935e-06, + "loss": 1.1409, + "step": 10292 + }, + { + "epoch": 0.31, + "learning_rate": 4.040101753976133e-06, + "loss": 1.2387, + "step": 10293 + }, + { + "epoch": 0.31, + "learning_rate": 4.039909607330347e-06, + "loss": 1.2274, + "step": 10294 + }, + { + "epoch": 0.31, + "learning_rate": 4.039717446025363e-06, + "loss": 1.1188, + "step": 10295 + }, + { + "epoch": 0.31, + "learning_rate": 4.0395252700630095e-06, + "loss": 1.0495, + "step": 10296 + }, + { + "epoch": 0.31, + "learning_rate": 4.039333079445118e-06, + "loss": 1.1313, + "step": 10297 + }, + { + "epoch": 0.31, + "learning_rate": 4.039140874173516e-06, + "loss": 1.1692, + "step": 10298 + }, + { + "epoch": 0.31, + "learning_rate": 4.038948654250034e-06, + "loss": 1.0314, + "step": 10299 + }, + { + "epoch": 0.31, + "learning_rate": 4.038756419676503e-06, + "loss": 1.0992, + "step": 10300 + }, + { + "epoch": 0.31, + "learning_rate": 4.038564170454752e-06, + "loss": 1.0471, + "step": 10301 + }, + { + "epoch": 0.31, + "learning_rate": 4.038371906586611e-06, + "loss": 1.0923, + "step": 10302 + }, + { + "epoch": 0.31, + "learning_rate": 4.0381796280739095e-06, + "loss": 1.0692, + "step": 10303 + }, + { + "epoch": 0.31, + "learning_rate": 4.0379873349184795e-06, + "loss": 1.1288, + "step": 10304 + }, + { + "epoch": 0.31, + "learning_rate": 4.03779502712215e-06, + "loss": 1.3125, + "step": 10305 + }, + { + "epoch": 0.31, + "learning_rate": 4.037602704686754e-06, + "loss": 1.0709, + "step": 10306 + }, + { + "epoch": 0.31, + "learning_rate": 4.037410367614119e-06, + "loss": 1.1037, + "step": 10307 + }, + { + "epoch": 0.31, + "learning_rate": 4.0372180159060795e-06, + "loss": 1.0377, + "step": 10308 + }, + { + "epoch": 0.31, + "learning_rate": 4.037025649564463e-06, + "loss": 1.1296, + "step": 10309 + }, + { + "epoch": 0.31, + "learning_rate": 4.036833268591104e-06, + "loss": 1.0659, + "step": 10310 + }, + { + "epoch": 0.31, + "learning_rate": 4.0366408729878315e-06, + "loss": 1.2375, + "step": 10311 + }, + { + "epoch": 0.31, + "learning_rate": 4.036448462756478e-06, + "loss": 1.1771, + "step": 10312 + }, + { + "epoch": 0.31, + "learning_rate": 4.036256037898876e-06, + "loss": 1.1844, + "step": 10313 + }, + { + "epoch": 0.31, + "learning_rate": 4.036063598416856e-06, + "loss": 1.1656, + "step": 10314 + }, + { + "epoch": 0.31, + "learning_rate": 4.03587114431225e-06, + "loss": 1.006, + "step": 10315 + }, + { + "epoch": 0.31, + "learning_rate": 4.0356786755868905e-06, + "loss": 1.1232, + "step": 10316 + }, + { + "epoch": 0.31, + "learning_rate": 4.03548619224261e-06, + "loss": 1.1118, + "step": 10317 + }, + { + "epoch": 0.31, + "learning_rate": 4.03529369428124e-06, + "loss": 1.1945, + "step": 10318 + }, + { + "epoch": 0.31, + "learning_rate": 4.035101181704613e-06, + "loss": 1.1266, + "step": 10319 + }, + { + "epoch": 0.31, + "learning_rate": 4.0349086545145636e-06, + "loss": 1.0864, + "step": 10320 + }, + { + "epoch": 0.31, + "learning_rate": 4.034716112712922e-06, + "loss": 1.1467, + "step": 10321 + }, + { + "epoch": 0.31, + "learning_rate": 4.034523556301523e-06, + "loss": 1.1501, + "step": 10322 + }, + { + "epoch": 0.31, + "learning_rate": 4.034330985282198e-06, + "loss": 1.1185, + "step": 10323 + }, + { + "epoch": 0.31, + "learning_rate": 4.034138399656781e-06, + "loss": 1.2042, + "step": 10324 + }, + { + "epoch": 0.31, + "learning_rate": 4.033945799427105e-06, + "loss": 1.1445, + "step": 10325 + }, + { + "epoch": 0.31, + "learning_rate": 4.033753184595004e-06, + "loss": 1.1109, + "step": 10326 + }, + { + "epoch": 0.31, + "learning_rate": 4.033560555162311e-06, + "loss": 1.0106, + "step": 10327 + }, + { + "epoch": 0.31, + "learning_rate": 4.033367911130862e-06, + "loss": 1.1114, + "step": 10328 + }, + { + "epoch": 0.31, + "learning_rate": 4.033175252502487e-06, + "loss": 1.2789, + "step": 10329 + }, + { + "epoch": 0.31, + "learning_rate": 4.032982579279023e-06, + "loss": 1.0266, + "step": 10330 + }, + { + "epoch": 0.31, + "learning_rate": 4.032789891462302e-06, + "loss": 0.9451, + "step": 10331 + }, + { + "epoch": 0.31, + "learning_rate": 4.032597189054161e-06, + "loss": 1.246, + "step": 10332 + }, + { + "epoch": 0.31, + "learning_rate": 4.032404472056432e-06, + "loss": 1.0908, + "step": 10333 + }, + { + "epoch": 0.31, + "learning_rate": 4.03221174047095e-06, + "loss": 1.1401, + "step": 10334 + }, + { + "epoch": 0.31, + "learning_rate": 4.032018994299551e-06, + "loss": 1.0665, + "step": 10335 + }, + { + "epoch": 0.31, + "learning_rate": 4.0318262335440694e-06, + "loss": 1.051, + "step": 10336 + }, + { + "epoch": 0.31, + "learning_rate": 4.031633458206339e-06, + "loss": 1.139, + "step": 10337 + }, + { + "epoch": 0.31, + "learning_rate": 4.031440668288196e-06, + "loss": 1.1265, + "step": 10338 + }, + { + "epoch": 0.31, + "learning_rate": 4.031247863791475e-06, + "loss": 1.1139, + "step": 10339 + }, + { + "epoch": 0.31, + "learning_rate": 4.031055044718012e-06, + "loss": 1.1577, + "step": 10340 + }, + { + "epoch": 0.31, + "learning_rate": 4.030862211069643e-06, + "loss": 1.1646, + "step": 10341 + }, + { + "epoch": 0.31, + "learning_rate": 4.030669362848202e-06, + "loss": 1.158, + "step": 10342 + }, + { + "epoch": 0.31, + "learning_rate": 4.030476500055527e-06, + "loss": 1.2438, + "step": 10343 + }, + { + "epoch": 0.31, + "learning_rate": 4.030283622693452e-06, + "loss": 1.097, + "step": 10344 + }, + { + "epoch": 0.31, + "learning_rate": 4.0300907307638134e-06, + "loss": 1.0731, + "step": 10345 + }, + { + "epoch": 0.31, + "learning_rate": 4.029897824268449e-06, + "loss": 1.1813, + "step": 10346 + }, + { + "epoch": 0.31, + "learning_rate": 4.029704903209194e-06, + "loss": 1.1366, + "step": 10347 + }, + { + "epoch": 0.31, + "learning_rate": 4.029511967587885e-06, + "loss": 1.1295, + "step": 10348 + }, + { + "epoch": 0.31, + "learning_rate": 4.029319017406359e-06, + "loss": 1.1686, + "step": 10349 + }, + { + "epoch": 0.31, + "learning_rate": 4.029126052666452e-06, + "loss": 1.1707, + "step": 10350 + }, + { + "epoch": 0.31, + "learning_rate": 4.0289330733700015e-06, + "loss": 1.2001, + "step": 10351 + }, + { + "epoch": 0.31, + "learning_rate": 4.028740079518844e-06, + "loss": 1.1458, + "step": 10352 + }, + { + "epoch": 0.31, + "learning_rate": 4.028547071114818e-06, + "loss": 1.0965, + "step": 10353 + }, + { + "epoch": 0.31, + "learning_rate": 4.02835404815976e-06, + "loss": 1.177, + "step": 10354 + }, + { + "epoch": 0.31, + "learning_rate": 4.0281610106555066e-06, + "loss": 1.1562, + "step": 10355 + }, + { + "epoch": 0.31, + "learning_rate": 4.0279679586038975e-06, + "loss": 1.1841, + "step": 10356 + }, + { + "epoch": 0.31, + "learning_rate": 4.027774892006769e-06, + "loss": 1.1354, + "step": 10357 + }, + { + "epoch": 0.31, + "learning_rate": 4.027581810865959e-06, + "loss": 1.138, + "step": 10358 + }, + { + "epoch": 0.31, + "learning_rate": 4.027388715183306e-06, + "loss": 1.1128, + "step": 10359 + }, + { + "epoch": 0.31, + "learning_rate": 4.027195604960649e-06, + "loss": 1.0076, + "step": 10360 + }, + { + "epoch": 0.31, + "learning_rate": 4.027002480199824e-06, + "loss": 1.2086, + "step": 10361 + }, + { + "epoch": 0.31, + "learning_rate": 4.026809340902672e-06, + "loss": 1.2316, + "step": 10362 + }, + { + "epoch": 0.31, + "learning_rate": 4.02661618707103e-06, + "loss": 1.2454, + "step": 10363 + }, + { + "epoch": 0.31, + "learning_rate": 4.026423018706737e-06, + "loss": 1.061, + "step": 10364 + }, + { + "epoch": 0.31, + "learning_rate": 4.026229835811631e-06, + "loss": 1.0676, + "step": 10365 + }, + { + "epoch": 0.31, + "learning_rate": 4.0260366383875525e-06, + "loss": 1.0837, + "step": 10366 + }, + { + "epoch": 0.31, + "learning_rate": 4.025843426436341e-06, + "loss": 1.2296, + "step": 10367 + }, + { + "epoch": 0.31, + "learning_rate": 4.025650199959835e-06, + "loss": 1.1958, + "step": 10368 + }, + { + "epoch": 0.31, + "learning_rate": 4.025456958959874e-06, + "loss": 1.0295, + "step": 10369 + }, + { + "epoch": 0.31, + "learning_rate": 4.025263703438296e-06, + "loss": 1.0918, + "step": 10370 + }, + { + "epoch": 0.31, + "learning_rate": 4.025070433396943e-06, + "loss": 1.1219, + "step": 10371 + }, + { + "epoch": 0.31, + "learning_rate": 4.024877148837654e-06, + "loss": 1.0754, + "step": 10372 + }, + { + "epoch": 0.31, + "learning_rate": 4.024683849762269e-06, + "loss": 1.2504, + "step": 10373 + }, + { + "epoch": 0.31, + "learning_rate": 4.024490536172628e-06, + "loss": 1.1631, + "step": 10374 + }, + { + "epoch": 0.31, + "learning_rate": 4.024297208070571e-06, + "loss": 1.1603, + "step": 10375 + }, + { + "epoch": 0.31, + "learning_rate": 4.024103865457939e-06, + "loss": 1.1485, + "step": 10376 + }, + { + "epoch": 0.31, + "learning_rate": 4.023910508336573e-06, + "loss": 1.1053, + "step": 10377 + }, + { + "epoch": 0.31, + "learning_rate": 4.023717136708311e-06, + "loss": 1.1544, + "step": 10378 + }, + { + "epoch": 0.31, + "learning_rate": 4.023523750574997e-06, + "loss": 1.1713, + "step": 10379 + }, + { + "epoch": 0.31, + "learning_rate": 4.023330349938471e-06, + "loss": 1.1049, + "step": 10380 + }, + { + "epoch": 0.31, + "learning_rate": 4.023136934800573e-06, + "loss": 1.1478, + "step": 10381 + }, + { + "epoch": 0.31, + "learning_rate": 4.022943505163145e-06, + "loss": 1.1838, + "step": 10382 + }, + { + "epoch": 0.31, + "learning_rate": 4.022750061028029e-06, + "loss": 1.1557, + "step": 10383 + }, + { + "epoch": 0.31, + "learning_rate": 4.0225566023970655e-06, + "loss": 1.0837, + "step": 10384 + }, + { + "epoch": 0.31, + "learning_rate": 4.022363129272095e-06, + "loss": 1.1329, + "step": 10385 + }, + { + "epoch": 0.31, + "learning_rate": 4.022169641654963e-06, + "loss": 1.1564, + "step": 10386 + }, + { + "epoch": 0.31, + "learning_rate": 4.021976139547507e-06, + "loss": 1.0578, + "step": 10387 + }, + { + "epoch": 0.31, + "learning_rate": 4.021782622951573e-06, + "loss": 1.1483, + "step": 10388 + }, + { + "epoch": 0.31, + "learning_rate": 4.021589091869e-06, + "loss": 1.1927, + "step": 10389 + }, + { + "epoch": 0.31, + "learning_rate": 4.021395546301633e-06, + "loss": 1.1732, + "step": 10390 + }, + { + "epoch": 0.31, + "learning_rate": 4.021201986251312e-06, + "loss": 1.2123, + "step": 10391 + }, + { + "epoch": 0.31, + "learning_rate": 4.021008411719881e-06, + "loss": 1.187, + "step": 10392 + }, + { + "epoch": 0.31, + "learning_rate": 4.020814822709183e-06, + "loss": 1.2204, + "step": 10393 + }, + { + "epoch": 0.31, + "learning_rate": 4.02062121922106e-06, + "loss": 1.1274, + "step": 10394 + }, + { + "epoch": 0.31, + "learning_rate": 4.020427601257355e-06, + "loss": 1.177, + "step": 10395 + }, + { + "epoch": 0.31, + "learning_rate": 4.020233968819911e-06, + "loss": 1.078, + "step": 10396 + }, + { + "epoch": 0.31, + "learning_rate": 4.020040321910574e-06, + "loss": 1.2035, + "step": 10397 + }, + { + "epoch": 0.31, + "learning_rate": 4.019846660531182e-06, + "loss": 1.1465, + "step": 10398 + }, + { + "epoch": 0.31, + "learning_rate": 4.019652984683584e-06, + "loss": 1.1877, + "step": 10399 + }, + { + "epoch": 0.31, + "learning_rate": 4.019459294369621e-06, + "loss": 1.1901, + "step": 10400 + }, + { + "epoch": 0.31, + "learning_rate": 4.019265589591138e-06, + "loss": 1.1504, + "step": 10401 + }, + { + "epoch": 0.31, + "learning_rate": 4.019071870349977e-06, + "loss": 1.1025, + "step": 10402 + }, + { + "epoch": 0.31, + "learning_rate": 4.0188781366479845e-06, + "loss": 1.1677, + "step": 10403 + }, + { + "epoch": 0.31, + "learning_rate": 4.018684388487003e-06, + "loss": 1.1859, + "step": 10404 + }, + { + "epoch": 0.31, + "learning_rate": 4.018490625868877e-06, + "loss": 1.1692, + "step": 10405 + }, + { + "epoch": 0.31, + "learning_rate": 4.018296848795452e-06, + "loss": 1.0898, + "step": 10406 + }, + { + "epoch": 0.31, + "learning_rate": 4.018103057268573e-06, + "loss": 1.1477, + "step": 10407 + }, + { + "epoch": 0.31, + "learning_rate": 4.017909251290083e-06, + "loss": 1.1616, + "step": 10408 + }, + { + "epoch": 0.31, + "learning_rate": 4.017715430861829e-06, + "loss": 1.1425, + "step": 10409 + }, + { + "epoch": 0.31, + "learning_rate": 4.017521595985655e-06, + "loss": 1.1782, + "step": 10410 + }, + { + "epoch": 0.31, + "learning_rate": 4.017327746663406e-06, + "loss": 1.1207, + "step": 10411 + }, + { + "epoch": 0.31, + "learning_rate": 4.017133882896927e-06, + "loss": 1.248, + "step": 10412 + }, + { + "epoch": 0.31, + "learning_rate": 4.016940004688064e-06, + "loss": 1.1887, + "step": 10413 + }, + { + "epoch": 0.31, + "learning_rate": 4.016746112038664e-06, + "loss": 1.1758, + "step": 10414 + }, + { + "epoch": 0.31, + "learning_rate": 4.0165522049505705e-06, + "loss": 1.1321, + "step": 10415 + }, + { + "epoch": 0.31, + "learning_rate": 4.016358283425631e-06, + "loss": 1.1248, + "step": 10416 + }, + { + "epoch": 0.31, + "learning_rate": 4.01616434746569e-06, + "loss": 1.0544, + "step": 10417 + }, + { + "epoch": 0.31, + "learning_rate": 4.015970397072595e-06, + "loss": 1.1318, + "step": 10418 + }, + { + "epoch": 0.31, + "learning_rate": 4.015776432248193e-06, + "loss": 1.1371, + "step": 10419 + }, + { + "epoch": 0.31, + "learning_rate": 4.015582452994328e-06, + "loss": 1.1093, + "step": 10420 + }, + { + "epoch": 0.31, + "learning_rate": 4.0153884593128485e-06, + "loss": 1.1455, + "step": 10421 + }, + { + "epoch": 0.31, + "learning_rate": 4.0151944512056016e-06, + "loss": 1.1174, + "step": 10422 + }, + { + "epoch": 0.31, + "learning_rate": 4.015000428674433e-06, + "loss": 1.1624, + "step": 10423 + }, + { + "epoch": 0.31, + "learning_rate": 4.0148063917211885e-06, + "loss": 1.2302, + "step": 10424 + }, + { + "epoch": 0.31, + "learning_rate": 4.014612340347718e-06, + "loss": 1.2484, + "step": 10425 + }, + { + "epoch": 0.31, + "learning_rate": 4.014418274555867e-06, + "loss": 1.1152, + "step": 10426 + }, + { + "epoch": 0.31, + "learning_rate": 4.014224194347483e-06, + "loss": 1.0928, + "step": 10427 + }, + { + "epoch": 0.31, + "learning_rate": 4.014030099724415e-06, + "loss": 1.1824, + "step": 10428 + }, + { + "epoch": 0.31, + "learning_rate": 4.013835990688509e-06, + "loss": 1.049, + "step": 10429 + }, + { + "epoch": 0.31, + "learning_rate": 4.013641867241613e-06, + "loss": 1.1743, + "step": 10430 + }, + { + "epoch": 0.31, + "learning_rate": 4.013447729385576e-06, + "loss": 1.0594, + "step": 10431 + }, + { + "epoch": 0.31, + "learning_rate": 4.013253577122246e-06, + "loss": 1.1964, + "step": 10432 + }, + { + "epoch": 0.31, + "learning_rate": 4.01305941045347e-06, + "loss": 1.1301, + "step": 10433 + }, + { + "epoch": 0.31, + "learning_rate": 4.012865229381098e-06, + "loss": 1.1731, + "step": 10434 + }, + { + "epoch": 0.31, + "learning_rate": 4.012671033906977e-06, + "loss": 1.0541, + "step": 10435 + }, + { + "epoch": 0.31, + "learning_rate": 4.012476824032956e-06, + "loss": 1.0247, + "step": 10436 + }, + { + "epoch": 0.31, + "learning_rate": 4.0122825997608835e-06, + "loss": 1.2188, + "step": 10437 + }, + { + "epoch": 0.31, + "learning_rate": 4.01208836109261e-06, + "loss": 1.2303, + "step": 10438 + }, + { + "epoch": 0.31, + "learning_rate": 4.011894108029983e-06, + "loss": 1.1035, + "step": 10439 + }, + { + "epoch": 0.31, + "learning_rate": 4.011699840574853e-06, + "loss": 1.1331, + "step": 10440 + }, + { + "epoch": 0.31, + "learning_rate": 4.011505558729069e-06, + "loss": 1.1219, + "step": 10441 + }, + { + "epoch": 0.31, + "learning_rate": 4.011311262494479e-06, + "loss": 1.2502, + "step": 10442 + }, + { + "epoch": 0.31, + "learning_rate": 4.011116951872933e-06, + "loss": 1.1761, + "step": 10443 + }, + { + "epoch": 0.31, + "learning_rate": 4.010922626866283e-06, + "loss": 1.0863, + "step": 10444 + }, + { + "epoch": 0.31, + "learning_rate": 4.010728287476377e-06, + "loss": 1.1627, + "step": 10445 + }, + { + "epoch": 0.31, + "learning_rate": 4.0105339337050644e-06, + "loss": 1.0433, + "step": 10446 + }, + { + "epoch": 0.31, + "learning_rate": 4.0103395655541965e-06, + "loss": 1.0894, + "step": 10447 + }, + { + "epoch": 0.31, + "learning_rate": 4.010145183025624e-06, + "loss": 1.1462, + "step": 10448 + }, + { + "epoch": 0.31, + "learning_rate": 4.009950786121196e-06, + "loss": 1.2529, + "step": 10449 + }, + { + "epoch": 0.31, + "learning_rate": 4.0097563748427635e-06, + "loss": 1.0975, + "step": 10450 + }, + { + "epoch": 0.31, + "learning_rate": 4.009561949192179e-06, + "loss": 1.0382, + "step": 10451 + }, + { + "epoch": 0.31, + "learning_rate": 4.00936750917129e-06, + "loss": 1.1663, + "step": 10452 + }, + { + "epoch": 0.31, + "learning_rate": 4.00917305478195e-06, + "loss": 1.0093, + "step": 10453 + }, + { + "epoch": 0.31, + "learning_rate": 4.008978586026009e-06, + "loss": 1.248, + "step": 10454 + }, + { + "epoch": 0.31, + "learning_rate": 4.00878410290532e-06, + "loss": 1.1777, + "step": 10455 + }, + { + "epoch": 0.31, + "learning_rate": 4.008589605421731e-06, + "loss": 1.145, + "step": 10456 + }, + { + "epoch": 0.32, + "learning_rate": 4.008395093577097e-06, + "loss": 1.1592, + "step": 10457 + }, + { + "epoch": 0.32, + "learning_rate": 4.008200567373267e-06, + "loss": 1.2009, + "step": 10458 + }, + { + "epoch": 0.32, + "learning_rate": 4.008006026812095e-06, + "loss": 1.0914, + "step": 10459 + }, + { + "epoch": 0.32, + "learning_rate": 4.0078114718954305e-06, + "loss": 1.2372, + "step": 10460 + }, + { + "epoch": 0.32, + "learning_rate": 4.007616902625128e-06, + "loss": 1.3004, + "step": 10461 + }, + { + "epoch": 0.32, + "learning_rate": 4.007422319003039e-06, + "loss": 1.248, + "step": 10462 + }, + { + "epoch": 0.32, + "learning_rate": 4.007227721031015e-06, + "loss": 1.0767, + "step": 10463 + }, + { + "epoch": 0.32, + "learning_rate": 4.007033108710909e-06, + "loss": 1.1021, + "step": 10464 + }, + { + "epoch": 0.32, + "learning_rate": 4.006838482044574e-06, + "loss": 1.1082, + "step": 10465 + }, + { + "epoch": 0.32, + "learning_rate": 4.006643841033862e-06, + "loss": 1.1002, + "step": 10466 + }, + { + "epoch": 0.32, + "learning_rate": 4.006449185680627e-06, + "loss": 1.2366, + "step": 10467 + }, + { + "epoch": 0.32, + "learning_rate": 4.006254515986721e-06, + "loss": 1.137, + "step": 10468 + }, + { + "epoch": 0.32, + "learning_rate": 4.006059831953996e-06, + "loss": 1.1829, + "step": 10469 + }, + { + "epoch": 0.32, + "learning_rate": 4.0058651335843076e-06, + "loss": 1.1392, + "step": 10470 + }, + { + "epoch": 0.32, + "learning_rate": 4.005670420879509e-06, + "loss": 1.0908, + "step": 10471 + }, + { + "epoch": 0.32, + "learning_rate": 4.005475693841453e-06, + "loss": 1.1371, + "step": 10472 + }, + { + "epoch": 0.32, + "learning_rate": 4.005280952471993e-06, + "loss": 1.2518, + "step": 10473 + }, + { + "epoch": 0.32, + "learning_rate": 4.005086196772984e-06, + "loss": 1.0688, + "step": 10474 + }, + { + "epoch": 0.32, + "learning_rate": 4.004891426746279e-06, + "loss": 1.1096, + "step": 10475 + }, + { + "epoch": 0.32, + "learning_rate": 4.004696642393732e-06, + "loss": 1.1697, + "step": 10476 + }, + { + "epoch": 0.32, + "learning_rate": 4.004501843717198e-06, + "loss": 1.1443, + "step": 10477 + }, + { + "epoch": 0.32, + "learning_rate": 4.004307030718531e-06, + "loss": 1.1062, + "step": 10478 + }, + { + "epoch": 0.32, + "learning_rate": 4.004112203399585e-06, + "loss": 1.0556, + "step": 10479 + }, + { + "epoch": 0.32, + "learning_rate": 4.003917361762216e-06, + "loss": 1.2336, + "step": 10480 + }, + { + "epoch": 0.32, + "learning_rate": 4.003722505808277e-06, + "loss": 1.1093, + "step": 10481 + }, + { + "epoch": 0.32, + "learning_rate": 4.0035276355396255e-06, + "loss": 1.1203, + "step": 10482 + }, + { + "epoch": 0.32, + "learning_rate": 4.003332750958114e-06, + "loss": 1.0668, + "step": 10483 + }, + { + "epoch": 0.32, + "learning_rate": 4.003137852065599e-06, + "loss": 1.066, + "step": 10484 + }, + { + "epoch": 0.32, + "learning_rate": 4.0029429388639354e-06, + "loss": 1.1964, + "step": 10485 + }, + { + "epoch": 0.32, + "learning_rate": 4.002748011354979e-06, + "loss": 1.1721, + "step": 10486 + }, + { + "epoch": 0.32, + "learning_rate": 4.002553069540585e-06, + "loss": 1.2316, + "step": 10487 + }, + { + "epoch": 0.32, + "learning_rate": 4.002358113422609e-06, + "loss": 1.1347, + "step": 10488 + }, + { + "epoch": 0.32, + "learning_rate": 4.002163143002909e-06, + "loss": 1.0148, + "step": 10489 + }, + { + "epoch": 0.32, + "learning_rate": 4.001968158283338e-06, + "loss": 1.1055, + "step": 10490 + }, + { + "epoch": 0.32, + "learning_rate": 4.001773159265754e-06, + "loss": 1.1696, + "step": 10491 + }, + { + "epoch": 0.32, + "learning_rate": 4.001578145952013e-06, + "loss": 1.2183, + "step": 10492 + }, + { + "epoch": 0.32, + "learning_rate": 4.001383118343971e-06, + "loss": 1.0115, + "step": 10493 + }, + { + "epoch": 0.32, + "learning_rate": 4.0011880764434856e-06, + "loss": 1.0792, + "step": 10494 + }, + { + "epoch": 0.32, + "learning_rate": 4.000993020252411e-06, + "loss": 1.1988, + "step": 10495 + }, + { + "epoch": 0.32, + "learning_rate": 4.000797949772607e-06, + "loss": 1.1319, + "step": 10496 + }, + { + "epoch": 0.32, + "learning_rate": 4.000602865005928e-06, + "loss": 1.1716, + "step": 10497 + }, + { + "epoch": 0.32, + "learning_rate": 4.000407765954234e-06, + "loss": 1.2169, + "step": 10498 + }, + { + "epoch": 0.32, + "learning_rate": 4.00021265261938e-06, + "loss": 1.2073, + "step": 10499 + }, + { + "epoch": 0.32, + "learning_rate": 4.000017525003224e-06, + "loss": 1.1629, + "step": 10500 + }, + { + "epoch": 0.32, + "learning_rate": 3.999822383107624e-06, + "loss": 1.1044, + "step": 10501 + }, + { + "epoch": 0.32, + "learning_rate": 3.999627226934437e-06, + "loss": 1.095, + "step": 10502 + }, + { + "epoch": 0.32, + "learning_rate": 3.999432056485521e-06, + "loss": 1.0811, + "step": 10503 + }, + { + "epoch": 0.32, + "learning_rate": 3.999236871762734e-06, + "loss": 1.2385, + "step": 10504 + }, + { + "epoch": 0.32, + "learning_rate": 3.999041672767933e-06, + "loss": 1.201, + "step": 10505 + }, + { + "epoch": 0.32, + "learning_rate": 3.998846459502979e-06, + "loss": 1.0993, + "step": 10506 + }, + { + "epoch": 0.32, + "learning_rate": 3.9986512319697275e-06, + "loss": 1.1526, + "step": 10507 + }, + { + "epoch": 0.32, + "learning_rate": 3.998455990170039e-06, + "loss": 1.1164, + "step": 10508 + }, + { + "epoch": 0.32, + "learning_rate": 3.99826073410577e-06, + "loss": 1.1324, + "step": 10509 + }, + { + "epoch": 0.32, + "learning_rate": 3.998065463778781e-06, + "loss": 1.1595, + "step": 10510 + }, + { + "epoch": 0.32, + "learning_rate": 3.99787017919093e-06, + "loss": 1.2644, + "step": 10511 + }, + { + "epoch": 0.32, + "learning_rate": 3.997674880344078e-06, + "loss": 1.1653, + "step": 10512 + }, + { + "epoch": 0.32, + "learning_rate": 3.99747956724008e-06, + "loss": 1.0759, + "step": 10513 + }, + { + "epoch": 0.32, + "learning_rate": 3.997284239880799e-06, + "loss": 1.0551, + "step": 10514 + }, + { + "epoch": 0.32, + "learning_rate": 3.997088898268093e-06, + "loss": 1.1052, + "step": 10515 + }, + { + "epoch": 0.32, + "learning_rate": 3.9968935424038216e-06, + "loss": 1.1611, + "step": 10516 + }, + { + "epoch": 0.32, + "learning_rate": 3.9966981722898444e-06, + "loss": 1.0844, + "step": 10517 + }, + { + "epoch": 0.32, + "learning_rate": 3.996502787928022e-06, + "loss": 1.0613, + "step": 10518 + }, + { + "epoch": 0.32, + "learning_rate": 3.996307389320213e-06, + "loss": 1.1053, + "step": 10519 + }, + { + "epoch": 0.32, + "learning_rate": 3.996111976468279e-06, + "loss": 1.2008, + "step": 10520 + }, + { + "epoch": 0.32, + "learning_rate": 3.995916549374079e-06, + "loss": 1.1196, + "step": 10521 + }, + { + "epoch": 0.32, + "learning_rate": 3.995721108039474e-06, + "loss": 1.204, + "step": 10522 + }, + { + "epoch": 0.32, + "learning_rate": 3.995525652466324e-06, + "loss": 1.0634, + "step": 10523 + }, + { + "epoch": 0.32, + "learning_rate": 3.995330182656491e-06, + "loss": 1.1051, + "step": 10524 + }, + { + "epoch": 0.32, + "learning_rate": 3.995134698611834e-06, + "loss": 1.2432, + "step": 10525 + }, + { + "epoch": 0.32, + "learning_rate": 3.994939200334216e-06, + "loss": 1.1157, + "step": 10526 + }, + { + "epoch": 0.32, + "learning_rate": 3.994743687825496e-06, + "loss": 1.0895, + "step": 10527 + }, + { + "epoch": 0.32, + "learning_rate": 3.994548161087536e-06, + "loss": 1.1469, + "step": 10528 + }, + { + "epoch": 0.32, + "learning_rate": 3.994352620122197e-06, + "loss": 1.1069, + "step": 10529 + }, + { + "epoch": 0.32, + "learning_rate": 3.9941570649313414e-06, + "loss": 1.1566, + "step": 10530 + }, + { + "epoch": 0.32, + "learning_rate": 3.993961495516829e-06, + "loss": 1.1917, + "step": 10531 + }, + { + "epoch": 0.32, + "learning_rate": 3.993765911880524e-06, + "loss": 1.1522, + "step": 10532 + }, + { + "epoch": 0.32, + "learning_rate": 3.993570314024287e-06, + "loss": 1.0983, + "step": 10533 + }, + { + "epoch": 0.32, + "learning_rate": 3.993374701949979e-06, + "loss": 1.0328, + "step": 10534 + }, + { + "epoch": 0.32, + "learning_rate": 3.993179075659463e-06, + "loss": 1.084, + "step": 10535 + }, + { + "epoch": 0.32, + "learning_rate": 3.992983435154602e-06, + "loss": 1.1183, + "step": 10536 + }, + { + "epoch": 0.32, + "learning_rate": 3.992787780437258e-06, + "loss": 1.29, + "step": 10537 + }, + { + "epoch": 0.32, + "learning_rate": 3.9925921115092925e-06, + "loss": 1.0511, + "step": 10538 + }, + { + "epoch": 0.32, + "learning_rate": 3.992396428372569e-06, + "loss": 1.1677, + "step": 10539 + }, + { + "epoch": 0.32, + "learning_rate": 3.992200731028951e-06, + "loss": 1.0206, + "step": 10540 + }, + { + "epoch": 0.32, + "learning_rate": 3.9920050194803e-06, + "loss": 1.1812, + "step": 10541 + }, + { + "epoch": 0.32, + "learning_rate": 3.99180929372848e-06, + "loss": 1.1236, + "step": 10542 + }, + { + "epoch": 0.32, + "learning_rate": 3.991613553775354e-06, + "loss": 1.2388, + "step": 10543 + }, + { + "epoch": 0.32, + "learning_rate": 3.9914177996227855e-06, + "loss": 1.2332, + "step": 10544 + }, + { + "epoch": 0.32, + "learning_rate": 3.991222031272637e-06, + "loss": 1.1066, + "step": 10545 + }, + { + "epoch": 0.32, + "learning_rate": 3.9910262487267745e-06, + "loss": 1.1689, + "step": 10546 + }, + { + "epoch": 0.32, + "learning_rate": 3.990830451987059e-06, + "loss": 1.0651, + "step": 10547 + }, + { + "epoch": 0.32, + "learning_rate": 3.990634641055356e-06, + "loss": 1.1478, + "step": 10548 + }, + { + "epoch": 0.32, + "learning_rate": 3.990438815933529e-06, + "loss": 1.1174, + "step": 10549 + }, + { + "epoch": 0.32, + "learning_rate": 3.990242976623443e-06, + "loss": 1.1019, + "step": 10550 + }, + { + "epoch": 0.32, + "learning_rate": 3.990047123126961e-06, + "loss": 1.1611, + "step": 10551 + }, + { + "epoch": 0.32, + "learning_rate": 3.989851255445948e-06, + "loss": 1.1138, + "step": 10552 + }, + { + "epoch": 0.32, + "learning_rate": 3.989655373582268e-06, + "loss": 1.1112, + "step": 10553 + }, + { + "epoch": 0.32, + "learning_rate": 3.989459477537787e-06, + "loss": 1.2566, + "step": 10554 + }, + { + "epoch": 0.32, + "learning_rate": 3.989263567314369e-06, + "loss": 1.1953, + "step": 10555 + }, + { + "epoch": 0.32, + "learning_rate": 3.989067642913879e-06, + "loss": 1.0744, + "step": 10556 + }, + { + "epoch": 0.32, + "learning_rate": 3.988871704338183e-06, + "loss": 1.1869, + "step": 10557 + }, + { + "epoch": 0.32, + "learning_rate": 3.988675751589145e-06, + "loss": 1.0911, + "step": 10558 + }, + { + "epoch": 0.32, + "learning_rate": 3.98847978466863e-06, + "loss": 1.0786, + "step": 10559 + }, + { + "epoch": 0.32, + "learning_rate": 3.988283803578505e-06, + "loss": 1.0482, + "step": 10560 + }, + { + "epoch": 0.32, + "learning_rate": 3.988087808320635e-06, + "loss": 1.1973, + "step": 10561 + }, + { + "epoch": 0.32, + "learning_rate": 3.9878917988968856e-06, + "loss": 1.2367, + "step": 10562 + }, + { + "epoch": 0.32, + "learning_rate": 3.9876957753091225e-06, + "loss": 1.1248, + "step": 10563 + }, + { + "epoch": 0.32, + "learning_rate": 3.9874997375592126e-06, + "loss": 1.0973, + "step": 10564 + }, + { + "epoch": 0.32, + "learning_rate": 3.987303685649021e-06, + "loss": 1.0686, + "step": 10565 + }, + { + "epoch": 0.32, + "learning_rate": 3.987107619580416e-06, + "loss": 1.1152, + "step": 10566 + }, + { + "epoch": 0.32, + "learning_rate": 3.986911539355261e-06, + "loss": 1.203, + "step": 10567 + }, + { + "epoch": 0.32, + "learning_rate": 3.986715444975426e-06, + "loss": 1.1345, + "step": 10568 + }, + { + "epoch": 0.32, + "learning_rate": 3.986519336442774e-06, + "loss": 1.207, + "step": 10569 + }, + { + "epoch": 0.32, + "learning_rate": 3.986323213759176e-06, + "loss": 1.1248, + "step": 10570 + }, + { + "epoch": 0.32, + "learning_rate": 3.986127076926495e-06, + "loss": 1.0522, + "step": 10571 + }, + { + "epoch": 0.32, + "learning_rate": 3.985930925946601e-06, + "loss": 1.0813, + "step": 10572 + }, + { + "epoch": 0.32, + "learning_rate": 3.985734760821361e-06, + "loss": 1.274, + "step": 10573 + }, + { + "epoch": 0.32, + "learning_rate": 3.98553858155264e-06, + "loss": 1.1654, + "step": 10574 + }, + { + "epoch": 0.32, + "learning_rate": 3.985342388142307e-06, + "loss": 1.1221, + "step": 10575 + }, + { + "epoch": 0.32, + "learning_rate": 3.985146180592231e-06, + "loss": 1.2432, + "step": 10576 + }, + { + "epoch": 0.32, + "learning_rate": 3.984949958904279e-06, + "loss": 1.1581, + "step": 10577 + }, + { + "epoch": 0.32, + "learning_rate": 3.984753723080317e-06, + "loss": 1.1391, + "step": 10578 + }, + { + "epoch": 0.32, + "learning_rate": 3.984557473122216e-06, + "loss": 1.0671, + "step": 10579 + }, + { + "epoch": 0.32, + "learning_rate": 3.984361209031841e-06, + "loss": 1.1345, + "step": 10580 + }, + { + "epoch": 0.32, + "learning_rate": 3.984164930811064e-06, + "loss": 1.0135, + "step": 10581 + }, + { + "epoch": 0.32, + "learning_rate": 3.983968638461752e-06, + "loss": 1.1393, + "step": 10582 + }, + { + "epoch": 0.32, + "learning_rate": 3.983772331985772e-06, + "loss": 1.0478, + "step": 10583 + }, + { + "epoch": 0.32, + "learning_rate": 3.983576011384994e-06, + "loss": 1.034, + "step": 10584 + }, + { + "epoch": 0.32, + "learning_rate": 3.983379676661287e-06, + "loss": 1.0715, + "step": 10585 + }, + { + "epoch": 0.32, + "learning_rate": 3.983183327816521e-06, + "loss": 1.1971, + "step": 10586 + }, + { + "epoch": 0.32, + "learning_rate": 3.982986964852564e-06, + "loss": 1.1448, + "step": 10587 + }, + { + "epoch": 0.32, + "learning_rate": 3.982790587771284e-06, + "loss": 1.0583, + "step": 10588 + }, + { + "epoch": 0.32, + "learning_rate": 3.982594196574552e-06, + "loss": 1.1463, + "step": 10589 + }, + { + "epoch": 0.32, + "learning_rate": 3.982397791264237e-06, + "loss": 1.0603, + "step": 10590 + }, + { + "epoch": 0.32, + "learning_rate": 3.982201371842209e-06, + "loss": 1.1745, + "step": 10591 + }, + { + "epoch": 0.32, + "learning_rate": 3.9820049383103385e-06, + "loss": 1.2842, + "step": 10592 + }, + { + "epoch": 0.32, + "learning_rate": 3.981808490670494e-06, + "loss": 1.1752, + "step": 10593 + }, + { + "epoch": 0.32, + "learning_rate": 3.9816120289245485e-06, + "loss": 1.1559, + "step": 10594 + }, + { + "epoch": 0.32, + "learning_rate": 3.981415553074368e-06, + "loss": 1.1476, + "step": 10595 + }, + { + "epoch": 0.32, + "learning_rate": 3.981219063121825e-06, + "loss": 1.2113, + "step": 10596 + }, + { + "epoch": 0.32, + "learning_rate": 3.98102255906879e-06, + "loss": 1.0681, + "step": 10597 + }, + { + "epoch": 0.32, + "learning_rate": 3.980826040917135e-06, + "loss": 1.0986, + "step": 10598 + }, + { + "epoch": 0.32, + "learning_rate": 3.980629508668728e-06, + "loss": 1.0745, + "step": 10599 + }, + { + "epoch": 0.32, + "learning_rate": 3.980432962325441e-06, + "loss": 1.1158, + "step": 10600 + }, + { + "epoch": 0.32, + "learning_rate": 3.9802364018891456e-06, + "loss": 1.099, + "step": 10601 + }, + { + "epoch": 0.32, + "learning_rate": 3.9800398273617125e-06, + "loss": 1.147, + "step": 10602 + }, + { + "epoch": 0.32, + "learning_rate": 3.979843238745013e-06, + "loss": 1.1125, + "step": 10603 + }, + { + "epoch": 0.32, + "learning_rate": 3.979646636040918e-06, + "loss": 1.1595, + "step": 10604 + }, + { + "epoch": 0.32, + "learning_rate": 3.9794500192513e-06, + "loss": 1.0569, + "step": 10605 + }, + { + "epoch": 0.32, + "learning_rate": 3.97925338837803e-06, + "loss": 1.1454, + "step": 10606 + }, + { + "epoch": 0.32, + "learning_rate": 3.979056743422982e-06, + "loss": 1.1347, + "step": 10607 + }, + { + "epoch": 0.32, + "learning_rate": 3.978860084388025e-06, + "loss": 1.1367, + "step": 10608 + }, + { + "epoch": 0.32, + "learning_rate": 3.978663411275032e-06, + "loss": 1.0425, + "step": 10609 + }, + { + "epoch": 0.32, + "learning_rate": 3.978466724085876e-06, + "loss": 1.2788, + "step": 10610 + }, + { + "epoch": 0.32, + "learning_rate": 3.978270022822428e-06, + "loss": 1.1321, + "step": 10611 + }, + { + "epoch": 0.32, + "learning_rate": 3.978073307486561e-06, + "loss": 1.1912, + "step": 10612 + }, + { + "epoch": 0.32, + "learning_rate": 3.97787657808015e-06, + "loss": 1.149, + "step": 10613 + }, + { + "epoch": 0.32, + "learning_rate": 3.977679834605064e-06, + "loss": 1.1643, + "step": 10614 + }, + { + "epoch": 0.32, + "learning_rate": 3.977483077063178e-06, + "loss": 1.1033, + "step": 10615 + }, + { + "epoch": 0.32, + "learning_rate": 3.977286305456365e-06, + "loss": 1.1008, + "step": 10616 + }, + { + "epoch": 0.32, + "learning_rate": 3.977089519786497e-06, + "loss": 1.1292, + "step": 10617 + }, + { + "epoch": 0.32, + "learning_rate": 3.976892720055448e-06, + "loss": 1.1076, + "step": 10618 + }, + { + "epoch": 0.32, + "learning_rate": 3.976695906265093e-06, + "loss": 1.1439, + "step": 10619 + }, + { + "epoch": 0.32, + "learning_rate": 3.976499078417304e-06, + "loss": 1.2174, + "step": 10620 + }, + { + "epoch": 0.32, + "learning_rate": 3.976302236513955e-06, + "loss": 1.0042, + "step": 10621 + }, + { + "epoch": 0.32, + "learning_rate": 3.976105380556919e-06, + "loss": 1.1235, + "step": 10622 + }, + { + "epoch": 0.32, + "learning_rate": 3.975908510548071e-06, + "loss": 1.1158, + "step": 10623 + }, + { + "epoch": 0.32, + "learning_rate": 3.975711626489285e-06, + "loss": 1.2093, + "step": 10624 + }, + { + "epoch": 0.32, + "learning_rate": 3.975514728382433e-06, + "loss": 1.1267, + "step": 10625 + }, + { + "epoch": 0.32, + "learning_rate": 3.9753178162293944e-06, + "loss": 1.066, + "step": 10626 + }, + { + "epoch": 0.32, + "learning_rate": 3.9751208900320395e-06, + "loss": 1.0615, + "step": 10627 + }, + { + "epoch": 0.32, + "learning_rate": 3.9749239497922445e-06, + "loss": 1.0277, + "step": 10628 + }, + { + "epoch": 0.32, + "learning_rate": 3.974726995511883e-06, + "loss": 1.2012, + "step": 10629 + }, + { + "epoch": 0.32, + "learning_rate": 3.974530027192831e-06, + "loss": 1.309, + "step": 10630 + }, + { + "epoch": 0.32, + "learning_rate": 3.974333044836964e-06, + "loss": 1.0936, + "step": 10631 + }, + { + "epoch": 0.32, + "learning_rate": 3.974136048446155e-06, + "loss": 1.1257, + "step": 10632 + }, + { + "epoch": 0.32, + "learning_rate": 3.9739390380222835e-06, + "loss": 1.2662, + "step": 10633 + }, + { + "epoch": 0.32, + "learning_rate": 3.97374201356722e-06, + "loss": 1.123, + "step": 10634 + }, + { + "epoch": 0.32, + "learning_rate": 3.973544975082843e-06, + "loss": 1.1589, + "step": 10635 + }, + { + "epoch": 0.32, + "learning_rate": 3.973347922571027e-06, + "loss": 1.2373, + "step": 10636 + }, + { + "epoch": 0.32, + "learning_rate": 3.973150856033648e-06, + "loss": 1.1257, + "step": 10637 + }, + { + "epoch": 0.32, + "learning_rate": 3.972953775472584e-06, + "loss": 1.1584, + "step": 10638 + }, + { + "epoch": 0.32, + "learning_rate": 3.972756680889709e-06, + "loss": 1.1042, + "step": 10639 + }, + { + "epoch": 0.32, + "learning_rate": 3.972559572286899e-06, + "loss": 1.0947, + "step": 10640 + }, + { + "epoch": 0.32, + "learning_rate": 3.972362449666031e-06, + "loss": 1.0415, + "step": 10641 + }, + { + "epoch": 0.32, + "learning_rate": 3.972165313028982e-06, + "loss": 1.0959, + "step": 10642 + }, + { + "epoch": 0.32, + "learning_rate": 3.971968162377628e-06, + "loss": 1.0414, + "step": 10643 + }, + { + "epoch": 0.32, + "learning_rate": 3.971770997713847e-06, + "loss": 1.1181, + "step": 10644 + }, + { + "epoch": 0.32, + "learning_rate": 3.9715738190395135e-06, + "loss": 1.1152, + "step": 10645 + }, + { + "epoch": 0.32, + "learning_rate": 3.971376626356507e-06, + "loss": 1.1846, + "step": 10646 + }, + { + "epoch": 0.32, + "learning_rate": 3.971179419666703e-06, + "loss": 1.0968, + "step": 10647 + }, + { + "epoch": 0.32, + "learning_rate": 3.97098219897198e-06, + "loss": 1.2258, + "step": 10648 + }, + { + "epoch": 0.32, + "learning_rate": 3.9707849642742145e-06, + "loss": 1.0967, + "step": 10649 + }, + { + "epoch": 0.32, + "learning_rate": 3.970587715575285e-06, + "loss": 1.1, + "step": 10650 + }, + { + "epoch": 0.32, + "learning_rate": 3.970390452877068e-06, + "loss": 1.175, + "step": 10651 + }, + { + "epoch": 0.32, + "learning_rate": 3.9701931761814424e-06, + "loss": 1.0978, + "step": 10652 + }, + { + "epoch": 0.32, + "learning_rate": 3.969995885490285e-06, + "loss": 1.0355, + "step": 10653 + }, + { + "epoch": 0.32, + "learning_rate": 3.969798580805476e-06, + "loss": 1.0957, + "step": 10654 + }, + { + "epoch": 0.32, + "learning_rate": 3.969601262128892e-06, + "loss": 1.2228, + "step": 10655 + }, + { + "epoch": 0.32, + "learning_rate": 3.969403929462412e-06, + "loss": 1.1294, + "step": 10656 + }, + { + "epoch": 0.32, + "learning_rate": 3.969206582807914e-06, + "loss": 1.1888, + "step": 10657 + }, + { + "epoch": 0.32, + "learning_rate": 3.9690092221672765e-06, + "loss": 1.0966, + "step": 10658 + }, + { + "epoch": 0.32, + "learning_rate": 3.968811847542379e-06, + "loss": 1.1292, + "step": 10659 + }, + { + "epoch": 0.32, + "learning_rate": 3.968614458935101e-06, + "loss": 1.0689, + "step": 10660 + }, + { + "epoch": 0.32, + "learning_rate": 3.96841705634732e-06, + "loss": 1.0872, + "step": 10661 + }, + { + "epoch": 0.32, + "learning_rate": 3.968219639780915e-06, + "loss": 1.2256, + "step": 10662 + }, + { + "epoch": 0.32, + "learning_rate": 3.968022209237768e-06, + "loss": 1.3354, + "step": 10663 + }, + { + "epoch": 0.32, + "learning_rate": 3.967824764719754e-06, + "loss": 1.1561, + "step": 10664 + }, + { + "epoch": 0.32, + "learning_rate": 3.967627306228757e-06, + "loss": 1.0381, + "step": 10665 + }, + { + "epoch": 0.32, + "learning_rate": 3.967429833766655e-06, + "loss": 1.0506, + "step": 10666 + }, + { + "epoch": 0.32, + "learning_rate": 3.967232347335327e-06, + "loss": 1.177, + "step": 10667 + }, + { + "epoch": 0.32, + "learning_rate": 3.967034846936654e-06, + "loss": 1.1331, + "step": 10668 + }, + { + "epoch": 0.32, + "learning_rate": 3.9668373325725165e-06, + "loss": 1.359, + "step": 10669 + }, + { + "epoch": 0.32, + "learning_rate": 3.966639804244793e-06, + "loss": 0.9466, + "step": 10670 + }, + { + "epoch": 0.32, + "learning_rate": 3.966442261955365e-06, + "loss": 1.2065, + "step": 10671 + }, + { + "epoch": 0.32, + "learning_rate": 3.966244705706113e-06, + "loss": 1.0777, + "step": 10672 + }, + { + "epoch": 0.32, + "learning_rate": 3.966047135498917e-06, + "loss": 1.0813, + "step": 10673 + }, + { + "epoch": 0.32, + "learning_rate": 3.96584955133566e-06, + "loss": 1.1962, + "step": 10674 + }, + { + "epoch": 0.32, + "learning_rate": 3.96565195321822e-06, + "loss": 1.1246, + "step": 10675 + }, + { + "epoch": 0.32, + "learning_rate": 3.9654543411484805e-06, + "loss": 1.1189, + "step": 10676 + }, + { + "epoch": 0.32, + "learning_rate": 3.965256715128319e-06, + "loss": 1.1422, + "step": 10677 + }, + { + "epoch": 0.32, + "learning_rate": 3.965059075159622e-06, + "loss": 1.1667, + "step": 10678 + }, + { + "epoch": 0.32, + "learning_rate": 3.964861421244266e-06, + "loss": 1.2151, + "step": 10679 + }, + { + "epoch": 0.32, + "learning_rate": 3.964663753384137e-06, + "loss": 1.2306, + "step": 10680 + }, + { + "epoch": 0.32, + "learning_rate": 3.964466071581113e-06, + "loss": 1.1843, + "step": 10681 + }, + { + "epoch": 0.32, + "learning_rate": 3.964268375837077e-06, + "loss": 1.1824, + "step": 10682 + }, + { + "epoch": 0.32, + "learning_rate": 3.964070666153913e-06, + "loss": 1.178, + "step": 10683 + }, + { + "epoch": 0.32, + "learning_rate": 3.963872942533499e-06, + "loss": 1.1252, + "step": 10684 + }, + { + "epoch": 0.32, + "learning_rate": 3.963675204977722e-06, + "loss": 1.1852, + "step": 10685 + }, + { + "epoch": 0.32, + "learning_rate": 3.96347745348846e-06, + "loss": 1.1038, + "step": 10686 + }, + { + "epoch": 0.32, + "learning_rate": 3.963279688067598e-06, + "loss": 1.0657, + "step": 10687 + }, + { + "epoch": 0.32, + "learning_rate": 3.9630819087170196e-06, + "loss": 1.2084, + "step": 10688 + }, + { + "epoch": 0.32, + "learning_rate": 3.9628841154386045e-06, + "loss": 1.0806, + "step": 10689 + }, + { + "epoch": 0.32, + "learning_rate": 3.962686308234237e-06, + "loss": 1.1242, + "step": 10690 + }, + { + "epoch": 0.32, + "learning_rate": 3.962488487105801e-06, + "loss": 1.2128, + "step": 10691 + }, + { + "epoch": 0.32, + "learning_rate": 3.962290652055179e-06, + "loss": 1.2303, + "step": 10692 + }, + { + "epoch": 0.32, + "learning_rate": 3.962092803084254e-06, + "loss": 1.1125, + "step": 10693 + }, + { + "epoch": 0.32, + "learning_rate": 3.96189494019491e-06, + "loss": 1.0852, + "step": 10694 + }, + { + "epoch": 0.32, + "learning_rate": 3.96169706338903e-06, + "loss": 1.2003, + "step": 10695 + }, + { + "epoch": 0.32, + "learning_rate": 3.961499172668498e-06, + "loss": 1.0457, + "step": 10696 + }, + { + "epoch": 0.32, + "learning_rate": 3.961301268035197e-06, + "loss": 1.0368, + "step": 10697 + }, + { + "epoch": 0.32, + "learning_rate": 3.961103349491013e-06, + "loss": 1.0425, + "step": 10698 + }, + { + "epoch": 0.32, + "learning_rate": 3.960905417037828e-06, + "loss": 1.1694, + "step": 10699 + }, + { + "epoch": 0.32, + "learning_rate": 3.9607074706775275e-06, + "loss": 1.0845, + "step": 10700 + }, + { + "epoch": 0.32, + "learning_rate": 3.960509510411995e-06, + "loss": 1.1373, + "step": 10701 + }, + { + "epoch": 0.32, + "learning_rate": 3.960311536243116e-06, + "loss": 1.2296, + "step": 10702 + }, + { + "epoch": 0.32, + "learning_rate": 3.9601135481727736e-06, + "loss": 1.1427, + "step": 10703 + }, + { + "epoch": 0.32, + "learning_rate": 3.959915546202854e-06, + "loss": 1.2384, + "step": 10704 + }, + { + "epoch": 0.32, + "learning_rate": 3.959717530335241e-06, + "loss": 1.1359, + "step": 10705 + }, + { + "epoch": 0.32, + "learning_rate": 3.959519500571821e-06, + "loss": 1.199, + "step": 10706 + }, + { + "epoch": 0.32, + "learning_rate": 3.959321456914477e-06, + "loss": 1.103, + "step": 10707 + }, + { + "epoch": 0.32, + "learning_rate": 3.959123399365097e-06, + "loss": 1.0267, + "step": 10708 + }, + { + "epoch": 0.32, + "learning_rate": 3.9589253279255635e-06, + "loss": 1.2277, + "step": 10709 + }, + { + "epoch": 0.32, + "learning_rate": 3.958727242597765e-06, + "loss": 1.0142, + "step": 10710 + }, + { + "epoch": 0.32, + "learning_rate": 3.958529143383585e-06, + "loss": 1.0508, + "step": 10711 + }, + { + "epoch": 0.32, + "learning_rate": 3.95833103028491e-06, + "loss": 1.2543, + "step": 10712 + }, + { + "epoch": 0.32, + "learning_rate": 3.958132903303626e-06, + "loss": 1.1965, + "step": 10713 + }, + { + "epoch": 0.32, + "learning_rate": 3.957934762441619e-06, + "loss": 1.0305, + "step": 10714 + }, + { + "epoch": 0.32, + "learning_rate": 3.957736607700775e-06, + "loss": 1.0993, + "step": 10715 + }, + { + "epoch": 0.32, + "learning_rate": 3.9575384390829804e-06, + "loss": 1.1095, + "step": 10716 + }, + { + "epoch": 0.32, + "learning_rate": 3.9573402565901225e-06, + "loss": 1.1325, + "step": 10717 + }, + { + "epoch": 0.32, + "learning_rate": 3.957142060224087e-06, + "loss": 1.2188, + "step": 10718 + }, + { + "epoch": 0.32, + "learning_rate": 3.956943849986761e-06, + "loss": 1.1465, + "step": 10719 + }, + { + "epoch": 0.32, + "learning_rate": 3.95674562588003e-06, + "loss": 1.1373, + "step": 10720 + }, + { + "epoch": 0.32, + "learning_rate": 3.956547387905784e-06, + "loss": 1.1838, + "step": 10721 + }, + { + "epoch": 0.32, + "learning_rate": 3.956349136065908e-06, + "loss": 1.1133, + "step": 10722 + }, + { + "epoch": 0.32, + "learning_rate": 3.956150870362289e-06, + "loss": 1.2027, + "step": 10723 + }, + { + "epoch": 0.32, + "learning_rate": 3.955952590796816e-06, + "loss": 1.1536, + "step": 10724 + }, + { + "epoch": 0.32, + "learning_rate": 3.955754297371374e-06, + "loss": 1.1031, + "step": 10725 + }, + { + "epoch": 0.32, + "learning_rate": 3.955555990087853e-06, + "loss": 1.1827, + "step": 10726 + }, + { + "epoch": 0.32, + "learning_rate": 3.9553576689481395e-06, + "loss": 1.2281, + "step": 10727 + }, + { + "epoch": 0.32, + "learning_rate": 3.955159333954123e-06, + "loss": 1.033, + "step": 10728 + }, + { + "epoch": 0.32, + "learning_rate": 3.95496098510769e-06, + "loss": 1.0958, + "step": 10729 + }, + { + "epoch": 0.32, + "learning_rate": 3.95476262241073e-06, + "loss": 1.255, + "step": 10730 + }, + { + "epoch": 0.32, + "learning_rate": 3.954564245865129e-06, + "loss": 0.9637, + "step": 10731 + }, + { + "epoch": 0.32, + "learning_rate": 3.9543658554727775e-06, + "loss": 1.08, + "step": 10732 + }, + { + "epoch": 0.32, + "learning_rate": 3.954167451235563e-06, + "loss": 1.0528, + "step": 10733 + }, + { + "epoch": 0.32, + "learning_rate": 3.953969033155375e-06, + "loss": 1.0516, + "step": 10734 + }, + { + "epoch": 0.32, + "learning_rate": 3.953770601234103e-06, + "loss": 1.1326, + "step": 10735 + }, + { + "epoch": 0.32, + "learning_rate": 3.953572155473634e-06, + "loss": 1.2197, + "step": 10736 + }, + { + "epoch": 0.32, + "learning_rate": 3.9533736958758584e-06, + "loss": 1.0997, + "step": 10737 + }, + { + "epoch": 0.32, + "learning_rate": 3.953175222442665e-06, + "loss": 1.0736, + "step": 10738 + }, + { + "epoch": 0.32, + "learning_rate": 3.952976735175944e-06, + "loss": 1.1959, + "step": 10739 + }, + { + "epoch": 0.32, + "learning_rate": 3.952778234077583e-06, + "loss": 1.1084, + "step": 10740 + }, + { + "epoch": 0.32, + "learning_rate": 3.952579719149474e-06, + "loss": 1.1194, + "step": 10741 + }, + { + "epoch": 0.32, + "learning_rate": 3.9523811903935055e-06, + "loss": 1.0822, + "step": 10742 + }, + { + "epoch": 0.32, + "learning_rate": 3.952182647811568e-06, + "loss": 1.1827, + "step": 10743 + }, + { + "epoch": 0.32, + "learning_rate": 3.9519840914055505e-06, + "loss": 1.1684, + "step": 10744 + }, + { + "epoch": 0.32, + "learning_rate": 3.951785521177344e-06, + "loss": 1.1509, + "step": 10745 + }, + { + "epoch": 0.32, + "learning_rate": 3.951586937128838e-06, + "loss": 1.101, + "step": 10746 + }, + { + "epoch": 0.32, + "learning_rate": 3.951388339261923e-06, + "loss": 1.1688, + "step": 10747 + }, + { + "epoch": 0.32, + "learning_rate": 3.951189727578491e-06, + "loss": 1.1866, + "step": 10748 + }, + { + "epoch": 0.32, + "learning_rate": 3.950991102080433e-06, + "loss": 1.1227, + "step": 10749 + }, + { + "epoch": 0.32, + "learning_rate": 3.950792462769636e-06, + "loss": 1.1068, + "step": 10750 + }, + { + "epoch": 0.32, + "learning_rate": 3.950593809647994e-06, + "loss": 1.0745, + "step": 10751 + }, + { + "epoch": 0.32, + "learning_rate": 3.950395142717399e-06, + "loss": 1.1141, + "step": 10752 + }, + { + "epoch": 0.32, + "learning_rate": 3.95019646197974e-06, + "loss": 1.0352, + "step": 10753 + }, + { + "epoch": 0.32, + "learning_rate": 3.949997767436908e-06, + "loss": 1.1215, + "step": 10754 + }, + { + "epoch": 0.32, + "learning_rate": 3.949799059090797e-06, + "loss": 1.2484, + "step": 10755 + }, + { + "epoch": 0.32, + "learning_rate": 3.949600336943296e-06, + "loss": 1.2727, + "step": 10756 + }, + { + "epoch": 0.32, + "learning_rate": 3.9494016009963e-06, + "loss": 1.0946, + "step": 10757 + }, + { + "epoch": 0.32, + "learning_rate": 3.949202851251698e-06, + "loss": 1.1368, + "step": 10758 + }, + { + "epoch": 0.32, + "learning_rate": 3.949004087711381e-06, + "loss": 1.2011, + "step": 10759 + }, + { + "epoch": 0.32, + "learning_rate": 3.948805310377245e-06, + "loss": 1.1089, + "step": 10760 + }, + { + "epoch": 0.32, + "learning_rate": 3.948606519251179e-06, + "loss": 1.1993, + "step": 10761 + }, + { + "epoch": 0.32, + "learning_rate": 3.948407714335078e-06, + "loss": 1.1795, + "step": 10762 + }, + { + "epoch": 0.32, + "learning_rate": 3.9482088956308315e-06, + "loss": 1.1678, + "step": 10763 + }, + { + "epoch": 0.32, + "learning_rate": 3.9480100631403355e-06, + "loss": 1.2229, + "step": 10764 + }, + { + "epoch": 0.32, + "learning_rate": 3.947811216865479e-06, + "loss": 1.2427, + "step": 10765 + }, + { + "epoch": 0.32, + "learning_rate": 3.947612356808159e-06, + "loss": 1.1741, + "step": 10766 + }, + { + "epoch": 0.32, + "learning_rate": 3.947413482970265e-06, + "loss": 1.181, + "step": 10767 + }, + { + "epoch": 0.32, + "learning_rate": 3.947214595353694e-06, + "loss": 1.1777, + "step": 10768 + }, + { + "epoch": 0.32, + "learning_rate": 3.947015693960334e-06, + "loss": 1.182, + "step": 10769 + }, + { + "epoch": 0.32, + "learning_rate": 3.946816778792083e-06, + "loss": 1.0992, + "step": 10770 + }, + { + "epoch": 0.32, + "learning_rate": 3.946617849850833e-06, + "loss": 1.009, + "step": 10771 + }, + { + "epoch": 0.32, + "learning_rate": 3.946418907138478e-06, + "loss": 1.1152, + "step": 10772 + }, + { + "epoch": 0.32, + "learning_rate": 3.946219950656912e-06, + "loss": 1.1342, + "step": 10773 + }, + { + "epoch": 0.32, + "learning_rate": 3.946020980408029e-06, + "loss": 1.1835, + "step": 10774 + }, + { + "epoch": 0.32, + "learning_rate": 3.945821996393721e-06, + "loss": 1.1877, + "step": 10775 + }, + { + "epoch": 0.32, + "learning_rate": 3.945622998615884e-06, + "loss": 1.1142, + "step": 10776 + }, + { + "epoch": 0.32, + "learning_rate": 3.945423987076414e-06, + "loss": 0.9841, + "step": 10777 + }, + { + "epoch": 0.32, + "learning_rate": 3.945224961777202e-06, + "loss": 1.1286, + "step": 10778 + }, + { + "epoch": 0.32, + "learning_rate": 3.945025922720145e-06, + "loss": 1.0847, + "step": 10779 + }, + { + "epoch": 0.32, + "learning_rate": 3.944826869907138e-06, + "loss": 1.1782, + "step": 10780 + }, + { + "epoch": 0.32, + "learning_rate": 3.944627803340074e-06, + "loss": 1.2266, + "step": 10781 + }, + { + "epoch": 0.32, + "learning_rate": 3.94442872302085e-06, + "loss": 1.1779, + "step": 10782 + }, + { + "epoch": 0.32, + "learning_rate": 3.944229628951359e-06, + "loss": 1.0611, + "step": 10783 + }, + { + "epoch": 0.32, + "learning_rate": 3.944030521133499e-06, + "loss": 1.0989, + "step": 10784 + }, + { + "epoch": 0.32, + "learning_rate": 3.9438313995691624e-06, + "loss": 1.1125, + "step": 10785 + }, + { + "epoch": 0.32, + "learning_rate": 3.9436322642602474e-06, + "loss": 1.1202, + "step": 10786 + }, + { + "epoch": 0.32, + "learning_rate": 3.943433115208648e-06, + "loss": 1.1345, + "step": 10787 + }, + { + "epoch": 0.32, + "learning_rate": 3.943233952416261e-06, + "loss": 1.0759, + "step": 10788 + }, + { + "epoch": 0.33, + "learning_rate": 3.943034775884981e-06, + "loss": 1.1689, + "step": 10789 + }, + { + "epoch": 0.33, + "learning_rate": 3.942835585616706e-06, + "loss": 1.0616, + "step": 10790 + }, + { + "epoch": 0.33, + "learning_rate": 3.94263638161333e-06, + "loss": 1.1753, + "step": 10791 + }, + { + "epoch": 0.33, + "learning_rate": 3.942437163876751e-06, + "loss": 1.0539, + "step": 10792 + }, + { + "epoch": 0.33, + "learning_rate": 3.942237932408865e-06, + "loss": 1.2488, + "step": 10793 + }, + { + "epoch": 0.33, + "learning_rate": 3.942038687211568e-06, + "loss": 1.1293, + "step": 10794 + }, + { + "epoch": 0.33, + "learning_rate": 3.9418394282867575e-06, + "loss": 1.1611, + "step": 10795 + }, + { + "epoch": 0.33, + "learning_rate": 3.941640155636331e-06, + "loss": 1.1161, + "step": 10796 + }, + { + "epoch": 0.33, + "learning_rate": 3.941440869262183e-06, + "loss": 1.2592, + "step": 10797 + }, + { + "epoch": 0.33, + "learning_rate": 3.941241569166212e-06, + "loss": 1.0863, + "step": 10798 + }, + { + "epoch": 0.33, + "learning_rate": 3.941042255350317e-06, + "loss": 1.1343, + "step": 10799 + }, + { + "epoch": 0.33, + "learning_rate": 3.940842927816393e-06, + "loss": 1.327, + "step": 10800 + }, + { + "epoch": 0.33, + "learning_rate": 3.940643586566338e-06, + "loss": 1.1729, + "step": 10801 + }, + { + "epoch": 0.33, + "learning_rate": 3.9404442316020495e-06, + "loss": 1.1735, + "step": 10802 + }, + { + "epoch": 0.33, + "learning_rate": 3.940244862925427e-06, + "loss": 1.0878, + "step": 10803 + }, + { + "epoch": 0.33, + "learning_rate": 3.940045480538366e-06, + "loss": 1.1334, + "step": 10804 + }, + { + "epoch": 0.33, + "learning_rate": 3.939846084442765e-06, + "loss": 1.204, + "step": 10805 + }, + { + "epoch": 0.33, + "learning_rate": 3.939646674640525e-06, + "loss": 1.1739, + "step": 10806 + }, + { + "epoch": 0.33, + "learning_rate": 3.93944725113354e-06, + "loss": 1.1594, + "step": 10807 + }, + { + "epoch": 0.33, + "learning_rate": 3.9392478139237115e-06, + "loss": 1.0867, + "step": 10808 + }, + { + "epoch": 0.33, + "learning_rate": 3.939048363012936e-06, + "loss": 1.1806, + "step": 10809 + }, + { + "epoch": 0.33, + "learning_rate": 3.938848898403114e-06, + "loss": 1.2643, + "step": 10810 + }, + { + "epoch": 0.33, + "learning_rate": 3.9386494200961425e-06, + "loss": 1.1063, + "step": 10811 + }, + { + "epoch": 0.33, + "learning_rate": 3.9384499280939225e-06, + "loss": 1.2484, + "step": 10812 + }, + { + "epoch": 0.33, + "learning_rate": 3.938250422398351e-06, + "loss": 1.0979, + "step": 10813 + }, + { + "epoch": 0.33, + "learning_rate": 3.938050903011329e-06, + "loss": 1.1427, + "step": 10814 + }, + { + "epoch": 0.33, + "learning_rate": 3.937851369934755e-06, + "loss": 1.1973, + "step": 10815 + }, + { + "epoch": 0.33, + "learning_rate": 3.937651823170528e-06, + "loss": 1.0704, + "step": 10816 + }, + { + "epoch": 0.33, + "learning_rate": 3.937452262720548e-06, + "loss": 1.205, + "step": 10817 + }, + { + "epoch": 0.33, + "learning_rate": 3.937252688586714e-06, + "loss": 1.0963, + "step": 10818 + }, + { + "epoch": 0.33, + "learning_rate": 3.937053100770928e-06, + "loss": 1.1598, + "step": 10819 + }, + { + "epoch": 0.33, + "learning_rate": 3.936853499275089e-06, + "loss": 1.1053, + "step": 10820 + }, + { + "epoch": 0.33, + "learning_rate": 3.936653884101095e-06, + "loss": 1.0992, + "step": 10821 + }, + { + "epoch": 0.33, + "learning_rate": 3.936454255250849e-06, + "loss": 0.9929, + "step": 10822 + }, + { + "epoch": 0.33, + "learning_rate": 3.93625461272625e-06, + "loss": 1.2273, + "step": 10823 + }, + { + "epoch": 0.33, + "learning_rate": 3.936054956529199e-06, + "loss": 1.3809, + "step": 10824 + }, + { + "epoch": 0.33, + "learning_rate": 3.935855286661596e-06, + "loss": 1.2554, + "step": 10825 + }, + { + "epoch": 0.33, + "learning_rate": 3.9356556031253425e-06, + "loss": 1.0939, + "step": 10826 + }, + { + "epoch": 0.33, + "learning_rate": 3.9354559059223396e-06, + "loss": 1.1232, + "step": 10827 + }, + { + "epoch": 0.33, + "learning_rate": 3.935256195054487e-06, + "loss": 1.0787, + "step": 10828 + }, + { + "epoch": 0.33, + "learning_rate": 3.935056470523687e-06, + "loss": 1.2544, + "step": 10829 + }, + { + "epoch": 0.33, + "learning_rate": 3.934856732331841e-06, + "loss": 1.0881, + "step": 10830 + }, + { + "epoch": 0.33, + "learning_rate": 3.934656980480849e-06, + "loss": 1.0731, + "step": 10831 + }, + { + "epoch": 0.33, + "learning_rate": 3.934457214972614e-06, + "loss": 0.9772, + "step": 10832 + }, + { + "epoch": 0.33, + "learning_rate": 3.934257435809037e-06, + "loss": 1.1126, + "step": 10833 + }, + { + "epoch": 0.33, + "learning_rate": 3.934057642992021e-06, + "loss": 1.1791, + "step": 10834 + }, + { + "epoch": 0.33, + "learning_rate": 3.933857836523465e-06, + "loss": 1.2272, + "step": 10835 + }, + { + "epoch": 0.33, + "learning_rate": 3.933658016405274e-06, + "loss": 1.1739, + "step": 10836 + }, + { + "epoch": 0.33, + "learning_rate": 3.93345818263935e-06, + "loss": 1.2311, + "step": 10837 + }, + { + "epoch": 0.33, + "learning_rate": 3.933258335227593e-06, + "loss": 1.2527, + "step": 10838 + }, + { + "epoch": 0.33, + "learning_rate": 3.933058474171908e-06, + "loss": 1.0889, + "step": 10839 + }, + { + "epoch": 0.33, + "learning_rate": 3.9328585994741965e-06, + "loss": 1.1902, + "step": 10840 + }, + { + "epoch": 0.33, + "learning_rate": 3.93265871113636e-06, + "loss": 1.0881, + "step": 10841 + }, + { + "epoch": 0.33, + "learning_rate": 3.9324588091603035e-06, + "loss": 1.1936, + "step": 10842 + }, + { + "epoch": 0.33, + "learning_rate": 3.932258893547929e-06, + "loss": 1.1523, + "step": 10843 + }, + { + "epoch": 0.33, + "learning_rate": 3.932058964301139e-06, + "loss": 1.1624, + "step": 10844 + }, + { + "epoch": 0.33, + "learning_rate": 3.931859021421838e-06, + "loss": 1.051, + "step": 10845 + }, + { + "epoch": 0.33, + "learning_rate": 3.931659064911928e-06, + "loss": 1.1912, + "step": 10846 + }, + { + "epoch": 0.33, + "learning_rate": 3.931459094773314e-06, + "loss": 1.1533, + "step": 10847 + }, + { + "epoch": 0.33, + "learning_rate": 3.931259111007899e-06, + "loss": 1.171, + "step": 10848 + }, + { + "epoch": 0.33, + "learning_rate": 3.931059113617587e-06, + "loss": 1.1191, + "step": 10849 + }, + { + "epoch": 0.33, + "learning_rate": 3.93085910260428e-06, + "loss": 1.0244, + "step": 10850 + }, + { + "epoch": 0.33, + "learning_rate": 3.930659077969884e-06, + "loss": 1.1515, + "step": 10851 + }, + { + "epoch": 0.33, + "learning_rate": 3.930459039716304e-06, + "loss": 1.1637, + "step": 10852 + }, + { + "epoch": 0.33, + "learning_rate": 3.930258987845441e-06, + "loss": 1.0787, + "step": 10853 + }, + { + "epoch": 0.33, + "learning_rate": 3.930058922359202e-06, + "loss": 1.1429, + "step": 10854 + }, + { + "epoch": 0.33, + "learning_rate": 3.929858843259491e-06, + "loss": 1.1463, + "step": 10855 + }, + { + "epoch": 0.33, + "learning_rate": 3.929658750548212e-06, + "loss": 1.1321, + "step": 10856 + }, + { + "epoch": 0.33, + "learning_rate": 3.92945864422727e-06, + "loss": 1.1346, + "step": 10857 + }, + { + "epoch": 0.33, + "learning_rate": 3.92925852429857e-06, + "loss": 1.1371, + "step": 10858 + }, + { + "epoch": 0.33, + "learning_rate": 3.929058390764018e-06, + "loss": 1.1436, + "step": 10859 + }, + { + "epoch": 0.33, + "learning_rate": 3.928858243625519e-06, + "loss": 1.1039, + "step": 10860 + }, + { + "epoch": 0.33, + "learning_rate": 3.928658082884976e-06, + "loss": 1.1871, + "step": 10861 + }, + { + "epoch": 0.33, + "learning_rate": 3.928457908544297e-06, + "loss": 1.1142, + "step": 10862 + }, + { + "epoch": 0.33, + "learning_rate": 3.928257720605387e-06, + "loss": 1.2249, + "step": 10863 + }, + { + "epoch": 0.33, + "learning_rate": 3.928057519070151e-06, + "loss": 1.1114, + "step": 10864 + }, + { + "epoch": 0.33, + "learning_rate": 3.927857303940495e-06, + "loss": 1.1273, + "step": 10865 + }, + { + "epoch": 0.33, + "learning_rate": 3.927657075218326e-06, + "loss": 1.1594, + "step": 10866 + }, + { + "epoch": 0.33, + "learning_rate": 3.927456832905548e-06, + "loss": 1.1869, + "step": 10867 + }, + { + "epoch": 0.33, + "learning_rate": 3.927256577004069e-06, + "loss": 1.131, + "step": 10868 + }, + { + "epoch": 0.33, + "learning_rate": 3.927056307515795e-06, + "loss": 1.1384, + "step": 10869 + }, + { + "epoch": 0.33, + "learning_rate": 3.926856024442632e-06, + "loss": 1.093, + "step": 10870 + }, + { + "epoch": 0.33, + "learning_rate": 3.926655727786487e-06, + "loss": 1.0601, + "step": 10871 + }, + { + "epoch": 0.33, + "learning_rate": 3.926455417549266e-06, + "loss": 1.0828, + "step": 10872 + }, + { + "epoch": 0.33, + "learning_rate": 3.926255093732877e-06, + "loss": 1.2162, + "step": 10873 + }, + { + "epoch": 0.33, + "learning_rate": 3.926054756339226e-06, + "loss": 1.2398, + "step": 10874 + }, + { + "epoch": 0.33, + "learning_rate": 3.925854405370222e-06, + "loss": 1.176, + "step": 10875 + }, + { + "epoch": 0.33, + "learning_rate": 3.9256540408277686e-06, + "loss": 1.1324, + "step": 10876 + }, + { + "epoch": 0.33, + "learning_rate": 3.925453662713777e-06, + "loss": 1.1017, + "step": 10877 + }, + { + "epoch": 0.33, + "learning_rate": 3.925253271030152e-06, + "loss": 1.1099, + "step": 10878 + }, + { + "epoch": 0.33, + "learning_rate": 3.925052865778803e-06, + "loss": 1.1559, + "step": 10879 + }, + { + "epoch": 0.33, + "learning_rate": 3.9248524469616365e-06, + "loss": 1.1293, + "step": 10880 + }, + { + "epoch": 0.33, + "learning_rate": 3.924652014580561e-06, + "loss": 1.1293, + "step": 10881 + }, + { + "epoch": 0.33, + "learning_rate": 3.924451568637485e-06, + "loss": 1.0853, + "step": 10882 + }, + { + "epoch": 0.33, + "learning_rate": 3.924251109134315e-06, + "loss": 1.1863, + "step": 10883 + }, + { + "epoch": 0.33, + "learning_rate": 3.924050636072961e-06, + "loss": 1.0093, + "step": 10884 + }, + { + "epoch": 0.33, + "learning_rate": 3.923850149455332e-06, + "loss": 1.0979, + "step": 10885 + }, + { + "epoch": 0.33, + "learning_rate": 3.923649649283333e-06, + "loss": 1.1603, + "step": 10886 + }, + { + "epoch": 0.33, + "learning_rate": 3.923449135558877e-06, + "loss": 1.0992, + "step": 10887 + }, + { + "epoch": 0.33, + "learning_rate": 3.92324860828387e-06, + "loss": 1.1294, + "step": 10888 + }, + { + "epoch": 0.33, + "learning_rate": 3.923048067460221e-06, + "loss": 1.0845, + "step": 10889 + }, + { + "epoch": 0.33, + "learning_rate": 3.922847513089841e-06, + "loss": 1.0802, + "step": 10890 + }, + { + "epoch": 0.33, + "learning_rate": 3.922646945174638e-06, + "loss": 1.0969, + "step": 10891 + }, + { + "epoch": 0.33, + "learning_rate": 3.922446363716521e-06, + "loss": 1.1499, + "step": 10892 + }, + { + "epoch": 0.33, + "learning_rate": 3.922245768717399e-06, + "loss": 1.1916, + "step": 10893 + }, + { + "epoch": 0.33, + "learning_rate": 3.9220451601791824e-06, + "loss": 1.14, + "step": 10894 + }, + { + "epoch": 0.33, + "learning_rate": 3.921844538103781e-06, + "loss": 1.0661, + "step": 10895 + }, + { + "epoch": 0.33, + "learning_rate": 3.921643902493104e-06, + "loss": 1.1312, + "step": 10896 + }, + { + "epoch": 0.33, + "learning_rate": 3.921443253349063e-06, + "loss": 1.1139, + "step": 10897 + }, + { + "epoch": 0.33, + "learning_rate": 3.921242590673565e-06, + "loss": 1.1827, + "step": 10898 + }, + { + "epoch": 0.33, + "learning_rate": 3.921041914468523e-06, + "loss": 1.1291, + "step": 10899 + }, + { + "epoch": 0.33, + "learning_rate": 3.920841224735847e-06, + "loss": 1.1379, + "step": 10900 + }, + { + "epoch": 0.33, + "learning_rate": 3.9206405214774455e-06, + "loss": 1.187, + "step": 10901 + }, + { + "epoch": 0.33, + "learning_rate": 3.920439804695232e-06, + "loss": 1.1955, + "step": 10902 + }, + { + "epoch": 0.33, + "learning_rate": 3.920239074391114e-06, + "loss": 1.0866, + "step": 10903 + }, + { + "epoch": 0.33, + "learning_rate": 3.920038330567005e-06, + "loss": 1.1343, + "step": 10904 + }, + { + "epoch": 0.33, + "learning_rate": 3.919837573224815e-06, + "loss": 1.2744, + "step": 10905 + }, + { + "epoch": 0.33, + "learning_rate": 3.919636802366454e-06, + "loss": 1.0972, + "step": 10906 + }, + { + "epoch": 0.33, + "learning_rate": 3.919436017993836e-06, + "loss": 1.1439, + "step": 10907 + }, + { + "epoch": 0.33, + "learning_rate": 3.91923522010887e-06, + "loss": 1.1313, + "step": 10908 + }, + { + "epoch": 0.33, + "learning_rate": 3.919034408713468e-06, + "loss": 1.1545, + "step": 10909 + }, + { + "epoch": 0.33, + "learning_rate": 3.9188335838095424e-06, + "loss": 1.1577, + "step": 10910 + }, + { + "epoch": 0.33, + "learning_rate": 3.918632745399004e-06, + "loss": 1.1662, + "step": 10911 + }, + { + "epoch": 0.33, + "learning_rate": 3.918431893483765e-06, + "loss": 1.0966, + "step": 10912 + }, + { + "epoch": 0.33, + "learning_rate": 3.918231028065738e-06, + "loss": 1.1461, + "step": 10913 + }, + { + "epoch": 0.33, + "learning_rate": 3.9180301491468344e-06, + "loss": 1.1171, + "step": 10914 + }, + { + "epoch": 0.33, + "learning_rate": 3.917829256728967e-06, + "loss": 1.1773, + "step": 10915 + }, + { + "epoch": 0.33, + "learning_rate": 3.917628350814048e-06, + "loss": 1.1157, + "step": 10916 + }, + { + "epoch": 0.33, + "learning_rate": 3.917427431403989e-06, + "loss": 1.2025, + "step": 10917 + }, + { + "epoch": 0.33, + "learning_rate": 3.917226498500704e-06, + "loss": 1.1644, + "step": 10918 + }, + { + "epoch": 0.33, + "learning_rate": 3.917025552106105e-06, + "loss": 1.0464, + "step": 10919 + }, + { + "epoch": 0.33, + "learning_rate": 3.916824592222106e-06, + "loss": 1.1509, + "step": 10920 + }, + { + "epoch": 0.33, + "learning_rate": 3.916623618850618e-06, + "loss": 1.0831, + "step": 10921 + }, + { + "epoch": 0.33, + "learning_rate": 3.916422631993557e-06, + "loss": 1.1701, + "step": 10922 + }, + { + "epoch": 0.33, + "learning_rate": 3.916221631652834e-06, + "loss": 1.1749, + "step": 10923 + }, + { + "epoch": 0.33, + "learning_rate": 3.9160206178303625e-06, + "loss": 1.2527, + "step": 10924 + }, + { + "epoch": 0.33, + "learning_rate": 3.915819590528057e-06, + "loss": 1.0112, + "step": 10925 + }, + { + "epoch": 0.33, + "learning_rate": 3.915618549747831e-06, + "loss": 1.1169, + "step": 10926 + }, + { + "epoch": 0.33, + "learning_rate": 3.915417495491599e-06, + "loss": 1.1528, + "step": 10927 + }, + { + "epoch": 0.33, + "learning_rate": 3.915216427761273e-06, + "loss": 1.1495, + "step": 10928 + }, + { + "epoch": 0.33, + "learning_rate": 3.915015346558769e-06, + "loss": 1.1658, + "step": 10929 + }, + { + "epoch": 0.33, + "learning_rate": 3.914814251886e-06, + "loss": 1.1148, + "step": 10930 + }, + { + "epoch": 0.33, + "learning_rate": 3.914613143744881e-06, + "loss": 1.2205, + "step": 10931 + }, + { + "epoch": 0.33, + "learning_rate": 3.914412022137325e-06, + "loss": 1.1436, + "step": 10932 + }, + { + "epoch": 0.33, + "learning_rate": 3.9142108870652494e-06, + "loss": 1.0737, + "step": 10933 + }, + { + "epoch": 0.33, + "learning_rate": 3.914009738530567e-06, + "loss": 1.0587, + "step": 10934 + }, + { + "epoch": 0.33, + "learning_rate": 3.913808576535192e-06, + "loss": 1.1332, + "step": 10935 + }, + { + "epoch": 0.33, + "learning_rate": 3.91360740108104e-06, + "loss": 1.0494, + "step": 10936 + }, + { + "epoch": 0.33, + "learning_rate": 3.913406212170028e-06, + "loss": 1.1707, + "step": 10937 + }, + { + "epoch": 0.33, + "learning_rate": 3.913205009804069e-06, + "loss": 1.0434, + "step": 10938 + }, + { + "epoch": 0.33, + "learning_rate": 3.9130037939850775e-06, + "loss": 1.1667, + "step": 10939 + }, + { + "epoch": 0.33, + "learning_rate": 3.912802564714972e-06, + "loss": 1.1873, + "step": 10940 + }, + { + "epoch": 0.33, + "learning_rate": 3.912601321995666e-06, + "loss": 1.1406, + "step": 10941 + }, + { + "epoch": 0.33, + "learning_rate": 3.9124000658290756e-06, + "loss": 1.1585, + "step": 10942 + }, + { + "epoch": 0.33, + "learning_rate": 3.912198796217117e-06, + "loss": 1.1274, + "step": 10943 + }, + { + "epoch": 0.33, + "learning_rate": 3.911997513161706e-06, + "loss": 1.0986, + "step": 10944 + }, + { + "epoch": 0.33, + "learning_rate": 3.9117962166647585e-06, + "loss": 1.1681, + "step": 10945 + }, + { + "epoch": 0.33, + "learning_rate": 3.911594906728191e-06, + "loss": 1.1573, + "step": 10946 + }, + { + "epoch": 0.33, + "learning_rate": 3.91139358335392e-06, + "loss": 1.0529, + "step": 10947 + }, + { + "epoch": 0.33, + "learning_rate": 3.911192246543862e-06, + "loss": 1.1249, + "step": 10948 + }, + { + "epoch": 0.33, + "learning_rate": 3.910990896299933e-06, + "loss": 1.2061, + "step": 10949 + }, + { + "epoch": 0.33, + "learning_rate": 3.910789532624051e-06, + "loss": 1.1498, + "step": 10950 + }, + { + "epoch": 0.33, + "learning_rate": 3.9105881555181315e-06, + "loss": 1.1458, + "step": 10951 + }, + { + "epoch": 0.33, + "learning_rate": 3.910386764984092e-06, + "loss": 1.0166, + "step": 10952 + }, + { + "epoch": 0.33, + "learning_rate": 3.91018536102385e-06, + "loss": 1.0695, + "step": 10953 + }, + { + "epoch": 0.33, + "learning_rate": 3.909983943639322e-06, + "loss": 1.1553, + "step": 10954 + }, + { + "epoch": 0.33, + "learning_rate": 3.909782512832427e-06, + "loss": 1.1011, + "step": 10955 + }, + { + "epoch": 0.33, + "learning_rate": 3.909581068605081e-06, + "loss": 1.0421, + "step": 10956 + }, + { + "epoch": 0.33, + "learning_rate": 3.909379610959202e-06, + "loss": 1.1918, + "step": 10957 + }, + { + "epoch": 0.33, + "learning_rate": 3.909178139896707e-06, + "loss": 1.0906, + "step": 10958 + }, + { + "epoch": 0.33, + "learning_rate": 3.908976655419517e-06, + "loss": 1.1024, + "step": 10959 + }, + { + "epoch": 0.33, + "learning_rate": 3.908775157529546e-06, + "loss": 1.1265, + "step": 10960 + }, + { + "epoch": 0.33, + "learning_rate": 3.908573646228715e-06, + "loss": 1.231, + "step": 10961 + }, + { + "epoch": 0.33, + "learning_rate": 3.9083721215189395e-06, + "loss": 1.1401, + "step": 10962 + }, + { + "epoch": 0.33, + "learning_rate": 3.908170583402141e-06, + "loss": 1.1447, + "step": 10963 + }, + { + "epoch": 0.33, + "learning_rate": 3.907969031880238e-06, + "loss": 1.1812, + "step": 10964 + }, + { + "epoch": 0.33, + "learning_rate": 3.907767466955146e-06, + "loss": 1.1561, + "step": 10965 + }, + { + "epoch": 0.33, + "learning_rate": 3.907565888628786e-06, + "loss": 1.1117, + "step": 10966 + }, + { + "epoch": 0.33, + "learning_rate": 3.907364296903077e-06, + "loss": 1.1886, + "step": 10967 + }, + { + "epoch": 0.33, + "learning_rate": 3.907162691779938e-06, + "loss": 1.1505, + "step": 10968 + }, + { + "epoch": 0.33, + "learning_rate": 3.906961073261287e-06, + "loss": 1.1041, + "step": 10969 + }, + { + "epoch": 0.33, + "learning_rate": 3.906759441349045e-06, + "loss": 1.209, + "step": 10970 + }, + { + "epoch": 0.33, + "learning_rate": 3.9065577960451306e-06, + "loss": 1.1006, + "step": 10971 + }, + { + "epoch": 0.33, + "learning_rate": 3.906356137351464e-06, + "loss": 1.1075, + "step": 10972 + }, + { + "epoch": 0.33, + "learning_rate": 3.906154465269962e-06, + "loss": 1.2614, + "step": 10973 + }, + { + "epoch": 0.33, + "learning_rate": 3.90595277980255e-06, + "loss": 1.1558, + "step": 10974 + }, + { + "epoch": 0.33, + "learning_rate": 3.905751080951142e-06, + "loss": 1.0662, + "step": 10975 + }, + { + "epoch": 0.33, + "learning_rate": 3.905549368717662e-06, + "loss": 1.1572, + "step": 10976 + }, + { + "epoch": 0.33, + "learning_rate": 3.905347643104028e-06, + "loss": 1.1273, + "step": 10977 + }, + { + "epoch": 0.33, + "learning_rate": 3.905145904112162e-06, + "loss": 1.0271, + "step": 10978 + }, + { + "epoch": 0.33, + "learning_rate": 3.904944151743984e-06, + "loss": 1.0955, + "step": 10979 + }, + { + "epoch": 0.33, + "learning_rate": 3.904742386001413e-06, + "loss": 1.1658, + "step": 10980 + }, + { + "epoch": 0.33, + "learning_rate": 3.904540606886372e-06, + "loss": 1.1042, + "step": 10981 + }, + { + "epoch": 0.33, + "learning_rate": 3.904338814400781e-06, + "loss": 1.0578, + "step": 10982 + }, + { + "epoch": 0.33, + "learning_rate": 3.904137008546562e-06, + "loss": 1.2068, + "step": 10983 + }, + { + "epoch": 0.33, + "learning_rate": 3.903935189325633e-06, + "loss": 1.1382, + "step": 10984 + }, + { + "epoch": 0.33, + "learning_rate": 3.903733356739918e-06, + "loss": 1.074, + "step": 10985 + }, + { + "epoch": 0.33, + "learning_rate": 3.9035315107913364e-06, + "loss": 1.0867, + "step": 10986 + }, + { + "epoch": 0.33, + "learning_rate": 3.903329651481812e-06, + "loss": 1.1451, + "step": 10987 + }, + { + "epoch": 0.33, + "learning_rate": 3.903127778813265e-06, + "loss": 1.1182, + "step": 10988 + }, + { + "epoch": 0.33, + "learning_rate": 3.902925892787617e-06, + "loss": 1.1448, + "step": 10989 + }, + { + "epoch": 0.33, + "learning_rate": 3.902723993406791e-06, + "loss": 1.0616, + "step": 10990 + }, + { + "epoch": 0.33, + "learning_rate": 3.902522080672707e-06, + "loss": 1.1281, + "step": 10991 + }, + { + "epoch": 0.33, + "learning_rate": 3.9023201545872885e-06, + "loss": 1.1979, + "step": 10992 + }, + { + "epoch": 0.33, + "learning_rate": 3.9021182151524574e-06, + "loss": 1.1438, + "step": 10993 + }, + { + "epoch": 0.33, + "learning_rate": 3.901916262370137e-06, + "loss": 1.203, + "step": 10994 + }, + { + "epoch": 0.33, + "learning_rate": 3.9017142962422485e-06, + "loss": 1.1408, + "step": 10995 + }, + { + "epoch": 0.33, + "learning_rate": 3.9015123167707145e-06, + "loss": 1.2086, + "step": 10996 + }, + { + "epoch": 0.33, + "learning_rate": 3.901310323957459e-06, + "loss": 1.0483, + "step": 10997 + }, + { + "epoch": 0.33, + "learning_rate": 3.901108317804404e-06, + "loss": 1.0914, + "step": 10998 + }, + { + "epoch": 0.33, + "learning_rate": 3.9009062983134725e-06, + "loss": 1.1232, + "step": 10999 + }, + { + "epoch": 0.33, + "learning_rate": 3.900704265486588e-06, + "loss": 1.114, + "step": 11000 + }, + { + "epoch": 0.33, + "learning_rate": 3.900502219325672e-06, + "loss": 1.1238, + "step": 11001 + }, + { + "epoch": 0.33, + "learning_rate": 3.900300159832652e-06, + "loss": 1.1086, + "step": 11002 + }, + { + "epoch": 0.33, + "learning_rate": 3.900098087009447e-06, + "loss": 1.1058, + "step": 11003 + }, + { + "epoch": 0.33, + "learning_rate": 3.899896000857982e-06, + "loss": 1.0587, + "step": 11004 + }, + { + "epoch": 0.33, + "learning_rate": 3.899693901380183e-06, + "loss": 1.1679, + "step": 11005 + }, + { + "epoch": 0.33, + "learning_rate": 3.899491788577971e-06, + "loss": 1.2256, + "step": 11006 + }, + { + "epoch": 0.33, + "learning_rate": 3.899289662453272e-06, + "loss": 1.118, + "step": 11007 + }, + { + "epoch": 0.33, + "learning_rate": 3.899087523008008e-06, + "loss": 1.1601, + "step": 11008 + }, + { + "epoch": 0.33, + "learning_rate": 3.8988853702441066e-06, + "loss": 1.158, + "step": 11009 + }, + { + "epoch": 0.33, + "learning_rate": 3.898683204163489e-06, + "loss": 1.1161, + "step": 11010 + }, + { + "epoch": 0.33, + "learning_rate": 3.898481024768082e-06, + "loss": 1.0836, + "step": 11011 + }, + { + "epoch": 0.33, + "learning_rate": 3.898278832059807e-06, + "loss": 1.1649, + "step": 11012 + }, + { + "epoch": 0.33, + "learning_rate": 3.898076626040592e-06, + "loss": 1.0999, + "step": 11013 + }, + { + "epoch": 0.33, + "learning_rate": 3.897874406712362e-06, + "loss": 1.0475, + "step": 11014 + }, + { + "epoch": 0.33, + "learning_rate": 3.897672174077039e-06, + "loss": 1.1527, + "step": 11015 + }, + { + "epoch": 0.33, + "learning_rate": 3.897469928136552e-06, + "loss": 1.0234, + "step": 11016 + }, + { + "epoch": 0.33, + "learning_rate": 3.897267668892823e-06, + "loss": 1.1157, + "step": 11017 + }, + { + "epoch": 0.33, + "learning_rate": 3.897065396347779e-06, + "loss": 1.2357, + "step": 11018 + }, + { + "epoch": 0.33, + "learning_rate": 3.896863110503345e-06, + "loss": 1.2197, + "step": 11019 + }, + { + "epoch": 0.33, + "learning_rate": 3.896660811361448e-06, + "loss": 1.1298, + "step": 11020 + }, + { + "epoch": 0.33, + "learning_rate": 3.896458498924012e-06, + "loss": 1.0786, + "step": 11021 + }, + { + "epoch": 0.33, + "learning_rate": 3.896256173192963e-06, + "loss": 1.2079, + "step": 11022 + }, + { + "epoch": 0.33, + "learning_rate": 3.896053834170228e-06, + "loss": 1.1567, + "step": 11023 + }, + { + "epoch": 0.33, + "learning_rate": 3.895851481857734e-06, + "loss": 1.1675, + "step": 11024 + }, + { + "epoch": 0.33, + "learning_rate": 3.895649116257405e-06, + "loss": 1.1482, + "step": 11025 + }, + { + "epoch": 0.33, + "learning_rate": 3.8954467373711694e-06, + "loss": 1.1077, + "step": 11026 + }, + { + "epoch": 0.33, + "learning_rate": 3.8952443452009524e-06, + "loss": 1.1468, + "step": 11027 + }, + { + "epoch": 0.33, + "learning_rate": 3.895041939748682e-06, + "loss": 1.1542, + "step": 11028 + }, + { + "epoch": 0.33, + "learning_rate": 3.894839521016283e-06, + "loss": 1.0548, + "step": 11029 + }, + { + "epoch": 0.33, + "learning_rate": 3.894637089005684e-06, + "loss": 1.2205, + "step": 11030 + }, + { + "epoch": 0.33, + "learning_rate": 3.8944346437188116e-06, + "loss": 1.0577, + "step": 11031 + }, + { + "epoch": 0.33, + "learning_rate": 3.894232185157592e-06, + "loss": 1.0956, + "step": 11032 + }, + { + "epoch": 0.33, + "learning_rate": 3.894029713323955e-06, + "loss": 1.2001, + "step": 11033 + }, + { + "epoch": 0.33, + "learning_rate": 3.893827228219826e-06, + "loss": 1.1174, + "step": 11034 + }, + { + "epoch": 0.33, + "learning_rate": 3.8936247298471334e-06, + "loss": 1.1149, + "step": 11035 + }, + { + "epoch": 0.33, + "learning_rate": 3.893422218207804e-06, + "loss": 1.2144, + "step": 11036 + }, + { + "epoch": 0.33, + "learning_rate": 3.893219693303767e-06, + "loss": 1.1898, + "step": 11037 + }, + { + "epoch": 0.33, + "learning_rate": 3.893017155136949e-06, + "loss": 1.0565, + "step": 11038 + }, + { + "epoch": 0.33, + "learning_rate": 3.892814603709278e-06, + "loss": 1.1891, + "step": 11039 + }, + { + "epoch": 0.33, + "learning_rate": 3.8926120390226835e-06, + "loss": 1.0474, + "step": 11040 + }, + { + "epoch": 0.33, + "learning_rate": 3.892409461079093e-06, + "loss": 1.0369, + "step": 11041 + }, + { + "epoch": 0.33, + "learning_rate": 3.892206869880435e-06, + "loss": 1.1552, + "step": 11042 + }, + { + "epoch": 0.33, + "learning_rate": 3.8920042654286375e-06, + "loss": 1.2449, + "step": 11043 + }, + { + "epoch": 0.33, + "learning_rate": 3.8918016477256306e-06, + "loss": 1.1164, + "step": 11044 + }, + { + "epoch": 0.33, + "learning_rate": 3.891599016773342e-06, + "loss": 1.1534, + "step": 11045 + }, + { + "epoch": 0.33, + "learning_rate": 3.891396372573701e-06, + "loss": 1.0412, + "step": 11046 + }, + { + "epoch": 0.33, + "learning_rate": 3.891193715128637e-06, + "loss": 1.2437, + "step": 11047 + }, + { + "epoch": 0.33, + "learning_rate": 3.890991044440078e-06, + "loss": 1.2574, + "step": 11048 + }, + { + "epoch": 0.33, + "learning_rate": 3.890788360509955e-06, + "loss": 1.3854, + "step": 11049 + }, + { + "epoch": 0.33, + "learning_rate": 3.890585663340196e-06, + "loss": 1.2154, + "step": 11050 + }, + { + "epoch": 0.33, + "learning_rate": 3.8903829529327316e-06, + "loss": 1.1752, + "step": 11051 + }, + { + "epoch": 0.33, + "learning_rate": 3.890180229289492e-06, + "loss": 1.0632, + "step": 11052 + }, + { + "epoch": 0.33, + "learning_rate": 3.889977492412404e-06, + "loss": 1.0321, + "step": 11053 + }, + { + "epoch": 0.33, + "learning_rate": 3.889774742303402e-06, + "loss": 1.0673, + "step": 11054 + }, + { + "epoch": 0.33, + "learning_rate": 3.889571978964413e-06, + "loss": 1.2627, + "step": 11055 + }, + { + "epoch": 0.33, + "learning_rate": 3.889369202397367e-06, + "loss": 1.1893, + "step": 11056 + }, + { + "epoch": 0.33, + "learning_rate": 3.889166412604196e-06, + "loss": 1.1663, + "step": 11057 + }, + { + "epoch": 0.33, + "learning_rate": 3.88896360958683e-06, + "loss": 1.1512, + "step": 11058 + }, + { + "epoch": 0.33, + "learning_rate": 3.888760793347199e-06, + "loss": 1.1716, + "step": 11059 + }, + { + "epoch": 0.33, + "learning_rate": 3.888557963887235e-06, + "loss": 0.9955, + "step": 11060 + }, + { + "epoch": 0.33, + "learning_rate": 3.888355121208867e-06, + "loss": 1.0602, + "step": 11061 + }, + { + "epoch": 0.33, + "learning_rate": 3.8881522653140276e-06, + "loss": 1.1102, + "step": 11062 + }, + { + "epoch": 0.33, + "learning_rate": 3.887949396204646e-06, + "loss": 1.1292, + "step": 11063 + }, + { + "epoch": 0.33, + "learning_rate": 3.887746513882656e-06, + "loss": 1.0889, + "step": 11064 + }, + { + "epoch": 0.33, + "learning_rate": 3.887543618349987e-06, + "loss": 1.14, + "step": 11065 + }, + { + "epoch": 0.33, + "learning_rate": 3.887340709608571e-06, + "loss": 1.1176, + "step": 11066 + }, + { + "epoch": 0.33, + "learning_rate": 3.88713778766034e-06, + "loss": 1.1523, + "step": 11067 + }, + { + "epoch": 0.33, + "learning_rate": 3.886934852507225e-06, + "loss": 1.1685, + "step": 11068 + }, + { + "epoch": 0.33, + "learning_rate": 3.886731904151157e-06, + "loss": 1.0817, + "step": 11069 + }, + { + "epoch": 0.33, + "learning_rate": 3.886528942594071e-06, + "loss": 1.0958, + "step": 11070 + }, + { + "epoch": 0.33, + "learning_rate": 3.886325967837896e-06, + "loss": 1.0826, + "step": 11071 + }, + { + "epoch": 0.33, + "learning_rate": 3.886122979884566e-06, + "loss": 1.1169, + "step": 11072 + }, + { + "epoch": 0.33, + "learning_rate": 3.885919978736012e-06, + "loss": 1.1396, + "step": 11073 + }, + { + "epoch": 0.33, + "learning_rate": 3.885716964394169e-06, + "loss": 1.098, + "step": 11074 + }, + { + "epoch": 0.33, + "learning_rate": 3.885513936860967e-06, + "loss": 0.9636, + "step": 11075 + }, + { + "epoch": 0.33, + "learning_rate": 3.8853108961383396e-06, + "loss": 1.1277, + "step": 11076 + }, + { + "epoch": 0.33, + "learning_rate": 3.885107842228219e-06, + "loss": 1.171, + "step": 11077 + }, + { + "epoch": 0.33, + "learning_rate": 3.884904775132539e-06, + "loss": 1.2609, + "step": 11078 + }, + { + "epoch": 0.33, + "learning_rate": 3.884701694853233e-06, + "loss": 1.1462, + "step": 11079 + }, + { + "epoch": 0.33, + "learning_rate": 3.884498601392235e-06, + "loss": 1.1155, + "step": 11080 + }, + { + "epoch": 0.33, + "learning_rate": 3.884295494751475e-06, + "loss": 1.2321, + "step": 11081 + }, + { + "epoch": 0.33, + "learning_rate": 3.884092374932889e-06, + "loss": 1.119, + "step": 11082 + }, + { + "epoch": 0.33, + "learning_rate": 3.883889241938411e-06, + "loss": 1.1343, + "step": 11083 + }, + { + "epoch": 0.33, + "learning_rate": 3.883686095769974e-06, + "loss": 1.1751, + "step": 11084 + }, + { + "epoch": 0.33, + "learning_rate": 3.883482936429511e-06, + "loss": 1.1277, + "step": 11085 + }, + { + "epoch": 0.33, + "learning_rate": 3.883279763918957e-06, + "loss": 1.2135, + "step": 11086 + }, + { + "epoch": 0.33, + "learning_rate": 3.883076578240246e-06, + "loss": 1.1093, + "step": 11087 + }, + { + "epoch": 0.33, + "learning_rate": 3.882873379395312e-06, + "loss": 1.198, + "step": 11088 + }, + { + "epoch": 0.33, + "learning_rate": 3.88267016738609e-06, + "loss": 1.1031, + "step": 11089 + }, + { + "epoch": 0.33, + "learning_rate": 3.882466942214513e-06, + "loss": 1.1456, + "step": 11090 + }, + { + "epoch": 0.33, + "learning_rate": 3.882263703882517e-06, + "loss": 1.1932, + "step": 11091 + }, + { + "epoch": 0.33, + "learning_rate": 3.882060452392035e-06, + "loss": 1.1139, + "step": 11092 + }, + { + "epoch": 0.33, + "learning_rate": 3.881857187745006e-06, + "loss": 1.1937, + "step": 11093 + }, + { + "epoch": 0.33, + "learning_rate": 3.88165390994336e-06, + "loss": 1.1758, + "step": 11094 + }, + { + "epoch": 0.33, + "learning_rate": 3.881450618989034e-06, + "loss": 1.0729, + "step": 11095 + }, + { + "epoch": 0.33, + "learning_rate": 3.881247314883964e-06, + "loss": 1.2177, + "step": 11096 + }, + { + "epoch": 0.33, + "learning_rate": 3.881043997630085e-06, + "loss": 1.1976, + "step": 11097 + }, + { + "epoch": 0.33, + "learning_rate": 3.880840667229332e-06, + "loss": 1.3033, + "step": 11098 + }, + { + "epoch": 0.33, + "learning_rate": 3.880637323683641e-06, + "loss": 1.23, + "step": 11099 + }, + { + "epoch": 0.33, + "learning_rate": 3.880433966994948e-06, + "loss": 1.1208, + "step": 11100 + }, + { + "epoch": 0.33, + "learning_rate": 3.880230597165188e-06, + "loss": 1.1534, + "step": 11101 + }, + { + "epoch": 0.33, + "learning_rate": 3.880027214196297e-06, + "loss": 1.2073, + "step": 11102 + }, + { + "epoch": 0.33, + "learning_rate": 3.879823818090213e-06, + "loss": 1.2253, + "step": 11103 + }, + { + "epoch": 0.33, + "learning_rate": 3.879620408848869e-06, + "loss": 1.0704, + "step": 11104 + }, + { + "epoch": 0.33, + "learning_rate": 3.879416986474205e-06, + "loss": 1.2636, + "step": 11105 + }, + { + "epoch": 0.33, + "learning_rate": 3.879213550968154e-06, + "loss": 1.0964, + "step": 11106 + }, + { + "epoch": 0.33, + "learning_rate": 3.8790101023326545e-06, + "loss": 1.2516, + "step": 11107 + }, + { + "epoch": 0.33, + "learning_rate": 3.878806640569644e-06, + "loss": 1.1896, + "step": 11108 + }, + { + "epoch": 0.33, + "learning_rate": 3.878603165681058e-06, + "loss": 1.0827, + "step": 11109 + }, + { + "epoch": 0.33, + "learning_rate": 3.878399677668833e-06, + "loss": 1.1724, + "step": 11110 + }, + { + "epoch": 0.33, + "learning_rate": 3.878196176534907e-06, + "loss": 1.1924, + "step": 11111 + }, + { + "epoch": 0.33, + "learning_rate": 3.877992662281218e-06, + "loss": 1.1959, + "step": 11112 + }, + { + "epoch": 0.33, + "learning_rate": 3.8777891349097025e-06, + "loss": 1.1657, + "step": 11113 + }, + { + "epoch": 0.33, + "learning_rate": 3.877585594422298e-06, + "loss": 1.1338, + "step": 11114 + }, + { + "epoch": 0.33, + "learning_rate": 3.877382040820941e-06, + "loss": 1.006, + "step": 11115 + }, + { + "epoch": 0.33, + "learning_rate": 3.877178474107571e-06, + "loss": 1.1519, + "step": 11116 + }, + { + "epoch": 0.33, + "learning_rate": 3.8769748942841254e-06, + "loss": 1.1595, + "step": 11117 + }, + { + "epoch": 0.33, + "learning_rate": 3.876771301352542e-06, + "loss": 1.1678, + "step": 11118 + }, + { + "epoch": 0.33, + "learning_rate": 3.876567695314759e-06, + "loss": 1.1012, + "step": 11119 + }, + { + "epoch": 0.33, + "learning_rate": 3.876364076172714e-06, + "loss": 1.1129, + "step": 11120 + }, + { + "epoch": 0.34, + "learning_rate": 3.8761604439283464e-06, + "loss": 1.1086, + "step": 11121 + }, + { + "epoch": 0.34, + "learning_rate": 3.875956798583595e-06, + "loss": 1.1697, + "step": 11122 + }, + { + "epoch": 0.34, + "learning_rate": 3.875753140140395e-06, + "loss": 1.2659, + "step": 11123 + }, + { + "epoch": 0.34, + "learning_rate": 3.87554946860069e-06, + "loss": 1.1304, + "step": 11124 + }, + { + "epoch": 0.34, + "learning_rate": 3.875345783966415e-06, + "loss": 1.2584, + "step": 11125 + }, + { + "epoch": 0.34, + "learning_rate": 3.875142086239512e-06, + "loss": 1.1909, + "step": 11126 + }, + { + "epoch": 0.34, + "learning_rate": 3.874938375421917e-06, + "loss": 1.0729, + "step": 11127 + }, + { + "epoch": 0.34, + "learning_rate": 3.874734651515573e-06, + "loss": 1.1367, + "step": 11128 + }, + { + "epoch": 0.34, + "learning_rate": 3.874530914522415e-06, + "loss": 1.1304, + "step": 11129 + }, + { + "epoch": 0.34, + "learning_rate": 3.874327164444386e-06, + "loss": 1.2164, + "step": 11130 + }, + { + "epoch": 0.34, + "learning_rate": 3.8741234012834235e-06, + "loss": 1.0798, + "step": 11131 + }, + { + "epoch": 0.34, + "learning_rate": 3.873919625041469e-06, + "loss": 1.1581, + "step": 11132 + }, + { + "epoch": 0.34, + "learning_rate": 3.873715835720461e-06, + "loss": 1.0808, + "step": 11133 + }, + { + "epoch": 0.34, + "learning_rate": 3.8735120333223394e-06, + "loss": 1.1143, + "step": 11134 + }, + { + "epoch": 0.34, + "learning_rate": 3.873308217849045e-06, + "loss": 1.1831, + "step": 11135 + }, + { + "epoch": 0.34, + "learning_rate": 3.873104389302518e-06, + "loss": 1.1085, + "step": 11136 + }, + { + "epoch": 0.34, + "learning_rate": 3.8729005476846984e-06, + "loss": 1.149, + "step": 11137 + }, + { + "epoch": 0.34, + "learning_rate": 3.872696692997527e-06, + "loss": 1.173, + "step": 11138 + }, + { + "epoch": 0.34, + "learning_rate": 3.872492825242944e-06, + "loss": 1.1536, + "step": 11139 + }, + { + "epoch": 0.34, + "learning_rate": 3.8722889444228896e-06, + "loss": 1.0258, + "step": 11140 + }, + { + "epoch": 0.34, + "learning_rate": 3.872085050539306e-06, + "loss": 1.1061, + "step": 11141 + }, + { + "epoch": 0.34, + "learning_rate": 3.8718811435941335e-06, + "loss": 1.1635, + "step": 11142 + }, + { + "epoch": 0.34, + "learning_rate": 3.871677223589313e-06, + "loss": 1.0493, + "step": 11143 + }, + { + "epoch": 0.34, + "learning_rate": 3.871473290526786e-06, + "loss": 1.1886, + "step": 11144 + }, + { + "epoch": 0.34, + "learning_rate": 3.871269344408495e-06, + "loss": 1.2083, + "step": 11145 + }, + { + "epoch": 0.34, + "learning_rate": 3.871065385236379e-06, + "loss": 1.092, + "step": 11146 + }, + { + "epoch": 0.34, + "learning_rate": 3.870861413012381e-06, + "loss": 1.2134, + "step": 11147 + }, + { + "epoch": 0.34, + "learning_rate": 3.870657427738443e-06, + "loss": 1.1082, + "step": 11148 + }, + { + "epoch": 0.34, + "learning_rate": 3.8704534294165056e-06, + "loss": 1.2043, + "step": 11149 + }, + { + "epoch": 0.34, + "learning_rate": 3.870249418048513e-06, + "loss": 1.2813, + "step": 11150 + }, + { + "epoch": 0.34, + "learning_rate": 3.870045393636405e-06, + "loss": 1.1649, + "step": 11151 + }, + { + "epoch": 0.34, + "learning_rate": 3.869841356182124e-06, + "loss": 1.0992, + "step": 11152 + }, + { + "epoch": 0.34, + "learning_rate": 3.869637305687613e-06, + "loss": 1.1323, + "step": 11153 + }, + { + "epoch": 0.34, + "learning_rate": 3.869433242154816e-06, + "loss": 1.1558, + "step": 11154 + }, + { + "epoch": 0.34, + "learning_rate": 3.869229165585673e-06, + "loss": 1.2104, + "step": 11155 + }, + { + "epoch": 0.34, + "learning_rate": 3.869025075982129e-06, + "loss": 1.2797, + "step": 11156 + }, + { + "epoch": 0.34, + "learning_rate": 3.868820973346125e-06, + "loss": 1.0873, + "step": 11157 + }, + { + "epoch": 0.34, + "learning_rate": 3.8686168576796035e-06, + "loss": 1.1499, + "step": 11158 + }, + { + "epoch": 0.34, + "learning_rate": 3.8684127289845095e-06, + "loss": 0.9794, + "step": 11159 + }, + { + "epoch": 0.34, + "learning_rate": 3.868208587262785e-06, + "loss": 1.2089, + "step": 11160 + }, + { + "epoch": 0.34, + "learning_rate": 3.868004432516374e-06, + "loss": 1.2061, + "step": 11161 + }, + { + "epoch": 0.34, + "learning_rate": 3.86780026474722e-06, + "loss": 1.088, + "step": 11162 + }, + { + "epoch": 0.34, + "learning_rate": 3.867596083957265e-06, + "loss": 1.2578, + "step": 11163 + }, + { + "epoch": 0.34, + "learning_rate": 3.867391890148456e-06, + "loss": 1.1431, + "step": 11164 + }, + { + "epoch": 0.34, + "learning_rate": 3.8671876833227334e-06, + "loss": 1.1693, + "step": 11165 + }, + { + "epoch": 0.34, + "learning_rate": 3.8669834634820425e-06, + "loss": 1.1223, + "step": 11166 + }, + { + "epoch": 0.34, + "learning_rate": 3.8667792306283284e-06, + "loss": 1.1407, + "step": 11167 + }, + { + "epoch": 0.34, + "learning_rate": 3.866574984763533e-06, + "loss": 1.0974, + "step": 11168 + }, + { + "epoch": 0.34, + "learning_rate": 3.866370725889602e-06, + "loss": 1.2025, + "step": 11169 + }, + { + "epoch": 0.34, + "learning_rate": 3.8661664540084805e-06, + "loss": 1.1761, + "step": 11170 + }, + { + "epoch": 0.34, + "learning_rate": 3.865962169122112e-06, + "loss": 1.0724, + "step": 11171 + }, + { + "epoch": 0.34, + "learning_rate": 3.865757871232442e-06, + "loss": 1.1078, + "step": 11172 + }, + { + "epoch": 0.34, + "learning_rate": 3.865553560341414e-06, + "loss": 1.2868, + "step": 11173 + }, + { + "epoch": 0.34, + "learning_rate": 3.8653492364509734e-06, + "loss": 1.2222, + "step": 11174 + }, + { + "epoch": 0.34, + "learning_rate": 3.865144899563067e-06, + "loss": 1.1703, + "step": 11175 + }, + { + "epoch": 0.34, + "learning_rate": 3.864940549679638e-06, + "loss": 1.2722, + "step": 11176 + }, + { + "epoch": 0.34, + "learning_rate": 3.8647361868026325e-06, + "loss": 1.1239, + "step": 11177 + }, + { + "epoch": 0.34, + "learning_rate": 3.864531810933996e-06, + "loss": 1.0914, + "step": 11178 + }, + { + "epoch": 0.34, + "learning_rate": 3.864327422075673e-06, + "loss": 1.1594, + "step": 11179 + }, + { + "epoch": 0.34, + "learning_rate": 3.86412302022961e-06, + "loss": 1.2015, + "step": 11180 + }, + { + "epoch": 0.34, + "learning_rate": 3.863918605397754e-06, + "loss": 1.2806, + "step": 11181 + }, + { + "epoch": 0.34, + "learning_rate": 3.863714177582049e-06, + "loss": 1.143, + "step": 11182 + }, + { + "epoch": 0.34, + "learning_rate": 3.863509736784442e-06, + "loss": 1.1278, + "step": 11183 + }, + { + "epoch": 0.34, + "learning_rate": 3.8633052830068785e-06, + "loss": 1.1697, + "step": 11184 + }, + { + "epoch": 0.34, + "learning_rate": 3.863100816251306e-06, + "loss": 1.0391, + "step": 11185 + }, + { + "epoch": 0.34, + "learning_rate": 3.86289633651967e-06, + "loss": 1.1892, + "step": 11186 + }, + { + "epoch": 0.34, + "learning_rate": 3.862691843813917e-06, + "loss": 1.2084, + "step": 11187 + }, + { + "epoch": 0.34, + "learning_rate": 3.862487338135994e-06, + "loss": 1.1029, + "step": 11188 + }, + { + "epoch": 0.34, + "learning_rate": 3.8622828194878485e-06, + "loss": 1.1786, + "step": 11189 + }, + { + "epoch": 0.34, + "learning_rate": 3.862078287871426e-06, + "loss": 1.0912, + "step": 11190 + }, + { + "epoch": 0.34, + "learning_rate": 3.8618737432886735e-06, + "loss": 1.0148, + "step": 11191 + }, + { + "epoch": 0.34, + "learning_rate": 3.86166918574154e-06, + "loss": 1.1644, + "step": 11192 + }, + { + "epoch": 0.34, + "learning_rate": 3.861464615231971e-06, + "loss": 1.1587, + "step": 11193 + }, + { + "epoch": 0.34, + "learning_rate": 3.861260031761915e-06, + "loss": 1.0422, + "step": 11194 + }, + { + "epoch": 0.34, + "learning_rate": 3.861055435333319e-06, + "loss": 1.2136, + "step": 11195 + }, + { + "epoch": 0.34, + "learning_rate": 3.86085082594813e-06, + "loss": 1.0133, + "step": 11196 + }, + { + "epoch": 0.34, + "learning_rate": 3.860646203608298e-06, + "loss": 1.0901, + "step": 11197 + }, + { + "epoch": 0.34, + "learning_rate": 3.860441568315768e-06, + "loss": 1.2172, + "step": 11198 + }, + { + "epoch": 0.34, + "learning_rate": 3.860236920072491e-06, + "loss": 1.1205, + "step": 11199 + }, + { + "epoch": 0.34, + "learning_rate": 3.860032258880412e-06, + "loss": 1.0571, + "step": 11200 + }, + { + "epoch": 0.34, + "learning_rate": 3.8598275847414825e-06, + "loss": 1.0859, + "step": 11201 + }, + { + "epoch": 0.34, + "learning_rate": 3.859622897657648e-06, + "loss": 1.0491, + "step": 11202 + }, + { + "epoch": 0.34, + "learning_rate": 3.859418197630859e-06, + "loss": 1.1083, + "step": 11203 + }, + { + "epoch": 0.34, + "learning_rate": 3.859213484663064e-06, + "loss": 1.0957, + "step": 11204 + }, + { + "epoch": 0.34, + "learning_rate": 3.8590087587562094e-06, + "loss": 1.1376, + "step": 11205 + }, + { + "epoch": 0.34, + "learning_rate": 3.858804019912248e-06, + "loss": 1.2523, + "step": 11206 + }, + { + "epoch": 0.34, + "learning_rate": 3.858599268133125e-06, + "loss": 1.2045, + "step": 11207 + }, + { + "epoch": 0.34, + "learning_rate": 3.858394503420793e-06, + "loss": 1.1159, + "step": 11208 + }, + { + "epoch": 0.34, + "learning_rate": 3.858189725777198e-06, + "loss": 1.1911, + "step": 11209 + }, + { + "epoch": 0.34, + "learning_rate": 3.857984935204292e-06, + "loss": 1.2886, + "step": 11210 + }, + { + "epoch": 0.34, + "learning_rate": 3.857780131704023e-06, + "loss": 1.2128, + "step": 11211 + }, + { + "epoch": 0.34, + "learning_rate": 3.8575753152783414e-06, + "loss": 1.1066, + "step": 11212 + }, + { + "epoch": 0.34, + "learning_rate": 3.857370485929196e-06, + "loss": 1.0425, + "step": 11213 + }, + { + "epoch": 0.34, + "learning_rate": 3.857165643658538e-06, + "loss": 1.1585, + "step": 11214 + }, + { + "epoch": 0.34, + "learning_rate": 3.856960788468316e-06, + "loss": 1.0848, + "step": 11215 + }, + { + "epoch": 0.34, + "learning_rate": 3.8567559203604805e-06, + "loss": 1.1354, + "step": 11216 + }, + { + "epoch": 0.34, + "learning_rate": 3.856551039336984e-06, + "loss": 1.0338, + "step": 11217 + }, + { + "epoch": 0.34, + "learning_rate": 3.856346145399773e-06, + "loss": 1.2699, + "step": 11218 + }, + { + "epoch": 0.34, + "learning_rate": 3.856141238550801e-06, + "loss": 1.2303, + "step": 11219 + }, + { + "epoch": 0.34, + "learning_rate": 3.855936318792018e-06, + "loss": 1.1844, + "step": 11220 + }, + { + "epoch": 0.34, + "learning_rate": 3.855731386125373e-06, + "loss": 1.0306, + "step": 11221 + }, + { + "epoch": 0.34, + "learning_rate": 3.855526440552818e-06, + "loss": 1.1191, + "step": 11222 + }, + { + "epoch": 0.34, + "learning_rate": 3.855321482076305e-06, + "loss": 1.0703, + "step": 11223 + }, + { + "epoch": 0.34, + "learning_rate": 3.855116510697784e-06, + "loss": 1.2028, + "step": 11224 + }, + { + "epoch": 0.34, + "learning_rate": 3.8549115264192074e-06, + "loss": 1.0339, + "step": 11225 + }, + { + "epoch": 0.34, + "learning_rate": 3.854706529242524e-06, + "loss": 1.0765, + "step": 11226 + }, + { + "epoch": 0.34, + "learning_rate": 3.854501519169688e-06, + "loss": 1.1219, + "step": 11227 + }, + { + "epoch": 0.34, + "learning_rate": 3.854296496202649e-06, + "loss": 1.0971, + "step": 11228 + }, + { + "epoch": 0.34, + "learning_rate": 3.85409146034336e-06, + "loss": 1.257, + "step": 11229 + }, + { + "epoch": 0.34, + "learning_rate": 3.853886411593773e-06, + "loss": 1.1918, + "step": 11230 + }, + { + "epoch": 0.34, + "learning_rate": 3.853681349955839e-06, + "loss": 1.1364, + "step": 11231 + }, + { + "epoch": 0.34, + "learning_rate": 3.85347627543151e-06, + "loss": 1.1276, + "step": 11232 + }, + { + "epoch": 0.34, + "learning_rate": 3.8532711880227396e-06, + "loss": 1.1462, + "step": 11233 + }, + { + "epoch": 0.34, + "learning_rate": 3.853066087731478e-06, + "loss": 1.1231, + "step": 11234 + }, + { + "epoch": 0.34, + "learning_rate": 3.8528609745596805e-06, + "loss": 1.188, + "step": 11235 + }, + { + "epoch": 0.34, + "learning_rate": 3.8526558485092975e-06, + "loss": 1.1536, + "step": 11236 + }, + { + "epoch": 0.34, + "learning_rate": 3.8524507095822816e-06, + "loss": 1.1187, + "step": 11237 + }, + { + "epoch": 0.34, + "learning_rate": 3.852245557780588e-06, + "loss": 1.1746, + "step": 11238 + }, + { + "epoch": 0.34, + "learning_rate": 3.8520403931061654e-06, + "loss": 1.0988, + "step": 11239 + }, + { + "epoch": 0.34, + "learning_rate": 3.851835215560971e-06, + "loss": 1.0845, + "step": 11240 + }, + { + "epoch": 0.34, + "learning_rate": 3.8516300251469565e-06, + "loss": 1.221, + "step": 11241 + }, + { + "epoch": 0.34, + "learning_rate": 3.8514248218660745e-06, + "loss": 1.1458, + "step": 11242 + }, + { + "epoch": 0.34, + "learning_rate": 3.851219605720279e-06, + "loss": 1.1812, + "step": 11243 + }, + { + "epoch": 0.34, + "learning_rate": 3.851014376711524e-06, + "loss": 1.1844, + "step": 11244 + }, + { + "epoch": 0.34, + "learning_rate": 3.8508091348417635e-06, + "loss": 1.0787, + "step": 11245 + }, + { + "epoch": 0.34, + "learning_rate": 3.85060388011295e-06, + "loss": 1.0972, + "step": 11246 + }, + { + "epoch": 0.34, + "learning_rate": 3.8503986125270375e-06, + "loss": 1.177, + "step": 11247 + }, + { + "epoch": 0.34, + "learning_rate": 3.8501933320859806e-06, + "loss": 1.1689, + "step": 11248 + }, + { + "epoch": 0.34, + "learning_rate": 3.849988038791734e-06, + "loss": 1.2109, + "step": 11249 + }, + { + "epoch": 0.34, + "learning_rate": 3.849782732646252e-06, + "loss": 1.0764, + "step": 11250 + }, + { + "epoch": 0.34, + "learning_rate": 3.849577413651488e-06, + "loss": 1.1581, + "step": 11251 + }, + { + "epoch": 0.34, + "learning_rate": 3.8493720818093965e-06, + "loss": 1.166, + "step": 11252 + }, + { + "epoch": 0.34, + "learning_rate": 3.849166737121933e-06, + "loss": 1.0887, + "step": 11253 + }, + { + "epoch": 0.34, + "learning_rate": 3.848961379591052e-06, + "loss": 1.2064, + "step": 11254 + }, + { + "epoch": 0.34, + "learning_rate": 3.8487560092187084e-06, + "loss": 1.1936, + "step": 11255 + }, + { + "epoch": 0.34, + "learning_rate": 3.848550626006857e-06, + "loss": 1.1373, + "step": 11256 + }, + { + "epoch": 0.34, + "learning_rate": 3.848345229957453e-06, + "loss": 1.1746, + "step": 11257 + }, + { + "epoch": 0.34, + "learning_rate": 3.848139821072452e-06, + "loss": 1.0573, + "step": 11258 + }, + { + "epoch": 0.34, + "learning_rate": 3.847934399353809e-06, + "loss": 1.177, + "step": 11259 + }, + { + "epoch": 0.34, + "learning_rate": 3.84772896480348e-06, + "loss": 1.1175, + "step": 11260 + }, + { + "epoch": 0.34, + "learning_rate": 3.8475235174234196e-06, + "loss": 1.1229, + "step": 11261 + }, + { + "epoch": 0.34, + "learning_rate": 3.847318057215585e-06, + "loss": 1.1185, + "step": 11262 + }, + { + "epoch": 0.34, + "learning_rate": 3.8471125841819316e-06, + "loss": 1.2097, + "step": 11263 + }, + { + "epoch": 0.34, + "learning_rate": 3.846907098324415e-06, + "loss": 1.044, + "step": 11264 + }, + { + "epoch": 0.34, + "learning_rate": 3.8467015996449905e-06, + "loss": 1.1022, + "step": 11265 + }, + { + "epoch": 0.34, + "learning_rate": 3.846496088145617e-06, + "loss": 1.1812, + "step": 11266 + }, + { + "epoch": 0.34, + "learning_rate": 3.846290563828249e-06, + "loss": 1.1366, + "step": 11267 + }, + { + "epoch": 0.34, + "learning_rate": 3.846085026694842e-06, + "loss": 1.0645, + "step": 11268 + }, + { + "epoch": 0.34, + "learning_rate": 3.845879476747355e-06, + "loss": 1.0046, + "step": 11269 + }, + { + "epoch": 0.34, + "learning_rate": 3.845673913987743e-06, + "loss": 1.1031, + "step": 11270 + }, + { + "epoch": 0.34, + "learning_rate": 3.845468338417963e-06, + "loss": 1.175, + "step": 11271 + }, + { + "epoch": 0.34, + "learning_rate": 3.845262750039973e-06, + "loss": 1.0826, + "step": 11272 + }, + { + "epoch": 0.34, + "learning_rate": 3.84505714885573e-06, + "loss": 1.1688, + "step": 11273 + }, + { + "epoch": 0.34, + "learning_rate": 3.84485153486719e-06, + "loss": 1.1766, + "step": 11274 + }, + { + "epoch": 0.34, + "learning_rate": 3.844645908076311e-06, + "loss": 1.2717, + "step": 11275 + }, + { + "epoch": 0.34, + "learning_rate": 3.844440268485052e-06, + "loss": 1.0822, + "step": 11276 + }, + { + "epoch": 0.34, + "learning_rate": 3.844234616095367e-06, + "loss": 1.118, + "step": 11277 + }, + { + "epoch": 0.34, + "learning_rate": 3.844028950909218e-06, + "loss": 1.2838, + "step": 11278 + }, + { + "epoch": 0.34, + "learning_rate": 3.84382327292856e-06, + "loss": 1.098, + "step": 11279 + }, + { + "epoch": 0.34, + "learning_rate": 3.8436175821553505e-06, + "loss": 1.1099, + "step": 11280 + }, + { + "epoch": 0.34, + "learning_rate": 3.84341187859155e-06, + "loss": 1.311, + "step": 11281 + }, + { + "epoch": 0.34, + "learning_rate": 3.843206162239114e-06, + "loss": 1.1389, + "step": 11282 + }, + { + "epoch": 0.34, + "learning_rate": 3.843000433100004e-06, + "loss": 1.1245, + "step": 11283 + }, + { + "epoch": 0.34, + "learning_rate": 3.842794691176175e-06, + "loss": 1.0717, + "step": 11284 + }, + { + "epoch": 0.34, + "learning_rate": 3.842588936469588e-06, + "loss": 1.1424, + "step": 11285 + }, + { + "epoch": 0.34, + "learning_rate": 3.842383168982201e-06, + "loss": 1.1847, + "step": 11286 + }, + { + "epoch": 0.34, + "learning_rate": 3.842177388715973e-06, + "loss": 1.1407, + "step": 11287 + }, + { + "epoch": 0.34, + "learning_rate": 3.841971595672863e-06, + "loss": 1.128, + "step": 11288 + }, + { + "epoch": 0.34, + "learning_rate": 3.841765789854829e-06, + "loss": 1.1387, + "step": 11289 + }, + { + "epoch": 0.34, + "learning_rate": 3.841559971263831e-06, + "loss": 1.041, + "step": 11290 + }, + { + "epoch": 0.34, + "learning_rate": 3.841354139901828e-06, + "loss": 1.1782, + "step": 11291 + }, + { + "epoch": 0.34, + "learning_rate": 3.84114829577078e-06, + "loss": 1.2205, + "step": 11292 + }, + { + "epoch": 0.34, + "learning_rate": 3.8409424388726455e-06, + "loss": 1.1951, + "step": 11293 + }, + { + "epoch": 0.34, + "learning_rate": 3.840736569209386e-06, + "loss": 1.1729, + "step": 11294 + }, + { + "epoch": 0.34, + "learning_rate": 3.84053068678296e-06, + "loss": 1.1365, + "step": 11295 + }, + { + "epoch": 0.34, + "learning_rate": 3.840324791595325e-06, + "loss": 1.1543, + "step": 11296 + }, + { + "epoch": 0.34, + "learning_rate": 3.840118883648447e-06, + "loss": 1.1616, + "step": 11297 + }, + { + "epoch": 0.34, + "learning_rate": 3.8399129629442805e-06, + "loss": 1.1273, + "step": 11298 + }, + { + "epoch": 0.34, + "learning_rate": 3.839707029484788e-06, + "loss": 1.2728, + "step": 11299 + }, + { + "epoch": 0.34, + "learning_rate": 3.839501083271931e-06, + "loss": 1.2471, + "step": 11300 + }, + { + "epoch": 0.34, + "learning_rate": 3.839295124307668e-06, + "loss": 1.189, + "step": 11301 + }, + { + "epoch": 0.34, + "learning_rate": 3.83908915259396e-06, + "loss": 1.1764, + "step": 11302 + }, + { + "epoch": 0.34, + "learning_rate": 3.838883168132769e-06, + "loss": 1.1628, + "step": 11303 + }, + { + "epoch": 0.34, + "learning_rate": 3.838677170926055e-06, + "loss": 1.1233, + "step": 11304 + }, + { + "epoch": 0.34, + "learning_rate": 3.838471160975779e-06, + "loss": 1.2184, + "step": 11305 + }, + { + "epoch": 0.34, + "learning_rate": 3.838265138283902e-06, + "loss": 1.0927, + "step": 11306 + }, + { + "epoch": 0.34, + "learning_rate": 3.838059102852385e-06, + "loss": 1.0902, + "step": 11307 + }, + { + "epoch": 0.34, + "learning_rate": 3.837853054683191e-06, + "loss": 1.1725, + "step": 11308 + }, + { + "epoch": 0.34, + "learning_rate": 3.837646993778279e-06, + "loss": 1.0939, + "step": 11309 + }, + { + "epoch": 0.34, + "learning_rate": 3.837440920139612e-06, + "loss": 1.0936, + "step": 11310 + }, + { + "epoch": 0.34, + "learning_rate": 3.837234833769152e-06, + "loss": 1.1382, + "step": 11311 + }, + { + "epoch": 0.34, + "learning_rate": 3.83702873466886e-06, + "loss": 1.1135, + "step": 11312 + }, + { + "epoch": 0.34, + "learning_rate": 3.836822622840698e-06, + "loss": 1.2263, + "step": 11313 + }, + { + "epoch": 0.34, + "learning_rate": 3.83661649828663e-06, + "loss": 1.1556, + "step": 11314 + }, + { + "epoch": 0.34, + "learning_rate": 3.836410361008616e-06, + "loss": 1.1937, + "step": 11315 + }, + { + "epoch": 0.34, + "learning_rate": 3.836204211008619e-06, + "loss": 1.1068, + "step": 11316 + }, + { + "epoch": 0.34, + "learning_rate": 3.835998048288601e-06, + "loss": 1.1071, + "step": 11317 + }, + { + "epoch": 0.34, + "learning_rate": 3.835791872850525e-06, + "loss": 1.2205, + "step": 11318 + }, + { + "epoch": 0.34, + "learning_rate": 3.835585684696355e-06, + "loss": 1.2443, + "step": 11319 + }, + { + "epoch": 0.34, + "learning_rate": 3.835379483828051e-06, + "loss": 1.2811, + "step": 11320 + }, + { + "epoch": 0.34, + "learning_rate": 3.835173270247578e-06, + "loss": 1.1091, + "step": 11321 + }, + { + "epoch": 0.34, + "learning_rate": 3.834967043956898e-06, + "loss": 1.2241, + "step": 11322 + }, + { + "epoch": 0.34, + "learning_rate": 3.8347608049579754e-06, + "loss": 1.1158, + "step": 11323 + }, + { + "epoch": 0.34, + "learning_rate": 3.834554553252773e-06, + "loss": 1.1382, + "step": 11324 + }, + { + "epoch": 0.34, + "learning_rate": 3.834348288843252e-06, + "loss": 1.1914, + "step": 11325 + }, + { + "epoch": 0.34, + "learning_rate": 3.834142011731381e-06, + "loss": 1.1285, + "step": 11326 + }, + { + "epoch": 0.34, + "learning_rate": 3.833935721919119e-06, + "loss": 1.1374, + "step": 11327 + }, + { + "epoch": 0.34, + "learning_rate": 3.83372941940843e-06, + "loss": 1.1534, + "step": 11328 + }, + { + "epoch": 0.34, + "learning_rate": 3.833523104201282e-06, + "loss": 1.1641, + "step": 11329 + }, + { + "epoch": 0.34, + "learning_rate": 3.833316776299635e-06, + "loss": 1.2583, + "step": 11330 + }, + { + "epoch": 0.34, + "learning_rate": 3.833110435705454e-06, + "loss": 1.0554, + "step": 11331 + }, + { + "epoch": 0.34, + "learning_rate": 3.832904082420704e-06, + "loss": 1.1052, + "step": 11332 + }, + { + "epoch": 0.34, + "learning_rate": 3.83269771644735e-06, + "loss": 1.0876, + "step": 11333 + }, + { + "epoch": 0.34, + "learning_rate": 3.832491337787355e-06, + "loss": 1.1328, + "step": 11334 + }, + { + "epoch": 0.34, + "learning_rate": 3.832284946442684e-06, + "loss": 1.2404, + "step": 11335 + }, + { + "epoch": 0.34, + "learning_rate": 3.8320785424153015e-06, + "loss": 1.2032, + "step": 11336 + }, + { + "epoch": 0.34, + "learning_rate": 3.8318721257071735e-06, + "loss": 1.2103, + "step": 11337 + }, + { + "epoch": 0.34, + "learning_rate": 3.831665696320265e-06, + "loss": 1.0918, + "step": 11338 + }, + { + "epoch": 0.34, + "learning_rate": 3.831459254256539e-06, + "loss": 1.2373, + "step": 11339 + }, + { + "epoch": 0.34, + "learning_rate": 3.831252799517963e-06, + "loss": 1.1406, + "step": 11340 + }, + { + "epoch": 0.34, + "learning_rate": 3.8310463321065e-06, + "loss": 1.1432, + "step": 11341 + }, + { + "epoch": 0.34, + "learning_rate": 3.830839852024118e-06, + "loss": 1.0778, + "step": 11342 + }, + { + "epoch": 0.34, + "learning_rate": 3.8306333592727825e-06, + "loss": 1.1412, + "step": 11343 + }, + { + "epoch": 0.34, + "learning_rate": 3.830426853854458e-06, + "loss": 1.1668, + "step": 11344 + }, + { + "epoch": 0.34, + "learning_rate": 3.83022033577111e-06, + "loss": 1.0898, + "step": 11345 + }, + { + "epoch": 0.34, + "learning_rate": 3.830013805024705e-06, + "loss": 1.1873, + "step": 11346 + }, + { + "epoch": 0.34, + "learning_rate": 3.829807261617209e-06, + "loss": 1.0211, + "step": 11347 + }, + { + "epoch": 0.34, + "learning_rate": 3.829600705550589e-06, + "loss": 1.1703, + "step": 11348 + }, + { + "epoch": 0.34, + "learning_rate": 3.829394136826811e-06, + "loss": 1.2041, + "step": 11349 + }, + { + "epoch": 0.34, + "learning_rate": 3.829187555447839e-06, + "loss": 1.2205, + "step": 11350 + }, + { + "epoch": 0.34, + "learning_rate": 3.828980961415643e-06, + "loss": 1.2059, + "step": 11351 + }, + { + "epoch": 0.34, + "learning_rate": 3.8287743547321884e-06, + "loss": 1.1609, + "step": 11352 + }, + { + "epoch": 0.34, + "learning_rate": 3.8285677353994426e-06, + "loss": 1.1196, + "step": 11353 + }, + { + "epoch": 0.34, + "learning_rate": 3.82836110341937e-06, + "loss": 1.254, + "step": 11354 + }, + { + "epoch": 0.34, + "learning_rate": 3.8281544587939416e-06, + "loss": 1.1479, + "step": 11355 + }, + { + "epoch": 0.34, + "learning_rate": 3.82794780152512e-06, + "loss": 1.1364, + "step": 11356 + }, + { + "epoch": 0.34, + "learning_rate": 3.827741131614877e-06, + "loss": 1.166, + "step": 11357 + }, + { + "epoch": 0.34, + "learning_rate": 3.827534449065177e-06, + "loss": 1.1552, + "step": 11358 + }, + { + "epoch": 0.34, + "learning_rate": 3.8273277538779886e-06, + "loss": 0.9754, + "step": 11359 + }, + { + "epoch": 0.34, + "learning_rate": 3.827121046055279e-06, + "loss": 1.0603, + "step": 11360 + }, + { + "epoch": 0.34, + "learning_rate": 3.826914325599017e-06, + "loss": 1.1854, + "step": 11361 + }, + { + "epoch": 0.34, + "learning_rate": 3.826707592511169e-06, + "loss": 1.1102, + "step": 11362 + }, + { + "epoch": 0.34, + "learning_rate": 3.826500846793703e-06, + "loss": 1.204, + "step": 11363 + }, + { + "epoch": 0.34, + "learning_rate": 3.8262940884485885e-06, + "loss": 1.1079, + "step": 11364 + }, + { + "epoch": 0.34, + "learning_rate": 3.826087317477794e-06, + "loss": 1.2416, + "step": 11365 + }, + { + "epoch": 0.34, + "learning_rate": 3.825880533883285e-06, + "loss": 1.1062, + "step": 11366 + }, + { + "epoch": 0.34, + "learning_rate": 3.825673737667033e-06, + "loss": 1.0864, + "step": 11367 + }, + { + "epoch": 0.34, + "learning_rate": 3.825466928831006e-06, + "loss": 1.1881, + "step": 11368 + }, + { + "epoch": 0.34, + "learning_rate": 3.825260107377171e-06, + "loss": 1.1849, + "step": 11369 + }, + { + "epoch": 0.34, + "learning_rate": 3.825053273307499e-06, + "loss": 1.1663, + "step": 11370 + }, + { + "epoch": 0.34, + "learning_rate": 3.824846426623957e-06, + "loss": 1.1207, + "step": 11371 + }, + { + "epoch": 0.34, + "learning_rate": 3.824639567328516e-06, + "loss": 1.1537, + "step": 11372 + }, + { + "epoch": 0.34, + "learning_rate": 3.824432695423144e-06, + "loss": 1.048, + "step": 11373 + }, + { + "epoch": 0.34, + "learning_rate": 3.824225810909811e-06, + "loss": 1.1934, + "step": 11374 + }, + { + "epoch": 0.34, + "learning_rate": 3.824018913790485e-06, + "loss": 1.0866, + "step": 11375 + }, + { + "epoch": 0.34, + "learning_rate": 3.823812004067136e-06, + "loss": 1.0991, + "step": 11376 + }, + { + "epoch": 0.34, + "learning_rate": 3.823605081741737e-06, + "loss": 1.1998, + "step": 11377 + }, + { + "epoch": 0.34, + "learning_rate": 3.823398146816253e-06, + "loss": 1.1817, + "step": 11378 + }, + { + "epoch": 0.34, + "learning_rate": 3.8231911992926575e-06, + "loss": 1.2981, + "step": 11379 + }, + { + "epoch": 0.34, + "learning_rate": 3.822984239172917e-06, + "loss": 1.1509, + "step": 11380 + }, + { + "epoch": 0.34, + "learning_rate": 3.822777266459006e-06, + "loss": 1.2178, + "step": 11381 + }, + { + "epoch": 0.34, + "learning_rate": 3.822570281152891e-06, + "loss": 1.1038, + "step": 11382 + }, + { + "epoch": 0.34, + "learning_rate": 3.822363283256544e-06, + "loss": 1.0583, + "step": 11383 + }, + { + "epoch": 0.34, + "learning_rate": 3.822156272771935e-06, + "loss": 1.1221, + "step": 11384 + }, + { + "epoch": 0.34, + "learning_rate": 3.821949249701037e-06, + "loss": 1.1196, + "step": 11385 + }, + { + "epoch": 0.34, + "learning_rate": 3.821742214045817e-06, + "loss": 1.1716, + "step": 11386 + }, + { + "epoch": 0.34, + "learning_rate": 3.821535165808249e-06, + "loss": 1.1551, + "step": 11387 + }, + { + "epoch": 0.34, + "learning_rate": 3.821328104990301e-06, + "loss": 1.1602, + "step": 11388 + }, + { + "epoch": 0.34, + "learning_rate": 3.821121031593947e-06, + "loss": 1.0604, + "step": 11389 + }, + { + "epoch": 0.34, + "learning_rate": 3.8209139456211566e-06, + "loss": 1.0154, + "step": 11390 + }, + { + "epoch": 0.34, + "learning_rate": 3.8207068470739016e-06, + "loss": 1.1691, + "step": 11391 + }, + { + "epoch": 0.34, + "learning_rate": 3.820499735954154e-06, + "loss": 1.1146, + "step": 11392 + }, + { + "epoch": 0.34, + "learning_rate": 3.820292612263885e-06, + "loss": 1.246, + "step": 11393 + }, + { + "epoch": 0.34, + "learning_rate": 3.820085476005066e-06, + "loss": 1.0847, + "step": 11394 + }, + { + "epoch": 0.34, + "learning_rate": 3.819878327179668e-06, + "loss": 1.2289, + "step": 11395 + }, + { + "epoch": 0.34, + "learning_rate": 3.8196711657896655e-06, + "loss": 1.0496, + "step": 11396 + }, + { + "epoch": 0.34, + "learning_rate": 3.819463991837028e-06, + "loss": 1.226, + "step": 11397 + }, + { + "epoch": 0.34, + "learning_rate": 3.819256805323729e-06, + "loss": 1.2891, + "step": 11398 + }, + { + "epoch": 0.34, + "learning_rate": 3.8190496062517415e-06, + "loss": 1.1743, + "step": 11399 + }, + { + "epoch": 0.34, + "learning_rate": 3.818842394623036e-06, + "loss": 1.1342, + "step": 11400 + }, + { + "epoch": 0.34, + "learning_rate": 3.818635170439586e-06, + "loss": 1.2535, + "step": 11401 + }, + { + "epoch": 0.34, + "learning_rate": 3.8184279337033645e-06, + "loss": 1.0726, + "step": 11402 + }, + { + "epoch": 0.34, + "learning_rate": 3.818220684416345e-06, + "loss": 1.0346, + "step": 11403 + }, + { + "epoch": 0.34, + "learning_rate": 3.818013422580499e-06, + "loss": 1.1307, + "step": 11404 + }, + { + "epoch": 0.34, + "learning_rate": 3.817806148197799e-06, + "loss": 1.2748, + "step": 11405 + }, + { + "epoch": 0.34, + "learning_rate": 3.81759886127022e-06, + "loss": 1.1802, + "step": 11406 + }, + { + "epoch": 0.34, + "learning_rate": 3.817391561799734e-06, + "loss": 1.0868, + "step": 11407 + }, + { + "epoch": 0.34, + "learning_rate": 3.8171842497883145e-06, + "loss": 1.2188, + "step": 11408 + }, + { + "epoch": 0.34, + "learning_rate": 3.816976925237936e-06, + "loss": 1.062, + "step": 11409 + }, + { + "epoch": 0.34, + "learning_rate": 3.816769588150572e-06, + "loss": 1.2269, + "step": 11410 + }, + { + "epoch": 0.34, + "learning_rate": 3.816562238528195e-06, + "loss": 1.1703, + "step": 11411 + }, + { + "epoch": 0.34, + "learning_rate": 3.816354876372779e-06, + "loss": 1.1719, + "step": 11412 + }, + { + "epoch": 0.34, + "learning_rate": 3.8161475016863e-06, + "loss": 1.1825, + "step": 11413 + }, + { + "epoch": 0.34, + "learning_rate": 3.815940114470729e-06, + "loss": 1.0801, + "step": 11414 + }, + { + "epoch": 0.34, + "learning_rate": 3.815732714728042e-06, + "loss": 1.0789, + "step": 11415 + }, + { + "epoch": 0.34, + "learning_rate": 3.815525302460215e-06, + "loss": 1.0328, + "step": 11416 + }, + { + "epoch": 0.34, + "learning_rate": 3.815317877669219e-06, + "loss": 1.2045, + "step": 11417 + }, + { + "epoch": 0.34, + "learning_rate": 3.815110440357032e-06, + "loss": 1.103, + "step": 11418 + }, + { + "epoch": 0.34, + "learning_rate": 3.814902990525625e-06, + "loss": 1.0906, + "step": 11419 + }, + { + "epoch": 0.34, + "learning_rate": 3.814695528176976e-06, + "loss": 1.1469, + "step": 11420 + }, + { + "epoch": 0.34, + "learning_rate": 3.8144880533130585e-06, + "loss": 1.1471, + "step": 11421 + }, + { + "epoch": 0.34, + "learning_rate": 3.814280565935847e-06, + "loss": 1.0906, + "step": 11422 + }, + { + "epoch": 0.34, + "learning_rate": 3.8140730660473186e-06, + "loss": 1.0963, + "step": 11423 + }, + { + "epoch": 0.34, + "learning_rate": 3.813865553649447e-06, + "loss": 1.2418, + "step": 11424 + }, + { + "epoch": 0.34, + "learning_rate": 3.813658028744208e-06, + "loss": 1.071, + "step": 11425 + }, + { + "epoch": 0.34, + "learning_rate": 3.8134504913335777e-06, + "loss": 1.2438, + "step": 11426 + }, + { + "epoch": 0.34, + "learning_rate": 3.8132429414195316e-06, + "loss": 1.1471, + "step": 11427 + }, + { + "epoch": 0.34, + "learning_rate": 3.813035379004044e-06, + "loss": 1.18, + "step": 11428 + }, + { + "epoch": 0.34, + "learning_rate": 3.8128278040890933e-06, + "loss": 1.0852, + "step": 11429 + }, + { + "epoch": 0.34, + "learning_rate": 3.8126202166766533e-06, + "loss": 1.246, + "step": 11430 + }, + { + "epoch": 0.34, + "learning_rate": 3.8124126167687016e-06, + "loss": 1.0334, + "step": 11431 + }, + { + "epoch": 0.34, + "learning_rate": 3.8122050043672134e-06, + "loss": 1.1552, + "step": 11432 + }, + { + "epoch": 0.34, + "learning_rate": 3.811997379474166e-06, + "loss": 1.134, + "step": 11433 + }, + { + "epoch": 0.34, + "learning_rate": 3.8117897420915345e-06, + "loss": 1.0954, + "step": 11434 + }, + { + "epoch": 0.34, + "learning_rate": 3.811582092221297e-06, + "loss": 1.1829, + "step": 11435 + }, + { + "epoch": 0.34, + "learning_rate": 3.81137442986543e-06, + "loss": 1.1862, + "step": 11436 + }, + { + "epoch": 0.34, + "learning_rate": 3.811166755025909e-06, + "loss": 1.2681, + "step": 11437 + }, + { + "epoch": 0.34, + "learning_rate": 3.8109590677047126e-06, + "loss": 0.9451, + "step": 11438 + }, + { + "epoch": 0.34, + "learning_rate": 3.810751367903818e-06, + "loss": 1.202, + "step": 11439 + }, + { + "epoch": 0.34, + "learning_rate": 3.8105436556252008e-06, + "loss": 1.1324, + "step": 11440 + }, + { + "epoch": 0.34, + "learning_rate": 3.8103359308708395e-06, + "loss": 1.0298, + "step": 11441 + }, + { + "epoch": 0.34, + "learning_rate": 3.810128193642711e-06, + "loss": 1.05, + "step": 11442 + }, + { + "epoch": 0.34, + "learning_rate": 3.809920443942793e-06, + "loss": 1.1652, + "step": 11443 + }, + { + "epoch": 0.34, + "learning_rate": 3.8097126817730635e-06, + "loss": 1.113, + "step": 11444 + }, + { + "epoch": 0.34, + "learning_rate": 3.8095049071354997e-06, + "loss": 1.3311, + "step": 11445 + }, + { + "epoch": 0.34, + "learning_rate": 3.8092971200320803e-06, + "loss": 1.1134, + "step": 11446 + }, + { + "epoch": 0.34, + "learning_rate": 3.809089320464783e-06, + "loss": 1.0762, + "step": 11447 + }, + { + "epoch": 0.34, + "learning_rate": 3.8088815084355845e-06, + "loss": 1.1506, + "step": 11448 + }, + { + "epoch": 0.34, + "learning_rate": 3.8086736839464657e-06, + "loss": 1.0865, + "step": 11449 + }, + { + "epoch": 0.34, + "learning_rate": 3.808465846999404e-06, + "loss": 1.1038, + "step": 11450 + }, + { + "epoch": 0.34, + "learning_rate": 3.8082579975963764e-06, + "loss": 1.1733, + "step": 11451 + }, + { + "epoch": 0.34, + "learning_rate": 3.808050135739364e-06, + "loss": 1.2559, + "step": 11452 + }, + { + "epoch": 0.35, + "learning_rate": 3.8078422614303432e-06, + "loss": 1.1047, + "step": 11453 + }, + { + "epoch": 0.35, + "learning_rate": 3.8076343746712954e-06, + "loss": 1.1373, + "step": 11454 + }, + { + "epoch": 0.35, + "learning_rate": 3.8074264754641967e-06, + "loss": 1.1487, + "step": 11455 + }, + { + "epoch": 0.35, + "learning_rate": 3.8072185638110284e-06, + "loss": 1.1046, + "step": 11456 + }, + { + "epoch": 0.35, + "learning_rate": 3.8070106397137687e-06, + "loss": 1.1274, + "step": 11457 + }, + { + "epoch": 0.35, + "learning_rate": 3.806802703174397e-06, + "loss": 1.0967, + "step": 11458 + }, + { + "epoch": 0.35, + "learning_rate": 3.8065947541948933e-06, + "loss": 1.1275, + "step": 11459 + }, + { + "epoch": 0.35, + "learning_rate": 3.806386792777236e-06, + "loss": 1.0096, + "step": 11460 + }, + { + "epoch": 0.35, + "learning_rate": 3.8061788189234066e-06, + "loss": 1.0679, + "step": 11461 + }, + { + "epoch": 0.35, + "learning_rate": 3.8059708326353833e-06, + "loss": 1.1205, + "step": 11462 + }, + { + "epoch": 0.35, + "learning_rate": 3.805762833915147e-06, + "loss": 1.2109, + "step": 11463 + }, + { + "epoch": 0.35, + "learning_rate": 3.805554822764677e-06, + "loss": 1.1859, + "step": 11464 + }, + { + "epoch": 0.35, + "learning_rate": 3.8053467991859545e-06, + "loss": 1.0886, + "step": 11465 + }, + { + "epoch": 0.35, + "learning_rate": 3.8051387631809587e-06, + "loss": 1.0616, + "step": 11466 + }, + { + "epoch": 0.35, + "learning_rate": 3.8049307147516706e-06, + "loss": 1.1133, + "step": 11467 + }, + { + "epoch": 0.35, + "learning_rate": 3.8047226539000704e-06, + "loss": 1.2358, + "step": 11468 + }, + { + "epoch": 0.35, + "learning_rate": 3.804514580628139e-06, + "loss": 1.3397, + "step": 11469 + }, + { + "epoch": 0.35, + "learning_rate": 3.804306494937857e-06, + "loss": 1.0816, + "step": 11470 + }, + { + "epoch": 0.35, + "learning_rate": 3.8040983968312055e-06, + "loss": 1.1488, + "step": 11471 + }, + { + "epoch": 0.35, + "learning_rate": 3.8038902863101655e-06, + "loss": 1.0485, + "step": 11472 + }, + { + "epoch": 0.35, + "learning_rate": 3.8036821633767174e-06, + "loss": 1.1935, + "step": 11473 + }, + { + "epoch": 0.35, + "learning_rate": 3.803474028032844e-06, + "loss": 1.15, + "step": 11474 + }, + { + "epoch": 0.35, + "learning_rate": 3.8032658802805246e-06, + "loss": 1.1705, + "step": 11475 + }, + { + "epoch": 0.35, + "learning_rate": 3.8030577201217424e-06, + "loss": 1.1174, + "step": 11476 + }, + { + "epoch": 0.35, + "learning_rate": 3.802849547558477e-06, + "loss": 1.0398, + "step": 11477 + }, + { + "epoch": 0.35, + "learning_rate": 3.8026413625927127e-06, + "loss": 1.1444, + "step": 11478 + }, + { + "epoch": 0.35, + "learning_rate": 3.8024331652264294e-06, + "loss": 1.1948, + "step": 11479 + }, + { + "epoch": 0.35, + "learning_rate": 3.8022249554616103e-06, + "loss": 1.1248, + "step": 11480 + }, + { + "epoch": 0.35, + "learning_rate": 3.802016733300236e-06, + "loss": 1.2236, + "step": 11481 + }, + { + "epoch": 0.35, + "learning_rate": 3.80180849874429e-06, + "loss": 1.1448, + "step": 11482 + }, + { + "epoch": 0.35, + "learning_rate": 3.801600251795754e-06, + "loss": 1.1776, + "step": 11483 + }, + { + "epoch": 0.35, + "learning_rate": 3.80139199245661e-06, + "loss": 1.1823, + "step": 11484 + }, + { + "epoch": 0.35, + "learning_rate": 3.8011837207288417e-06, + "loss": 1.1415, + "step": 11485 + }, + { + "epoch": 0.35, + "learning_rate": 3.800975436614431e-06, + "loss": 1.134, + "step": 11486 + }, + { + "epoch": 0.35, + "learning_rate": 3.80076714011536e-06, + "loss": 1.1943, + "step": 11487 + }, + { + "epoch": 0.35, + "learning_rate": 3.800558831233613e-06, + "loss": 1.0865, + "step": 11488 + }, + { + "epoch": 0.35, + "learning_rate": 3.800350509971172e-06, + "loss": 1.0847, + "step": 11489 + }, + { + "epoch": 0.35, + "learning_rate": 3.80014217633002e-06, + "loss": 1.0273, + "step": 11490 + }, + { + "epoch": 0.35, + "learning_rate": 3.7999338303121413e-06, + "loss": 1.2169, + "step": 11491 + }, + { + "epoch": 0.35, + "learning_rate": 3.7997254719195186e-06, + "loss": 1.0132, + "step": 11492 + }, + { + "epoch": 0.35, + "learning_rate": 3.7995171011541353e-06, + "loss": 1.1223, + "step": 11493 + }, + { + "epoch": 0.35, + "learning_rate": 3.7993087180179743e-06, + "loss": 1.1423, + "step": 11494 + }, + { + "epoch": 0.35, + "learning_rate": 3.7991003225130206e-06, + "loss": 1.0707, + "step": 11495 + }, + { + "epoch": 0.35, + "learning_rate": 3.7988919146412584e-06, + "loss": 1.1282, + "step": 11496 + }, + { + "epoch": 0.35, + "learning_rate": 3.798683494404669e-06, + "loss": 1.0237, + "step": 11497 + }, + { + "epoch": 0.35, + "learning_rate": 3.79847506180524e-06, + "loss": 1.1532, + "step": 11498 + }, + { + "epoch": 0.35, + "learning_rate": 3.7982666168449528e-06, + "loss": 1.1275, + "step": 11499 + }, + { + "epoch": 0.35, + "learning_rate": 3.798058159525793e-06, + "loss": 1.0451, + "step": 11500 + }, + { + "epoch": 0.35, + "learning_rate": 3.7978496898497443e-06, + "loss": 1.1316, + "step": 11501 + }, + { + "epoch": 0.35, + "learning_rate": 3.797641207818792e-06, + "loss": 1.0974, + "step": 11502 + }, + { + "epoch": 0.35, + "learning_rate": 3.79743271343492e-06, + "loss": 1.1494, + "step": 11503 + }, + { + "epoch": 0.35, + "learning_rate": 3.797224206700113e-06, + "loss": 1.1258, + "step": 11504 + }, + { + "epoch": 0.35, + "learning_rate": 3.797015687616357e-06, + "loss": 1.1487, + "step": 11505 + }, + { + "epoch": 0.35, + "learning_rate": 3.796807156185637e-06, + "loss": 1.1003, + "step": 11506 + }, + { + "epoch": 0.35, + "learning_rate": 3.7965986124099362e-06, + "loss": 1.043, + "step": 11507 + }, + { + "epoch": 0.35, + "learning_rate": 3.7963900562912414e-06, + "loss": 1.1001, + "step": 11508 + }, + { + "epoch": 0.35, + "learning_rate": 3.7961814878315382e-06, + "loss": 1.0365, + "step": 11509 + }, + { + "epoch": 0.35, + "learning_rate": 3.795972907032811e-06, + "loss": 1.1608, + "step": 11510 + }, + { + "epoch": 0.35, + "learning_rate": 3.7957643138970458e-06, + "loss": 1.1598, + "step": 11511 + }, + { + "epoch": 0.35, + "learning_rate": 3.7955557084262286e-06, + "loss": 1.1849, + "step": 11512 + }, + { + "epoch": 0.35, + "learning_rate": 3.7953470906223454e-06, + "loss": 1.1354, + "step": 11513 + }, + { + "epoch": 0.35, + "learning_rate": 3.7951384604873807e-06, + "loss": 1.1715, + "step": 11514 + }, + { + "epoch": 0.35, + "learning_rate": 3.794929818023323e-06, + "loss": 1.1185, + "step": 11515 + }, + { + "epoch": 0.35, + "learning_rate": 3.7947211632321557e-06, + "loss": 1.233, + "step": 11516 + }, + { + "epoch": 0.35, + "learning_rate": 3.7945124961158676e-06, + "loss": 1.2098, + "step": 11517 + }, + { + "epoch": 0.35, + "learning_rate": 3.7943038166764427e-06, + "loss": 1.0251, + "step": 11518 + }, + { + "epoch": 0.35, + "learning_rate": 3.7940951249158704e-06, + "loss": 1.197, + "step": 11519 + }, + { + "epoch": 0.35, + "learning_rate": 3.7938864208361347e-06, + "loss": 1.1926, + "step": 11520 + }, + { + "epoch": 0.35, + "learning_rate": 3.7936777044392236e-06, + "loss": 1.0954, + "step": 11521 + }, + { + "epoch": 0.35, + "learning_rate": 3.7934689757271236e-06, + "loss": 1.0927, + "step": 11522 + }, + { + "epoch": 0.35, + "learning_rate": 3.793260234701822e-06, + "loss": 1.2058, + "step": 11523 + }, + { + "epoch": 0.35, + "learning_rate": 3.793051481365307e-06, + "loss": 1.0874, + "step": 11524 + }, + { + "epoch": 0.35, + "learning_rate": 3.7928427157195634e-06, + "loss": 1.227, + "step": 11525 + }, + { + "epoch": 0.35, + "learning_rate": 3.7926339377665806e-06, + "loss": 1.1355, + "step": 11526 + }, + { + "epoch": 0.35, + "learning_rate": 3.7924251475083444e-06, + "loss": 1.1678, + "step": 11527 + }, + { + "epoch": 0.35, + "learning_rate": 3.7922163449468442e-06, + "loss": 1.1815, + "step": 11528 + }, + { + "epoch": 0.35, + "learning_rate": 3.7920075300840658e-06, + "loss": 1.1586, + "step": 11529 + }, + { + "epoch": 0.35, + "learning_rate": 3.7917987029219983e-06, + "loss": 1.2297, + "step": 11530 + }, + { + "epoch": 0.35, + "learning_rate": 3.791589863462629e-06, + "loss": 1.1122, + "step": 11531 + }, + { + "epoch": 0.35, + "learning_rate": 3.791381011707947e-06, + "loss": 1.1852, + "step": 11532 + }, + { + "epoch": 0.35, + "learning_rate": 3.7911721476599396e-06, + "loss": 1.1077, + "step": 11533 + }, + { + "epoch": 0.35, + "learning_rate": 3.7909632713205944e-06, + "loss": 1.1136, + "step": 11534 + }, + { + "epoch": 0.35, + "learning_rate": 3.7907543826919015e-06, + "loss": 1.0233, + "step": 11535 + }, + { + "epoch": 0.35, + "learning_rate": 3.790545481775848e-06, + "loss": 1.2828, + "step": 11536 + }, + { + "epoch": 0.35, + "learning_rate": 3.790336568574423e-06, + "loss": 1.1852, + "step": 11537 + }, + { + "epoch": 0.35, + "learning_rate": 3.7901276430896156e-06, + "loss": 1.0674, + "step": 11538 + }, + { + "epoch": 0.35, + "learning_rate": 3.7899187053234144e-06, + "loss": 1.0966, + "step": 11539 + }, + { + "epoch": 0.35, + "learning_rate": 3.7897097552778084e-06, + "loss": 1.1422, + "step": 11540 + }, + { + "epoch": 0.35, + "learning_rate": 3.7895007929547868e-06, + "loss": 1.1657, + "step": 11541 + }, + { + "epoch": 0.35, + "learning_rate": 3.7892918183563388e-06, + "loss": 1.0937, + "step": 11542 + }, + { + "epoch": 0.35, + "learning_rate": 3.789082831484453e-06, + "loss": 1.0333, + "step": 11543 + }, + { + "epoch": 0.35, + "learning_rate": 3.78887383234112e-06, + "loss": 1.1923, + "step": 11544 + }, + { + "epoch": 0.35, + "learning_rate": 3.7886648209283283e-06, + "loss": 1.127, + "step": 11545 + }, + { + "epoch": 0.35, + "learning_rate": 3.7884557972480683e-06, + "loss": 0.9929, + "step": 11546 + }, + { + "epoch": 0.35, + "learning_rate": 3.78824676130233e-06, + "loss": 1.0187, + "step": 11547 + }, + { + "epoch": 0.35, + "learning_rate": 3.7880377130931028e-06, + "loss": 1.2426, + "step": 11548 + }, + { + "epoch": 0.35, + "learning_rate": 3.7878286526223767e-06, + "loss": 1.2594, + "step": 11549 + }, + { + "epoch": 0.35, + "learning_rate": 3.787619579892142e-06, + "loss": 1.2211, + "step": 11550 + }, + { + "epoch": 0.35, + "learning_rate": 3.78741049490439e-06, + "loss": 1.1074, + "step": 11551 + }, + { + "epoch": 0.35, + "learning_rate": 3.7872013976611094e-06, + "loss": 1.0857, + "step": 11552 + }, + { + "epoch": 0.35, + "learning_rate": 3.7869922881642917e-06, + "loss": 1.103, + "step": 11553 + }, + { + "epoch": 0.35, + "learning_rate": 3.786783166415927e-06, + "loss": 1.1523, + "step": 11554 + }, + { + "epoch": 0.35, + "learning_rate": 3.7865740324180062e-06, + "loss": 1.1348, + "step": 11555 + }, + { + "epoch": 0.35, + "learning_rate": 3.786364886172521e-06, + "loss": 1.2645, + "step": 11556 + }, + { + "epoch": 0.35, + "learning_rate": 3.7861557276814607e-06, + "loss": 1.2441, + "step": 11557 + }, + { + "epoch": 0.35, + "learning_rate": 3.785946556946817e-06, + "loss": 1.1086, + "step": 11558 + }, + { + "epoch": 0.35, + "learning_rate": 3.785737373970582e-06, + "loss": 1.0829, + "step": 11559 + }, + { + "epoch": 0.35, + "learning_rate": 3.785528178754747e-06, + "loss": 1.1699, + "step": 11560 + }, + { + "epoch": 0.35, + "learning_rate": 3.7853189713013018e-06, + "loss": 1.1588, + "step": 11561 + }, + { + "epoch": 0.35, + "learning_rate": 3.785109751612239e-06, + "loss": 1.1716, + "step": 11562 + }, + { + "epoch": 0.35, + "learning_rate": 3.7849005196895516e-06, + "loss": 1.1131, + "step": 11563 + }, + { + "epoch": 0.35, + "learning_rate": 3.7846912755352293e-06, + "loss": 1.1068, + "step": 11564 + }, + { + "epoch": 0.35, + "learning_rate": 3.784482019151265e-06, + "loss": 1.032, + "step": 11565 + }, + { + "epoch": 0.35, + "learning_rate": 3.7842727505396506e-06, + "loss": 1.1832, + "step": 11566 + }, + { + "epoch": 0.35, + "learning_rate": 3.7840634697023778e-06, + "loss": 1.1459, + "step": 11567 + }, + { + "epoch": 0.35, + "learning_rate": 3.7838541766414387e-06, + "loss": 1.1866, + "step": 11568 + }, + { + "epoch": 0.35, + "learning_rate": 3.7836448713588268e-06, + "loss": 1.0855, + "step": 11569 + }, + { + "epoch": 0.35, + "learning_rate": 3.7834355538565343e-06, + "loss": 1.1551, + "step": 11570 + }, + { + "epoch": 0.35, + "learning_rate": 3.7832262241365526e-06, + "loss": 1.1229, + "step": 11571 + }, + { + "epoch": 0.35, + "learning_rate": 3.7830168822008756e-06, + "loss": 1.1301, + "step": 11572 + }, + { + "epoch": 0.35, + "learning_rate": 3.7828075280514964e-06, + "loss": 1.173, + "step": 11573 + }, + { + "epoch": 0.35, + "learning_rate": 3.782598161690406e-06, + "loss": 1.3577, + "step": 11574 + }, + { + "epoch": 0.35, + "learning_rate": 3.7823887831196e-06, + "loss": 1.0618, + "step": 11575 + }, + { + "epoch": 0.35, + "learning_rate": 3.78217939234107e-06, + "loss": 1.0595, + "step": 11576 + }, + { + "epoch": 0.35, + "learning_rate": 3.7819699893568095e-06, + "loss": 1.1329, + "step": 11577 + }, + { + "epoch": 0.35, + "learning_rate": 3.7817605741688135e-06, + "loss": 1.1906, + "step": 11578 + }, + { + "epoch": 0.35, + "learning_rate": 3.781551146779072e-06, + "loss": 1.1638, + "step": 11579 + }, + { + "epoch": 0.35, + "learning_rate": 3.7813417071895824e-06, + "loss": 1.2184, + "step": 11580 + }, + { + "epoch": 0.35, + "learning_rate": 3.7811322554023367e-06, + "loss": 1.2156, + "step": 11581 + }, + { + "epoch": 0.35, + "learning_rate": 3.780922791419328e-06, + "loss": 1.119, + "step": 11582 + }, + { + "epoch": 0.35, + "learning_rate": 3.7807133152425523e-06, + "loss": 1.1309, + "step": 11583 + }, + { + "epoch": 0.35, + "learning_rate": 3.7805038268740022e-06, + "loss": 1.1072, + "step": 11584 + }, + { + "epoch": 0.35, + "learning_rate": 3.7802943263156722e-06, + "loss": 1.248, + "step": 11585 + }, + { + "epoch": 0.35, + "learning_rate": 3.7800848135695567e-06, + "loss": 1.1584, + "step": 11586 + }, + { + "epoch": 0.35, + "learning_rate": 3.77987528863765e-06, + "loss": 1.2812, + "step": 11587 + }, + { + "epoch": 0.35, + "learning_rate": 3.7796657515219476e-06, + "loss": 1.095, + "step": 11588 + }, + { + "epoch": 0.35, + "learning_rate": 3.779456202224444e-06, + "loss": 1.1165, + "step": 11589 + }, + { + "epoch": 0.35, + "learning_rate": 3.779246640747133e-06, + "loss": 1.1254, + "step": 11590 + }, + { + "epoch": 0.35, + "learning_rate": 3.7790370670920094e-06, + "loss": 1.0404, + "step": 11591 + }, + { + "epoch": 0.35, + "learning_rate": 3.77882748126107e-06, + "loss": 1.1212, + "step": 11592 + }, + { + "epoch": 0.35, + "learning_rate": 3.778617883256309e-06, + "loss": 1.2705, + "step": 11593 + }, + { + "epoch": 0.35, + "learning_rate": 3.7784082730797206e-06, + "loss": 0.9623, + "step": 11594 + }, + { + "epoch": 0.35, + "learning_rate": 3.778198650733302e-06, + "loss": 1.0903, + "step": 11595 + }, + { + "epoch": 0.35, + "learning_rate": 3.777989016219047e-06, + "loss": 1.1144, + "step": 11596 + }, + { + "epoch": 0.35, + "learning_rate": 3.777779369538953e-06, + "loss": 1.1439, + "step": 11597 + }, + { + "epoch": 0.35, + "learning_rate": 3.777569710695014e-06, + "loss": 1.066, + "step": 11598 + }, + { + "epoch": 0.35, + "learning_rate": 3.777360039689227e-06, + "loss": 1.1967, + "step": 11599 + }, + { + "epoch": 0.35, + "learning_rate": 3.7771503565235874e-06, + "loss": 1.3215, + "step": 11600 + }, + { + "epoch": 0.35, + "learning_rate": 3.7769406612000914e-06, + "loss": 1.0692, + "step": 11601 + }, + { + "epoch": 0.35, + "learning_rate": 3.776730953720736e-06, + "loss": 1.1158, + "step": 11602 + }, + { + "epoch": 0.35, + "learning_rate": 3.776521234087516e-06, + "loss": 1.1293, + "step": 11603 + }, + { + "epoch": 0.35, + "learning_rate": 3.7763115023024295e-06, + "loss": 1.1824, + "step": 11604 + }, + { + "epoch": 0.35, + "learning_rate": 3.776101758367472e-06, + "loss": 1.027, + "step": 11605 + }, + { + "epoch": 0.35, + "learning_rate": 3.77589200228464e-06, + "loss": 1.1016, + "step": 11606 + }, + { + "epoch": 0.35, + "learning_rate": 3.7756822340559307e-06, + "loss": 1.1327, + "step": 11607 + }, + { + "epoch": 0.35, + "learning_rate": 3.775472453683341e-06, + "loss": 1.1802, + "step": 11608 + }, + { + "epoch": 0.35, + "learning_rate": 3.7752626611688675e-06, + "loss": 1.0864, + "step": 11609 + }, + { + "epoch": 0.35, + "learning_rate": 3.7750528565145083e-06, + "loss": 1.262, + "step": 11610 + }, + { + "epoch": 0.35, + "learning_rate": 3.7748430397222593e-06, + "loss": 1.1107, + "step": 11611 + }, + { + "epoch": 0.35, + "learning_rate": 3.7746332107941186e-06, + "loss": 1.183, + "step": 11612 + }, + { + "epoch": 0.35, + "learning_rate": 3.7744233697320844e-06, + "loss": 1.176, + "step": 11613 + }, + { + "epoch": 0.35, + "learning_rate": 3.7742135165381528e-06, + "loss": 1.1157, + "step": 11614 + }, + { + "epoch": 0.35, + "learning_rate": 3.7740036512143218e-06, + "loss": 1.0992, + "step": 11615 + }, + { + "epoch": 0.35, + "learning_rate": 3.773793773762591e-06, + "loss": 1.1197, + "step": 11616 + }, + { + "epoch": 0.35, + "learning_rate": 3.7735838841849557e-06, + "loss": 1.1236, + "step": 11617 + }, + { + "epoch": 0.35, + "learning_rate": 3.773373982483416e-06, + "loss": 1.0708, + "step": 11618 + }, + { + "epoch": 0.35, + "learning_rate": 3.773164068659969e-06, + "loss": 1.1699, + "step": 11619 + }, + { + "epoch": 0.35, + "learning_rate": 3.7729541427166128e-06, + "loss": 1.0662, + "step": 11620 + }, + { + "epoch": 0.35, + "learning_rate": 3.772744204655347e-06, + "loss": 1.142, + "step": 11621 + }, + { + "epoch": 0.35, + "learning_rate": 3.7725342544781686e-06, + "loss": 1.1577, + "step": 11622 + }, + { + "epoch": 0.35, + "learning_rate": 3.7723242921870777e-06, + "loss": 1.1537, + "step": 11623 + }, + { + "epoch": 0.35, + "learning_rate": 3.7721143177840717e-06, + "loss": 1.1979, + "step": 11624 + }, + { + "epoch": 0.35, + "learning_rate": 3.7719043312711513e-06, + "loss": 1.1144, + "step": 11625 + }, + { + "epoch": 0.35, + "learning_rate": 3.7716943326503125e-06, + "loss": 1.0674, + "step": 11626 + }, + { + "epoch": 0.35, + "learning_rate": 3.7714843219235564e-06, + "loss": 1.0956, + "step": 11627 + }, + { + "epoch": 0.35, + "learning_rate": 3.7712742990928825e-06, + "loss": 1.0945, + "step": 11628 + }, + { + "epoch": 0.35, + "learning_rate": 3.771064264160289e-06, + "loss": 1.129, + "step": 11629 + }, + { + "epoch": 0.35, + "learning_rate": 3.7708542171277766e-06, + "loss": 1.2065, + "step": 11630 + }, + { + "epoch": 0.35, + "learning_rate": 3.770644157997344e-06, + "loss": 1.0896, + "step": 11631 + }, + { + "epoch": 0.35, + "learning_rate": 3.770434086770991e-06, + "loss": 1.0648, + "step": 11632 + }, + { + "epoch": 0.35, + "learning_rate": 3.770224003450717e-06, + "loss": 1.1597, + "step": 11633 + }, + { + "epoch": 0.35, + "learning_rate": 3.770013908038522e-06, + "loss": 1.1068, + "step": 11634 + }, + { + "epoch": 0.35, + "learning_rate": 3.769803800536407e-06, + "loss": 1.1386, + "step": 11635 + }, + { + "epoch": 0.35, + "learning_rate": 3.769593680946372e-06, + "loss": 1.212, + "step": 11636 + }, + { + "epoch": 0.35, + "learning_rate": 3.769383549270415e-06, + "loss": 1.1442, + "step": 11637 + }, + { + "epoch": 0.35, + "learning_rate": 3.7691734055105388e-06, + "loss": 1.0707, + "step": 11638 + }, + { + "epoch": 0.35, + "learning_rate": 3.768963249668743e-06, + "loss": 1.0565, + "step": 11639 + }, + { + "epoch": 0.35, + "learning_rate": 3.7687530817470273e-06, + "loss": 1.0045, + "step": 11640 + }, + { + "epoch": 0.35, + "learning_rate": 3.768542901747394e-06, + "loss": 1.0876, + "step": 11641 + }, + { + "epoch": 0.35, + "learning_rate": 3.7683327096718436e-06, + "loss": 1.0887, + "step": 11642 + }, + { + "epoch": 0.35, + "learning_rate": 3.7681225055223764e-06, + "loss": 1.1109, + "step": 11643 + }, + { + "epoch": 0.35, + "learning_rate": 3.7679122893009935e-06, + "loss": 1.2625, + "step": 11644 + }, + { + "epoch": 0.35, + "learning_rate": 3.767702061009697e-06, + "loss": 1.1012, + "step": 11645 + }, + { + "epoch": 0.35, + "learning_rate": 3.767491820650486e-06, + "loss": 1.1201, + "step": 11646 + }, + { + "epoch": 0.35, + "learning_rate": 3.767281568225365e-06, + "loss": 1.1528, + "step": 11647 + }, + { + "epoch": 0.35, + "learning_rate": 3.7670713037363326e-06, + "loss": 1.1953, + "step": 11648 + }, + { + "epoch": 0.35, + "learning_rate": 3.7668610271853923e-06, + "loss": 1.1407, + "step": 11649 + }, + { + "epoch": 0.35, + "learning_rate": 3.7666507385745442e-06, + "loss": 1.1937, + "step": 11650 + }, + { + "epoch": 0.35, + "learning_rate": 3.766440437905793e-06, + "loss": 1.0328, + "step": 11651 + }, + { + "epoch": 0.35, + "learning_rate": 3.7662301251811367e-06, + "loss": 1.2462, + "step": 11652 + }, + { + "epoch": 0.35, + "learning_rate": 3.7660198004025806e-06, + "loss": 1.033, + "step": 11653 + }, + { + "epoch": 0.35, + "learning_rate": 3.7658094635721247e-06, + "loss": 1.1545, + "step": 11654 + }, + { + "epoch": 0.35, + "learning_rate": 3.7655991146917735e-06, + "loss": 1.064, + "step": 11655 + }, + { + "epoch": 0.35, + "learning_rate": 3.7653887537635275e-06, + "loss": 1.0629, + "step": 11656 + }, + { + "epoch": 0.35, + "learning_rate": 3.7651783807893906e-06, + "loss": 1.1277, + "step": 11657 + }, + { + "epoch": 0.35, + "learning_rate": 3.7649679957713645e-06, + "loss": 1.1581, + "step": 11658 + }, + { + "epoch": 0.35, + "learning_rate": 3.7647575987114523e-06, + "loss": 1.1296, + "step": 11659 + }, + { + "epoch": 0.35, + "learning_rate": 3.764547189611657e-06, + "loss": 1.0889, + "step": 11660 + }, + { + "epoch": 0.35, + "learning_rate": 3.764336768473982e-06, + "loss": 1.1626, + "step": 11661 + }, + { + "epoch": 0.35, + "learning_rate": 3.7641263353004286e-06, + "loss": 1.0992, + "step": 11662 + }, + { + "epoch": 0.35, + "learning_rate": 3.7639158900930024e-06, + "loss": 1.1335, + "step": 11663 + }, + { + "epoch": 0.35, + "learning_rate": 3.7637054328537053e-06, + "loss": 1.2161, + "step": 11664 + }, + { + "epoch": 0.35, + "learning_rate": 3.763494963584541e-06, + "loss": 1.1268, + "step": 11665 + }, + { + "epoch": 0.35, + "learning_rate": 3.7632844822875138e-06, + "loss": 1.1375, + "step": 11666 + }, + { + "epoch": 0.35, + "learning_rate": 3.7630739889646262e-06, + "loss": 1.1046, + "step": 11667 + }, + { + "epoch": 0.35, + "learning_rate": 3.7628634836178824e-06, + "loss": 1.0972, + "step": 11668 + }, + { + "epoch": 0.35, + "learning_rate": 3.7626529662492863e-06, + "loss": 0.9966, + "step": 11669 + }, + { + "epoch": 0.35, + "learning_rate": 3.762442436860842e-06, + "loss": 1.1375, + "step": 11670 + }, + { + "epoch": 0.35, + "learning_rate": 3.7622318954545547e-06, + "loss": 1.2474, + "step": 11671 + }, + { + "epoch": 0.35, + "learning_rate": 3.7620213420324264e-06, + "loss": 1.1378, + "step": 11672 + }, + { + "epoch": 0.35, + "learning_rate": 3.761810776596464e-06, + "loss": 1.1408, + "step": 11673 + }, + { + "epoch": 0.35, + "learning_rate": 3.7616001991486696e-06, + "loss": 1.2484, + "step": 11674 + }, + { + "epoch": 0.35, + "learning_rate": 3.7613896096910497e-06, + "loss": 1.123, + "step": 11675 + }, + { + "epoch": 0.35, + "learning_rate": 3.761179008225608e-06, + "loss": 1.0927, + "step": 11676 + }, + { + "epoch": 0.35, + "learning_rate": 3.7609683947543497e-06, + "loss": 1.1171, + "step": 11677 + }, + { + "epoch": 0.35, + "learning_rate": 3.760757769279279e-06, + "loss": 1.0956, + "step": 11678 + }, + { + "epoch": 0.35, + "learning_rate": 3.760547131802402e-06, + "loss": 0.9976, + "step": 11679 + }, + { + "epoch": 0.35, + "learning_rate": 3.7603364823257238e-06, + "loss": 1.0374, + "step": 11680 + }, + { + "epoch": 0.35, + "learning_rate": 3.760125820851248e-06, + "loss": 1.0484, + "step": 11681 + }, + { + "epoch": 0.35, + "learning_rate": 3.7599151473809825e-06, + "loss": 1.0726, + "step": 11682 + }, + { + "epoch": 0.35, + "learning_rate": 3.759704461916931e-06, + "loss": 1.1344, + "step": 11683 + }, + { + "epoch": 0.35, + "learning_rate": 3.7594937644610997e-06, + "loss": 1.1495, + "step": 11684 + }, + { + "epoch": 0.35, + "learning_rate": 3.7592830550154946e-06, + "loss": 1.1611, + "step": 11685 + }, + { + "epoch": 0.35, + "learning_rate": 3.7590723335821217e-06, + "loss": 1.2042, + "step": 11686 + }, + { + "epoch": 0.35, + "learning_rate": 3.758861600162986e-06, + "loss": 1.1734, + "step": 11687 + }, + { + "epoch": 0.35, + "learning_rate": 3.7586508547600943e-06, + "loss": 1.2637, + "step": 11688 + }, + { + "epoch": 0.35, + "learning_rate": 3.7584400973754524e-06, + "loss": 1.26, + "step": 11689 + }, + { + "epoch": 0.35, + "learning_rate": 3.7582293280110677e-06, + "loss": 1.1481, + "step": 11690 + }, + { + "epoch": 0.35, + "learning_rate": 3.7580185466689447e-06, + "loss": 1.0762, + "step": 11691 + }, + { + "epoch": 0.35, + "learning_rate": 3.7578077533510917e-06, + "loss": 1.2324, + "step": 11692 + }, + { + "epoch": 0.35, + "learning_rate": 3.7575969480595144e-06, + "loss": 1.1107, + "step": 11693 + }, + { + "epoch": 0.35, + "learning_rate": 3.75738613079622e-06, + "loss": 1.2227, + "step": 11694 + }, + { + "epoch": 0.35, + "learning_rate": 3.757175301563215e-06, + "loss": 1.1287, + "step": 11695 + }, + { + "epoch": 0.35, + "learning_rate": 3.7569644603625064e-06, + "loss": 1.0626, + "step": 11696 + }, + { + "epoch": 0.35, + "learning_rate": 3.756753607196102e-06, + "loss": 1.2933, + "step": 11697 + }, + { + "epoch": 0.35, + "learning_rate": 3.756542742066008e-06, + "loss": 1.1819, + "step": 11698 + }, + { + "epoch": 0.35, + "learning_rate": 3.756331864974233e-06, + "loss": 1.1089, + "step": 11699 + }, + { + "epoch": 0.35, + "learning_rate": 3.7561209759227834e-06, + "loss": 1.162, + "step": 11700 + }, + { + "epoch": 0.35, + "learning_rate": 3.7559100749136667e-06, + "loss": 1.1929, + "step": 11701 + }, + { + "epoch": 0.35, + "learning_rate": 3.7556991619488913e-06, + "loss": 1.1325, + "step": 11702 + }, + { + "epoch": 0.35, + "learning_rate": 3.755488237030465e-06, + "loss": 1.0609, + "step": 11703 + }, + { + "epoch": 0.35, + "learning_rate": 3.7552773001603947e-06, + "loss": 1.1233, + "step": 11704 + }, + { + "epoch": 0.35, + "learning_rate": 3.75506635134069e-06, + "loss": 1.1355, + "step": 11705 + }, + { + "epoch": 0.35, + "learning_rate": 3.754855390573357e-06, + "loss": 1.067, + "step": 11706 + }, + { + "epoch": 0.35, + "learning_rate": 3.7546444178604056e-06, + "loss": 1.1366, + "step": 11707 + }, + { + "epoch": 0.35, + "learning_rate": 3.7544334332038436e-06, + "loss": 1.1355, + "step": 11708 + }, + { + "epoch": 0.35, + "learning_rate": 3.754222436605679e-06, + "loss": 1.1851, + "step": 11709 + }, + { + "epoch": 0.35, + "learning_rate": 3.7540114280679214e-06, + "loss": 1.2003, + "step": 11710 + }, + { + "epoch": 0.35, + "learning_rate": 3.753800407592578e-06, + "loss": 1.218, + "step": 11711 + }, + { + "epoch": 0.35, + "learning_rate": 3.75358937518166e-06, + "loss": 1.1575, + "step": 11712 + }, + { + "epoch": 0.35, + "learning_rate": 3.7533783308371742e-06, + "loss": 1.0385, + "step": 11713 + }, + { + "epoch": 0.35, + "learning_rate": 3.75316727456113e-06, + "loss": 1.166, + "step": 11714 + }, + { + "epoch": 0.35, + "learning_rate": 3.7529562063555375e-06, + "loss": 1.1235, + "step": 11715 + }, + { + "epoch": 0.35, + "learning_rate": 3.7527451262224055e-06, + "loss": 1.0765, + "step": 11716 + }, + { + "epoch": 0.35, + "learning_rate": 3.752534034163743e-06, + "loss": 1.1701, + "step": 11717 + }, + { + "epoch": 0.35, + "learning_rate": 3.7523229301815594e-06, + "loss": 1.1407, + "step": 11718 + }, + { + "epoch": 0.35, + "learning_rate": 3.7521118142778644e-06, + "loss": 1.0695, + "step": 11719 + }, + { + "epoch": 0.35, + "learning_rate": 3.7519006864546693e-06, + "loss": 1.2526, + "step": 11720 + }, + { + "epoch": 0.35, + "learning_rate": 3.7516895467139814e-06, + "loss": 0.9993, + "step": 11721 + }, + { + "epoch": 0.35, + "learning_rate": 3.7514783950578113e-06, + "loss": 1.1353, + "step": 11722 + }, + { + "epoch": 0.35, + "learning_rate": 3.751267231488171e-06, + "loss": 1.1438, + "step": 11723 + }, + { + "epoch": 0.35, + "learning_rate": 3.7510560560070687e-06, + "loss": 0.9665, + "step": 11724 + }, + { + "epoch": 0.35, + "learning_rate": 3.7508448686165153e-06, + "loss": 1.1051, + "step": 11725 + }, + { + "epoch": 0.35, + "learning_rate": 3.750633669318521e-06, + "loss": 1.0854, + "step": 11726 + }, + { + "epoch": 0.35, + "learning_rate": 3.750422458115097e-06, + "loss": 1.063, + "step": 11727 + }, + { + "epoch": 0.35, + "learning_rate": 3.750211235008253e-06, + "loss": 1.0837, + "step": 11728 + }, + { + "epoch": 0.35, + "learning_rate": 3.7500000000000005e-06, + "loss": 1.2133, + "step": 11729 + }, + { + "epoch": 0.35, + "learning_rate": 3.7497887530923493e-06, + "loss": 1.1534, + "step": 11730 + }, + { + "epoch": 0.35, + "learning_rate": 3.749577494287312e-06, + "loss": 1.1332, + "step": 11731 + }, + { + "epoch": 0.35, + "learning_rate": 3.749366223586898e-06, + "loss": 1.1259, + "step": 11732 + }, + { + "epoch": 0.35, + "learning_rate": 3.7491549409931204e-06, + "loss": 1.1632, + "step": 11733 + }, + { + "epoch": 0.35, + "learning_rate": 3.748943646507989e-06, + "loss": 1.1445, + "step": 11734 + }, + { + "epoch": 0.35, + "learning_rate": 3.7487323401335146e-06, + "loss": 1.0917, + "step": 11735 + }, + { + "epoch": 0.35, + "learning_rate": 3.74852102187171e-06, + "loss": 1.165, + "step": 11736 + }, + { + "epoch": 0.35, + "learning_rate": 3.7483096917245866e-06, + "loss": 1.1645, + "step": 11737 + }, + { + "epoch": 0.35, + "learning_rate": 3.748098349694157e-06, + "loss": 1.1656, + "step": 11738 + }, + { + "epoch": 0.35, + "learning_rate": 3.7478869957824315e-06, + "loss": 0.9963, + "step": 11739 + }, + { + "epoch": 0.35, + "learning_rate": 3.747675629991423e-06, + "loss": 1.0436, + "step": 11740 + }, + { + "epoch": 0.35, + "learning_rate": 3.747464252323143e-06, + "loss": 1.1984, + "step": 11741 + }, + { + "epoch": 0.35, + "learning_rate": 3.747252862779605e-06, + "loss": 1.1801, + "step": 11742 + }, + { + "epoch": 0.35, + "learning_rate": 3.7470414613628196e-06, + "loss": 1.1226, + "step": 11743 + }, + { + "epoch": 0.35, + "learning_rate": 3.746830048074801e-06, + "loss": 1.1779, + "step": 11744 + }, + { + "epoch": 0.35, + "learning_rate": 3.74661862291756e-06, + "loss": 1.0593, + "step": 11745 + }, + { + "epoch": 0.35, + "learning_rate": 3.7464071858931106e-06, + "loss": 1.1439, + "step": 11746 + }, + { + "epoch": 0.35, + "learning_rate": 3.746195737003465e-06, + "loss": 1.084, + "step": 11747 + }, + { + "epoch": 0.35, + "learning_rate": 3.745984276250636e-06, + "loss": 0.9449, + "step": 11748 + }, + { + "epoch": 0.35, + "learning_rate": 3.745772803636637e-06, + "loss": 1.166, + "step": 11749 + }, + { + "epoch": 0.35, + "learning_rate": 3.7455613191634805e-06, + "loss": 1.0461, + "step": 11750 + }, + { + "epoch": 0.35, + "learning_rate": 3.7453498228331798e-06, + "loss": 1.063, + "step": 11751 + }, + { + "epoch": 0.35, + "learning_rate": 3.745138314647749e-06, + "loss": 1.075, + "step": 11752 + }, + { + "epoch": 0.35, + "learning_rate": 3.7449267946092017e-06, + "loss": 1.1021, + "step": 11753 + }, + { + "epoch": 0.35, + "learning_rate": 3.74471526271955e-06, + "loss": 1.1351, + "step": 11754 + }, + { + "epoch": 0.35, + "learning_rate": 3.744503718980809e-06, + "loss": 1.3168, + "step": 11755 + }, + { + "epoch": 0.35, + "learning_rate": 3.7442921633949917e-06, + "loss": 1.091, + "step": 11756 + }, + { + "epoch": 0.35, + "learning_rate": 3.744080595964113e-06, + "loss": 1.1584, + "step": 11757 + }, + { + "epoch": 0.35, + "learning_rate": 3.7438690166901854e-06, + "loss": 1.1551, + "step": 11758 + }, + { + "epoch": 0.35, + "learning_rate": 3.7436574255752246e-06, + "loss": 1.157, + "step": 11759 + }, + { + "epoch": 0.35, + "learning_rate": 3.743445822621243e-06, + "loss": 1.2008, + "step": 11760 + }, + { + "epoch": 0.35, + "learning_rate": 3.7432342078302563e-06, + "loss": 1.1216, + "step": 11761 + }, + { + "epoch": 0.35, + "learning_rate": 3.743022581204279e-06, + "loss": 1.1517, + "step": 11762 + }, + { + "epoch": 0.35, + "learning_rate": 3.742810942745325e-06, + "loss": 1.1605, + "step": 11763 + }, + { + "epoch": 0.35, + "learning_rate": 3.74259929245541e-06, + "loss": 1.1515, + "step": 11764 + }, + { + "epoch": 0.35, + "learning_rate": 3.742387630336548e-06, + "loss": 1.2144, + "step": 11765 + }, + { + "epoch": 0.35, + "learning_rate": 3.742175956390754e-06, + "loss": 1.0444, + "step": 11766 + }, + { + "epoch": 0.35, + "learning_rate": 3.741964270620043e-06, + "loss": 1.1575, + "step": 11767 + }, + { + "epoch": 0.35, + "learning_rate": 3.741752573026431e-06, + "loss": 1.1555, + "step": 11768 + }, + { + "epoch": 0.35, + "learning_rate": 3.7415408636119315e-06, + "loss": 1.1666, + "step": 11769 + }, + { + "epoch": 0.35, + "learning_rate": 3.741329142378562e-06, + "loss": 1.2279, + "step": 11770 + }, + { + "epoch": 0.35, + "learning_rate": 3.7411174093283367e-06, + "loss": 1.2053, + "step": 11771 + }, + { + "epoch": 0.35, + "learning_rate": 3.740905664463271e-06, + "loss": 1.0906, + "step": 11772 + }, + { + "epoch": 0.35, + "learning_rate": 3.740693907785381e-06, + "loss": 1.0375, + "step": 11773 + }, + { + "epoch": 0.35, + "learning_rate": 3.7404821392966823e-06, + "loss": 1.17, + "step": 11774 + }, + { + "epoch": 0.35, + "learning_rate": 3.7402703589991917e-06, + "loss": 1.2852, + "step": 11775 + }, + { + "epoch": 0.35, + "learning_rate": 3.740058566894924e-06, + "loss": 1.0644, + "step": 11776 + }, + { + "epoch": 0.35, + "learning_rate": 3.7398467629858957e-06, + "loss": 1.183, + "step": 11777 + }, + { + "epoch": 0.35, + "learning_rate": 3.739634947274124e-06, + "loss": 1.0477, + "step": 11778 + }, + { + "epoch": 0.35, + "learning_rate": 3.7394231197616248e-06, + "loss": 1.1368, + "step": 11779 + }, + { + "epoch": 0.35, + "learning_rate": 3.7392112804504144e-06, + "loss": 1.2888, + "step": 11780 + }, + { + "epoch": 0.35, + "learning_rate": 3.7389994293425093e-06, + "loss": 1.1457, + "step": 11781 + }, + { + "epoch": 0.35, + "learning_rate": 3.7387875664399257e-06, + "loss": 1.101, + "step": 11782 + }, + { + "epoch": 0.35, + "learning_rate": 3.7385756917446827e-06, + "loss": 1.0768, + "step": 11783 + }, + { + "epoch": 0.35, + "learning_rate": 3.738363805258794e-06, + "loss": 1.1381, + "step": 11784 + }, + { + "epoch": 0.36, + "learning_rate": 3.7381519069842793e-06, + "loss": 1.1242, + "step": 11785 + }, + { + "epoch": 0.36, + "learning_rate": 3.7379399969231537e-06, + "loss": 1.1853, + "step": 11786 + }, + { + "epoch": 0.36, + "learning_rate": 3.7377280750774363e-06, + "loss": 1.2363, + "step": 11787 + }, + { + "epoch": 0.36, + "learning_rate": 3.737516141449144e-06, + "loss": 1.107, + "step": 11788 + }, + { + "epoch": 0.36, + "learning_rate": 3.7373041960402935e-06, + "loss": 1.1376, + "step": 11789 + }, + { + "epoch": 0.36, + "learning_rate": 3.7370922388529035e-06, + "loss": 1.0613, + "step": 11790 + }, + { + "epoch": 0.36, + "learning_rate": 3.7368802698889904e-06, + "loss": 1.1469, + "step": 11791 + }, + { + "epoch": 0.36, + "learning_rate": 3.7366682891505734e-06, + "loss": 1.1947, + "step": 11792 + }, + { + "epoch": 0.36, + "learning_rate": 3.7364562966396695e-06, + "loss": 1.2004, + "step": 11793 + }, + { + "epoch": 0.36, + "learning_rate": 3.7362442923582975e-06, + "loss": 1.2073, + "step": 11794 + }, + { + "epoch": 0.36, + "learning_rate": 3.736032276308475e-06, + "loss": 1.1133, + "step": 11795 + }, + { + "epoch": 0.36, + "learning_rate": 3.735820248492221e-06, + "loss": 1.0814, + "step": 11796 + }, + { + "epoch": 0.36, + "learning_rate": 3.735608208911553e-06, + "loss": 1.1755, + "step": 11797 + }, + { + "epoch": 0.36, + "learning_rate": 3.7353961575684897e-06, + "loss": 1.1383, + "step": 11798 + }, + { + "epoch": 0.36, + "learning_rate": 3.7351840944650507e-06, + "loss": 1.1097, + "step": 11799 + }, + { + "epoch": 0.36, + "learning_rate": 3.7349720196032535e-06, + "loss": 1.1594, + "step": 11800 + }, + { + "epoch": 0.36, + "learning_rate": 3.7347599329851177e-06, + "loss": 1.2192, + "step": 11801 + }, + { + "epoch": 0.36, + "learning_rate": 3.734547834612662e-06, + "loss": 1.1062, + "step": 11802 + }, + { + "epoch": 0.36, + "learning_rate": 3.7343357244879053e-06, + "loss": 1.0569, + "step": 11803 + }, + { + "epoch": 0.36, + "learning_rate": 3.7341236026128667e-06, + "loss": 1.1141, + "step": 11804 + }, + { + "epoch": 0.36, + "learning_rate": 3.733911468989566e-06, + "loss": 1.1483, + "step": 11805 + }, + { + "epoch": 0.36, + "learning_rate": 3.7336993236200223e-06, + "loss": 1.1891, + "step": 11806 + }, + { + "epoch": 0.36, + "learning_rate": 3.7334871665062557e-06, + "loss": 1.1553, + "step": 11807 + }, + { + "epoch": 0.36, + "learning_rate": 3.7332749976502847e-06, + "loss": 1.0936, + "step": 11808 + }, + { + "epoch": 0.36, + "learning_rate": 3.7330628170541305e-06, + "loss": 1.1539, + "step": 11809 + }, + { + "epoch": 0.36, + "learning_rate": 3.7328506247198115e-06, + "loss": 1.1149, + "step": 11810 + }, + { + "epoch": 0.36, + "learning_rate": 3.7326384206493487e-06, + "loss": 1.1707, + "step": 11811 + }, + { + "epoch": 0.36, + "learning_rate": 3.7324262048447614e-06, + "loss": 1.1327, + "step": 11812 + }, + { + "epoch": 0.36, + "learning_rate": 3.7322139773080708e-06, + "loss": 1.0891, + "step": 11813 + }, + { + "epoch": 0.36, + "learning_rate": 3.732001738041296e-06, + "loss": 1.1768, + "step": 11814 + }, + { + "epoch": 0.36, + "learning_rate": 3.7317894870464577e-06, + "loss": 1.098, + "step": 11815 + }, + { + "epoch": 0.36, + "learning_rate": 3.731577224325578e-06, + "loss": 1.1487, + "step": 11816 + }, + { + "epoch": 0.36, + "learning_rate": 3.7313649498806747e-06, + "loss": 1.1139, + "step": 11817 + }, + { + "epoch": 0.36, + "learning_rate": 3.731152663713771e-06, + "loss": 1.2698, + "step": 11818 + }, + { + "epoch": 0.36, + "learning_rate": 3.7309403658268866e-06, + "loss": 1.1643, + "step": 11819 + }, + { + "epoch": 0.36, + "learning_rate": 3.730728056222043e-06, + "loss": 1.0996, + "step": 11820 + }, + { + "epoch": 0.36, + "learning_rate": 3.730515734901261e-06, + "loss": 1.1241, + "step": 11821 + }, + { + "epoch": 0.36, + "learning_rate": 3.730303401866562e-06, + "loss": 1.008, + "step": 11822 + }, + { + "epoch": 0.36, + "learning_rate": 3.7300910571199667e-06, + "loss": 1.1548, + "step": 11823 + }, + { + "epoch": 0.36, + "learning_rate": 3.7298787006634977e-06, + "loss": 1.1334, + "step": 11824 + }, + { + "epoch": 0.36, + "learning_rate": 3.7296663324991755e-06, + "loss": 1.3195, + "step": 11825 + }, + { + "epoch": 0.36, + "learning_rate": 3.7294539526290218e-06, + "loss": 1.1526, + "step": 11826 + }, + { + "epoch": 0.36, + "learning_rate": 3.7292415610550585e-06, + "loss": 1.1743, + "step": 11827 + }, + { + "epoch": 0.36, + "learning_rate": 3.729029157779308e-06, + "loss": 1.0452, + "step": 11828 + }, + { + "epoch": 0.36, + "learning_rate": 3.7288167428037912e-06, + "loss": 1.1989, + "step": 11829 + }, + { + "epoch": 0.36, + "learning_rate": 3.7286043161305313e-06, + "loss": 1.1887, + "step": 11830 + }, + { + "epoch": 0.36, + "learning_rate": 3.72839187776155e-06, + "loss": 1.188, + "step": 11831 + }, + { + "epoch": 0.36, + "learning_rate": 3.7281794276988697e-06, + "loss": 1.1467, + "step": 11832 + }, + { + "epoch": 0.36, + "learning_rate": 3.727966965944513e-06, + "loss": 1.1127, + "step": 11833 + }, + { + "epoch": 0.36, + "learning_rate": 3.727754492500501e-06, + "loss": 1.1484, + "step": 11834 + }, + { + "epoch": 0.36, + "learning_rate": 3.727542007368859e-06, + "loss": 1.053, + "step": 11835 + }, + { + "epoch": 0.36, + "learning_rate": 3.7273295105516073e-06, + "loss": 1.1124, + "step": 11836 + }, + { + "epoch": 0.36, + "learning_rate": 3.7271170020507706e-06, + "loss": 1.2007, + "step": 11837 + }, + { + "epoch": 0.36, + "learning_rate": 3.7269044818683705e-06, + "loss": 1.2303, + "step": 11838 + }, + { + "epoch": 0.36, + "learning_rate": 3.7266919500064307e-06, + "loss": 1.0272, + "step": 11839 + }, + { + "epoch": 0.36, + "learning_rate": 3.726479406466974e-06, + "loss": 1.1082, + "step": 11840 + }, + { + "epoch": 0.36, + "learning_rate": 3.7262668512520244e-06, + "loss": 1.0955, + "step": 11841 + }, + { + "epoch": 0.36, + "learning_rate": 3.726054284363605e-06, + "loss": 1.1929, + "step": 11842 + }, + { + "epoch": 0.36, + "learning_rate": 3.7258417058037394e-06, + "loss": 1.1628, + "step": 11843 + }, + { + "epoch": 0.36, + "learning_rate": 3.725629115574451e-06, + "loss": 1.2778, + "step": 11844 + }, + { + "epoch": 0.36, + "learning_rate": 3.7254165136777636e-06, + "loss": 1.1714, + "step": 11845 + }, + { + "epoch": 0.36, + "learning_rate": 3.725203900115701e-06, + "loss": 1.0185, + "step": 11846 + }, + { + "epoch": 0.36, + "learning_rate": 3.7249912748902873e-06, + "loss": 1.1248, + "step": 11847 + }, + { + "epoch": 0.36, + "learning_rate": 3.724778638003548e-06, + "loss": 1.2518, + "step": 11848 + }, + { + "epoch": 0.36, + "learning_rate": 3.724565989457504e-06, + "loss": 1.1107, + "step": 11849 + }, + { + "epoch": 0.36, + "learning_rate": 3.7243533292541826e-06, + "loss": 1.229, + "step": 11850 + }, + { + "epoch": 0.36, + "learning_rate": 3.724140657395607e-06, + "loss": 1.1642, + "step": 11851 + }, + { + "epoch": 0.36, + "learning_rate": 3.7239279738838024e-06, + "loss": 1.0197, + "step": 11852 + }, + { + "epoch": 0.36, + "learning_rate": 3.723715278720792e-06, + "loss": 1.0107, + "step": 11853 + }, + { + "epoch": 0.36, + "learning_rate": 3.723502571908602e-06, + "loss": 1.1661, + "step": 11854 + }, + { + "epoch": 0.36, + "learning_rate": 3.723289853449257e-06, + "loss": 1.174, + "step": 11855 + }, + { + "epoch": 0.36, + "learning_rate": 3.7230771233447815e-06, + "loss": 1.0371, + "step": 11856 + }, + { + "epoch": 0.36, + "learning_rate": 3.722864381597201e-06, + "loss": 1.0942, + "step": 11857 + }, + { + "epoch": 0.36, + "learning_rate": 3.72265162820854e-06, + "loss": 1.0543, + "step": 11858 + }, + { + "epoch": 0.36, + "learning_rate": 3.722438863180825e-06, + "loss": 1.1884, + "step": 11859 + }, + { + "epoch": 0.36, + "learning_rate": 3.72222608651608e-06, + "loss": 1.1366, + "step": 11860 + }, + { + "epoch": 0.36, + "learning_rate": 3.722013298216332e-06, + "loss": 1.1669, + "step": 11861 + }, + { + "epoch": 0.36, + "learning_rate": 3.721800498283606e-06, + "loss": 1.2166, + "step": 11862 + }, + { + "epoch": 0.36, + "learning_rate": 3.7215876867199273e-06, + "loss": 1.1056, + "step": 11863 + }, + { + "epoch": 0.36, + "learning_rate": 3.721374863527322e-06, + "loss": 1.0165, + "step": 11864 + }, + { + "epoch": 0.36, + "learning_rate": 3.721162028707817e-06, + "loss": 1.0969, + "step": 11865 + }, + { + "epoch": 0.36, + "learning_rate": 3.720949182263437e-06, + "loss": 1.1469, + "step": 11866 + }, + { + "epoch": 0.36, + "learning_rate": 3.720736324196209e-06, + "loss": 1.1122, + "step": 11867 + }, + { + "epoch": 0.36, + "learning_rate": 3.720523454508159e-06, + "loss": 1.3024, + "step": 11868 + }, + { + "epoch": 0.36, + "learning_rate": 3.7203105732013134e-06, + "loss": 1.2075, + "step": 11869 + }, + { + "epoch": 0.36, + "learning_rate": 3.7200976802777e-06, + "loss": 1.1151, + "step": 11870 + }, + { + "epoch": 0.36, + "learning_rate": 3.719884775739343e-06, + "loss": 1.0901, + "step": 11871 + }, + { + "epoch": 0.36, + "learning_rate": 3.719671859588271e-06, + "loss": 1.1489, + "step": 11872 + }, + { + "epoch": 0.36, + "learning_rate": 3.71945893182651e-06, + "loss": 1.1511, + "step": 11873 + }, + { + "epoch": 0.36, + "learning_rate": 3.7192459924560877e-06, + "loss": 1.2379, + "step": 11874 + }, + { + "epoch": 0.36, + "learning_rate": 3.71903304147903e-06, + "loss": 1.2065, + "step": 11875 + }, + { + "epoch": 0.36, + "learning_rate": 3.7188200788973654e-06, + "loss": 1.0596, + "step": 11876 + }, + { + "epoch": 0.36, + "learning_rate": 3.7186071047131206e-06, + "loss": 1.1007, + "step": 11877 + }, + { + "epoch": 0.36, + "learning_rate": 3.7183941189283234e-06, + "loss": 1.1036, + "step": 11878 + }, + { + "epoch": 0.36, + "learning_rate": 3.7181811215450003e-06, + "loss": 1.1581, + "step": 11879 + }, + { + "epoch": 0.36, + "learning_rate": 3.71796811256518e-06, + "loss": 1.1671, + "step": 11880 + }, + { + "epoch": 0.36, + "learning_rate": 3.71775509199089e-06, + "loss": 1.1053, + "step": 11881 + }, + { + "epoch": 0.36, + "learning_rate": 3.7175420598241573e-06, + "loss": 1.0908, + "step": 11882 + }, + { + "epoch": 0.36, + "learning_rate": 3.7173290160670115e-06, + "loss": 1.1208, + "step": 11883 + }, + { + "epoch": 0.36, + "learning_rate": 3.7171159607214796e-06, + "loss": 1.0919, + "step": 11884 + }, + { + "epoch": 0.36, + "learning_rate": 3.7169028937895903e-06, + "loss": 1.0853, + "step": 11885 + }, + { + "epoch": 0.36, + "learning_rate": 3.7166898152733705e-06, + "loss": 1.2646, + "step": 11886 + }, + { + "epoch": 0.36, + "learning_rate": 3.7164767251748497e-06, + "loss": 1.0585, + "step": 11887 + }, + { + "epoch": 0.36, + "learning_rate": 3.7162636234960566e-06, + "loss": 1.1478, + "step": 11888 + }, + { + "epoch": 0.36, + "learning_rate": 3.7160505102390197e-06, + "loss": 1.2374, + "step": 11889 + }, + { + "epoch": 0.36, + "learning_rate": 3.715837385405768e-06, + "loss": 1.1207, + "step": 11890 + }, + { + "epoch": 0.36, + "learning_rate": 3.7156242489983295e-06, + "loss": 1.0692, + "step": 11891 + }, + { + "epoch": 0.36, + "learning_rate": 3.715411101018734e-06, + "loss": 1.1829, + "step": 11892 + }, + { + "epoch": 0.36, + "learning_rate": 3.7151979414690094e-06, + "loss": 1.2192, + "step": 11893 + }, + { + "epoch": 0.36, + "learning_rate": 3.7149847703511867e-06, + "loss": 1.1317, + "step": 11894 + }, + { + "epoch": 0.36, + "learning_rate": 3.714771587667293e-06, + "loss": 1.1854, + "step": 11895 + }, + { + "epoch": 0.36, + "learning_rate": 3.71455839341936e-06, + "loss": 1.0573, + "step": 11896 + }, + { + "epoch": 0.36, + "learning_rate": 3.714345187609415e-06, + "loss": 1.0896, + "step": 11897 + }, + { + "epoch": 0.36, + "learning_rate": 3.7141319702394895e-06, + "loss": 1.121, + "step": 11898 + }, + { + "epoch": 0.36, + "learning_rate": 3.713918741311612e-06, + "loss": 1.2087, + "step": 11899 + }, + { + "epoch": 0.36, + "learning_rate": 3.7137055008278122e-06, + "loss": 1.1501, + "step": 11900 + }, + { + "epoch": 0.36, + "learning_rate": 3.7134922487901207e-06, + "loss": 1.1335, + "step": 11901 + }, + { + "epoch": 0.36, + "learning_rate": 3.7132789852005685e-06, + "loss": 1.161, + "step": 11902 + }, + { + "epoch": 0.36, + "learning_rate": 3.7130657100611837e-06, + "loss": 1.071, + "step": 11903 + }, + { + "epoch": 0.36, + "learning_rate": 3.712852423373998e-06, + "loss": 1.2232, + "step": 11904 + }, + { + "epoch": 0.36, + "learning_rate": 3.7126391251410413e-06, + "loss": 1.1774, + "step": 11905 + }, + { + "epoch": 0.36, + "learning_rate": 3.7124258153643444e-06, + "loss": 1.2057, + "step": 11906 + }, + { + "epoch": 0.36, + "learning_rate": 3.7122124940459376e-06, + "loss": 1.1401, + "step": 11907 + }, + { + "epoch": 0.36, + "learning_rate": 3.7119991611878516e-06, + "loss": 1.1312, + "step": 11908 + }, + { + "epoch": 0.36, + "learning_rate": 3.7117858167921172e-06, + "loss": 1.0419, + "step": 11909 + }, + { + "epoch": 0.36, + "learning_rate": 3.7115724608607653e-06, + "loss": 1.1383, + "step": 11910 + }, + { + "epoch": 0.36, + "learning_rate": 3.7113590933958273e-06, + "loss": 1.1129, + "step": 11911 + }, + { + "epoch": 0.36, + "learning_rate": 3.7111457143993336e-06, + "loss": 1.2255, + "step": 11912 + }, + { + "epoch": 0.36, + "learning_rate": 3.7109323238733168e-06, + "loss": 1.2382, + "step": 11913 + }, + { + "epoch": 0.36, + "learning_rate": 3.710718921819807e-06, + "loss": 1.1889, + "step": 11914 + }, + { + "epoch": 0.36, + "learning_rate": 3.710505508240836e-06, + "loss": 1.2347, + "step": 11915 + }, + { + "epoch": 0.36, + "learning_rate": 3.7102920831384357e-06, + "loss": 1.1216, + "step": 11916 + }, + { + "epoch": 0.36, + "learning_rate": 3.7100786465146383e-06, + "loss": 1.1727, + "step": 11917 + }, + { + "epoch": 0.36, + "learning_rate": 3.709865198371474e-06, + "loss": 1.1201, + "step": 11918 + }, + { + "epoch": 0.36, + "learning_rate": 3.7096517387109765e-06, + "loss": 1.1491, + "step": 11919 + }, + { + "epoch": 0.36, + "learning_rate": 3.709438267535177e-06, + "loss": 1.1499, + "step": 11920 + }, + { + "epoch": 0.36, + "learning_rate": 3.7092247848461073e-06, + "loss": 1.1588, + "step": 11921 + }, + { + "epoch": 0.36, + "learning_rate": 3.7090112906458004e-06, + "loss": 1.1657, + "step": 11922 + }, + { + "epoch": 0.36, + "learning_rate": 3.7087977849362877e-06, + "loss": 1.0206, + "step": 11923 + }, + { + "epoch": 0.36, + "learning_rate": 3.7085842677196025e-06, + "loss": 1.2214, + "step": 11924 + }, + { + "epoch": 0.36, + "learning_rate": 3.7083707389977776e-06, + "loss": 1.1285, + "step": 11925 + }, + { + "epoch": 0.36, + "learning_rate": 3.708157198772845e-06, + "loss": 1.126, + "step": 11926 + }, + { + "epoch": 0.36, + "learning_rate": 3.7079436470468377e-06, + "loss": 1.0719, + "step": 11927 + }, + { + "epoch": 0.36, + "learning_rate": 3.7077300838217876e-06, + "loss": 1.1903, + "step": 11928 + }, + { + "epoch": 0.36, + "learning_rate": 3.7075165090997302e-06, + "loss": 1.1042, + "step": 11929 + }, + { + "epoch": 0.36, + "learning_rate": 3.7073029228826967e-06, + "loss": 1.0676, + "step": 11930 + }, + { + "epoch": 0.36, + "learning_rate": 3.707089325172721e-06, + "loss": 1.039, + "step": 11931 + }, + { + "epoch": 0.36, + "learning_rate": 3.706875715971836e-06, + "loss": 1.1235, + "step": 11932 + }, + { + "epoch": 0.36, + "learning_rate": 3.7066620952820754e-06, + "loss": 1.1314, + "step": 11933 + }, + { + "epoch": 0.36, + "learning_rate": 3.7064484631054733e-06, + "loss": 1.045, + "step": 11934 + }, + { + "epoch": 0.36, + "learning_rate": 3.706234819444062e-06, + "loss": 1.134, + "step": 11935 + }, + { + "epoch": 0.36, + "learning_rate": 3.706021164299877e-06, + "loss": 1.1348, + "step": 11936 + }, + { + "epoch": 0.36, + "learning_rate": 3.7058074976749516e-06, + "loss": 1.2366, + "step": 11937 + }, + { + "epoch": 0.36, + "learning_rate": 3.7055938195713185e-06, + "loss": 1.21, + "step": 11938 + }, + { + "epoch": 0.36, + "learning_rate": 3.705380129991014e-06, + "loss": 1.2109, + "step": 11939 + }, + { + "epoch": 0.36, + "learning_rate": 3.70516642893607e-06, + "loss": 1.1665, + "step": 11940 + }, + { + "epoch": 0.36, + "learning_rate": 3.7049527164085232e-06, + "loss": 1.1675, + "step": 11941 + }, + { + "epoch": 0.36, + "learning_rate": 3.7047389924104055e-06, + "loss": 1.229, + "step": 11942 + }, + { + "epoch": 0.36, + "learning_rate": 3.704525256943754e-06, + "loss": 1.1129, + "step": 11943 + }, + { + "epoch": 0.36, + "learning_rate": 3.7043115100106018e-06, + "loss": 1.1077, + "step": 11944 + }, + { + "epoch": 0.36, + "learning_rate": 3.704097751612984e-06, + "loss": 1.1953, + "step": 11945 + }, + { + "epoch": 0.36, + "learning_rate": 3.7038839817529352e-06, + "loss": 1.0797, + "step": 11946 + }, + { + "epoch": 0.36, + "learning_rate": 3.703670200432491e-06, + "loss": 1.1749, + "step": 11947 + }, + { + "epoch": 0.36, + "learning_rate": 3.703456407653687e-06, + "loss": 1.2271, + "step": 11948 + }, + { + "epoch": 0.36, + "learning_rate": 3.7032426034185563e-06, + "loss": 1.0971, + "step": 11949 + }, + { + "epoch": 0.36, + "learning_rate": 3.7030287877291364e-06, + "loss": 1.2394, + "step": 11950 + }, + { + "epoch": 0.36, + "learning_rate": 3.7028149605874614e-06, + "loss": 1.0966, + "step": 11951 + }, + { + "epoch": 0.36, + "learning_rate": 3.7026011219955674e-06, + "loss": 1.1478, + "step": 11952 + }, + { + "epoch": 0.36, + "learning_rate": 3.70238727195549e-06, + "loss": 1.1492, + "step": 11953 + }, + { + "epoch": 0.36, + "learning_rate": 3.7021734104692645e-06, + "loss": 1.1104, + "step": 11954 + }, + { + "epoch": 0.36, + "learning_rate": 3.701959537538927e-06, + "loss": 1.2002, + "step": 11955 + }, + { + "epoch": 0.36, + "learning_rate": 3.701745653166514e-06, + "loss": 1.2416, + "step": 11956 + }, + { + "epoch": 0.36, + "learning_rate": 3.701531757354061e-06, + "loss": 1.262, + "step": 11957 + }, + { + "epoch": 0.36, + "learning_rate": 3.701317850103605e-06, + "loss": 1.166, + "step": 11958 + }, + { + "epoch": 0.36, + "learning_rate": 3.701103931417181e-06, + "loss": 1.0295, + "step": 11959 + }, + { + "epoch": 0.36, + "learning_rate": 3.700890001296826e-06, + "loss": 1.1083, + "step": 11960 + }, + { + "epoch": 0.36, + "learning_rate": 3.7006760597445768e-06, + "loss": 1.2328, + "step": 11961 + }, + { + "epoch": 0.36, + "learning_rate": 3.7004621067624698e-06, + "loss": 1.2324, + "step": 11962 + }, + { + "epoch": 0.36, + "learning_rate": 3.7002481423525416e-06, + "loss": 1.0969, + "step": 11963 + }, + { + "epoch": 0.36, + "learning_rate": 3.700034166516829e-06, + "loss": 1.1952, + "step": 11964 + }, + { + "epoch": 0.36, + "learning_rate": 3.6998201792573694e-06, + "loss": 1.122, + "step": 11965 + }, + { + "epoch": 0.36, + "learning_rate": 3.699606180576199e-06, + "loss": 1.1899, + "step": 11966 + }, + { + "epoch": 0.36, + "learning_rate": 3.6993921704753564e-06, + "loss": 1.1599, + "step": 11967 + }, + { + "epoch": 0.36, + "learning_rate": 3.6991781489568775e-06, + "loss": 1.1671, + "step": 11968 + }, + { + "epoch": 0.36, + "learning_rate": 3.6989641160227995e-06, + "loss": 1.0763, + "step": 11969 + }, + { + "epoch": 0.36, + "learning_rate": 3.6987500716751614e-06, + "loss": 1.1642, + "step": 11970 + }, + { + "epoch": 0.36, + "learning_rate": 3.6985360159159998e-06, + "loss": 1.1624, + "step": 11971 + }, + { + "epoch": 0.36, + "learning_rate": 3.6983219487473522e-06, + "loss": 1.106, + "step": 11972 + }, + { + "epoch": 0.36, + "learning_rate": 3.698107870171257e-06, + "loss": 1.1735, + "step": 11973 + }, + { + "epoch": 0.36, + "learning_rate": 3.697893780189752e-06, + "loss": 1.1478, + "step": 11974 + }, + { + "epoch": 0.36, + "learning_rate": 3.6976796788048752e-06, + "loss": 1.1863, + "step": 11975 + }, + { + "epoch": 0.36, + "learning_rate": 3.6974655660186648e-06, + "loss": 1.1024, + "step": 11976 + }, + { + "epoch": 0.36, + "learning_rate": 3.6972514418331586e-06, + "loss": 1.1299, + "step": 11977 + }, + { + "epoch": 0.36, + "learning_rate": 3.6970373062503956e-06, + "loss": 1.0894, + "step": 11978 + }, + { + "epoch": 0.36, + "learning_rate": 3.6968231592724136e-06, + "loss": 1.1033, + "step": 11979 + }, + { + "epoch": 0.36, + "learning_rate": 3.6966090009012523e-06, + "loss": 1.0971, + "step": 11980 + }, + { + "epoch": 0.36, + "learning_rate": 3.6963948311389484e-06, + "loss": 1.2021, + "step": 11981 + }, + { + "epoch": 0.36, + "learning_rate": 3.6961806499875425e-06, + "loss": 1.1185, + "step": 11982 + }, + { + "epoch": 0.36, + "learning_rate": 3.6959664574490728e-06, + "loss": 1.0904, + "step": 11983 + }, + { + "epoch": 0.36, + "learning_rate": 3.6957522535255786e-06, + "loss": 1.095, + "step": 11984 + }, + { + "epoch": 0.36, + "learning_rate": 3.6955380382190988e-06, + "loss": 1.1878, + "step": 11985 + }, + { + "epoch": 0.36, + "learning_rate": 3.6953238115316725e-06, + "loss": 1.3005, + "step": 11986 + }, + { + "epoch": 0.36, + "learning_rate": 3.69510957346534e-06, + "loss": 1.1558, + "step": 11987 + }, + { + "epoch": 0.36, + "learning_rate": 3.6948953240221384e-06, + "loss": 1.0933, + "step": 11988 + }, + { + "epoch": 0.36, + "learning_rate": 3.6946810632041108e-06, + "loss": 1.1364, + "step": 11989 + }, + { + "epoch": 0.36, + "learning_rate": 3.694466791013293e-06, + "loss": 1.1009, + "step": 11990 + }, + { + "epoch": 0.36, + "learning_rate": 3.694252507451728e-06, + "loss": 1.1923, + "step": 11991 + }, + { + "epoch": 0.36, + "learning_rate": 3.6940382125214536e-06, + "loss": 1.0959, + "step": 11992 + }, + { + "epoch": 0.36, + "learning_rate": 3.6938239062245105e-06, + "loss": 1.2197, + "step": 11993 + }, + { + "epoch": 0.36, + "learning_rate": 3.6936095885629387e-06, + "loss": 1.0339, + "step": 11994 + }, + { + "epoch": 0.36, + "learning_rate": 3.693395259538779e-06, + "loss": 1.1312, + "step": 11995 + }, + { + "epoch": 0.36, + "learning_rate": 3.6931809191540706e-06, + "loss": 1.0832, + "step": 11996 + }, + { + "epoch": 0.36, + "learning_rate": 3.692966567410855e-06, + "loss": 1.1598, + "step": 11997 + }, + { + "epoch": 0.36, + "learning_rate": 3.692752204311172e-06, + "loss": 1.0975, + "step": 11998 + }, + { + "epoch": 0.36, + "learning_rate": 3.6925378298570624e-06, + "loss": 1.116, + "step": 11999 + }, + { + "epoch": 0.36, + "learning_rate": 3.6923234440505667e-06, + "loss": 1.2745, + "step": 12000 + }, + { + "epoch": 0.36, + "learning_rate": 3.692109046893726e-06, + "loss": 1.1385, + "step": 12001 + }, + { + "epoch": 0.36, + "learning_rate": 3.6918946383885823e-06, + "loss": 1.1006, + "step": 12002 + }, + { + "epoch": 0.36, + "learning_rate": 3.691680218537175e-06, + "loss": 1.0156, + "step": 12003 + }, + { + "epoch": 0.36, + "learning_rate": 3.691465787341546e-06, + "loss": 1.0594, + "step": 12004 + }, + { + "epoch": 0.36, + "learning_rate": 3.6912513448037367e-06, + "loss": 1.2352, + "step": 12005 + }, + { + "epoch": 0.36, + "learning_rate": 3.691036890925788e-06, + "loss": 1.1906, + "step": 12006 + }, + { + "epoch": 0.36, + "learning_rate": 3.690822425709742e-06, + "loss": 1.1141, + "step": 12007 + }, + { + "epoch": 0.36, + "learning_rate": 3.6906079491576403e-06, + "loss": 1.2064, + "step": 12008 + }, + { + "epoch": 0.36, + "learning_rate": 3.6903934612715238e-06, + "loss": 1.0897, + "step": 12009 + }, + { + "epoch": 0.36, + "learning_rate": 3.690178962053435e-06, + "loss": 1.1018, + "step": 12010 + }, + { + "epoch": 0.36, + "learning_rate": 3.689964451505416e-06, + "loss": 1.0655, + "step": 12011 + }, + { + "epoch": 0.36, + "learning_rate": 3.689749929629508e-06, + "loss": 1.0637, + "step": 12012 + }, + { + "epoch": 0.36, + "learning_rate": 3.6895353964277534e-06, + "loss": 1.2949, + "step": 12013 + }, + { + "epoch": 0.36, + "learning_rate": 3.6893208519021955e-06, + "loss": 1.1025, + "step": 12014 + }, + { + "epoch": 0.36, + "learning_rate": 3.689106296054876e-06, + "loss": 1.1224, + "step": 12015 + }, + { + "epoch": 0.36, + "learning_rate": 3.6888917288878367e-06, + "loss": 1.1705, + "step": 12016 + }, + { + "epoch": 0.36, + "learning_rate": 3.688677150403121e-06, + "loss": 1.1038, + "step": 12017 + }, + { + "epoch": 0.36, + "learning_rate": 3.688462560602771e-06, + "loss": 1.1754, + "step": 12018 + }, + { + "epoch": 0.36, + "learning_rate": 3.6882479594888305e-06, + "loss": 1.0867, + "step": 12019 + }, + { + "epoch": 0.36, + "learning_rate": 3.688033347063341e-06, + "loss": 1.1866, + "step": 12020 + }, + { + "epoch": 0.36, + "learning_rate": 3.6878187233283467e-06, + "loss": 1.1064, + "step": 12021 + }, + { + "epoch": 0.36, + "learning_rate": 3.6876040882858898e-06, + "loss": 1.0948, + "step": 12022 + }, + { + "epoch": 0.36, + "learning_rate": 3.687389441938014e-06, + "loss": 1.2351, + "step": 12023 + }, + { + "epoch": 0.36, + "learning_rate": 3.6871747842867626e-06, + "loss": 1.1506, + "step": 12024 + }, + { + "epoch": 0.36, + "learning_rate": 3.6869601153341793e-06, + "loss": 1.082, + "step": 12025 + }, + { + "epoch": 0.36, + "learning_rate": 3.6867454350823074e-06, + "loss": 1.2003, + "step": 12026 + }, + { + "epoch": 0.36, + "learning_rate": 3.68653074353319e-06, + "loss": 1.0965, + "step": 12027 + }, + { + "epoch": 0.36, + "learning_rate": 3.686316040688872e-06, + "loss": 1.0956, + "step": 12028 + }, + { + "epoch": 0.36, + "learning_rate": 3.686101326551396e-06, + "loss": 1.2292, + "step": 12029 + }, + { + "epoch": 0.36, + "learning_rate": 3.6858866011228072e-06, + "loss": 1.2584, + "step": 12030 + }, + { + "epoch": 0.36, + "learning_rate": 3.685671864405149e-06, + "loss": 1.1887, + "step": 12031 + }, + { + "epoch": 0.36, + "learning_rate": 3.685457116400466e-06, + "loss": 1.1329, + "step": 12032 + }, + { + "epoch": 0.36, + "learning_rate": 3.6852423571108013e-06, + "loss": 1.1346, + "step": 12033 + }, + { + "epoch": 0.36, + "learning_rate": 3.685027586538201e-06, + "loss": 1.0687, + "step": 12034 + }, + { + "epoch": 0.36, + "learning_rate": 3.684812804684708e-06, + "loss": 1.0399, + "step": 12035 + }, + { + "epoch": 0.36, + "learning_rate": 3.6845980115523683e-06, + "loss": 1.1442, + "step": 12036 + }, + { + "epoch": 0.36, + "learning_rate": 3.684383207143226e-06, + "loss": 1.1736, + "step": 12037 + }, + { + "epoch": 0.36, + "learning_rate": 3.6841683914593257e-06, + "loss": 1.095, + "step": 12038 + }, + { + "epoch": 0.36, + "learning_rate": 3.6839535645027123e-06, + "loss": 1.1595, + "step": 12039 + }, + { + "epoch": 0.36, + "learning_rate": 3.683738726275432e-06, + "loss": 1.0016, + "step": 12040 + }, + { + "epoch": 0.36, + "learning_rate": 3.683523876779529e-06, + "loss": 1.1589, + "step": 12041 + }, + { + "epoch": 0.36, + "learning_rate": 3.6833090160170483e-06, + "loss": 1.1899, + "step": 12042 + }, + { + "epoch": 0.36, + "learning_rate": 3.6830941439900362e-06, + "loss": 1.2412, + "step": 12043 + }, + { + "epoch": 0.36, + "learning_rate": 3.682879260700537e-06, + "loss": 1.135, + "step": 12044 + }, + { + "epoch": 0.36, + "learning_rate": 3.682664366150598e-06, + "loss": 1.0591, + "step": 12045 + }, + { + "epoch": 0.36, + "learning_rate": 3.6824494603422627e-06, + "loss": 1.1678, + "step": 12046 + }, + { + "epoch": 0.36, + "learning_rate": 3.6822345432775788e-06, + "loss": 1.0627, + "step": 12047 + }, + { + "epoch": 0.36, + "learning_rate": 3.682019614958591e-06, + "loss": 1.2941, + "step": 12048 + }, + { + "epoch": 0.36, + "learning_rate": 3.681804675387346e-06, + "loss": 1.1984, + "step": 12049 + }, + { + "epoch": 0.36, + "learning_rate": 3.681589724565889e-06, + "loss": 1.0892, + "step": 12050 + }, + { + "epoch": 0.36, + "learning_rate": 3.6813747624962675e-06, + "loss": 1.0847, + "step": 12051 + }, + { + "epoch": 0.36, + "learning_rate": 3.6811597891805266e-06, + "loss": 1.0993, + "step": 12052 + }, + { + "epoch": 0.36, + "learning_rate": 3.6809448046207143e-06, + "loss": 1.1091, + "step": 12053 + }, + { + "epoch": 0.36, + "learning_rate": 3.6807298088188758e-06, + "loss": 1.108, + "step": 12054 + }, + { + "epoch": 0.36, + "learning_rate": 3.6805148017770583e-06, + "loss": 1.1607, + "step": 12055 + }, + { + "epoch": 0.36, + "learning_rate": 3.680299783497308e-06, + "loss": 1.1268, + "step": 12056 + }, + { + "epoch": 0.36, + "learning_rate": 3.6800847539816724e-06, + "loss": 1.1381, + "step": 12057 + }, + { + "epoch": 0.36, + "learning_rate": 3.679869713232199e-06, + "loss": 1.1655, + "step": 12058 + }, + { + "epoch": 0.36, + "learning_rate": 3.6796546612509334e-06, + "loss": 1.1046, + "step": 12059 + }, + { + "epoch": 0.36, + "learning_rate": 3.6794395980399238e-06, + "loss": 1.1613, + "step": 12060 + }, + { + "epoch": 0.36, + "learning_rate": 3.6792245236012168e-06, + "loss": 1.1516, + "step": 12061 + }, + { + "epoch": 0.36, + "learning_rate": 3.6790094379368613e-06, + "loss": 1.197, + "step": 12062 + }, + { + "epoch": 0.36, + "learning_rate": 3.678794341048903e-06, + "loss": 1.1991, + "step": 12063 + }, + { + "epoch": 0.36, + "learning_rate": 3.6785792329393903e-06, + "loss": 1.1407, + "step": 12064 + }, + { + "epoch": 0.36, + "learning_rate": 3.678364113610371e-06, + "loss": 1.0605, + "step": 12065 + }, + { + "epoch": 0.36, + "learning_rate": 3.678148983063893e-06, + "loss": 1.1219, + "step": 12066 + }, + { + "epoch": 0.36, + "learning_rate": 3.6779338413020043e-06, + "loss": 1.1687, + "step": 12067 + }, + { + "epoch": 0.36, + "learning_rate": 3.6777186883267523e-06, + "loss": 1.1726, + "step": 12068 + }, + { + "epoch": 0.36, + "learning_rate": 3.6775035241401857e-06, + "loss": 1.0493, + "step": 12069 + }, + { + "epoch": 0.36, + "learning_rate": 3.6772883487443527e-06, + "loss": 1.2999, + "step": 12070 + }, + { + "epoch": 0.36, + "learning_rate": 3.677073162141302e-06, + "loss": 1.1611, + "step": 12071 + }, + { + "epoch": 0.36, + "learning_rate": 3.6768579643330816e-06, + "loss": 1.0867, + "step": 12072 + }, + { + "epoch": 0.36, + "learning_rate": 3.67664275532174e-06, + "loss": 1.1658, + "step": 12073 + }, + { + "epoch": 0.36, + "learning_rate": 3.676427535109326e-06, + "loss": 1.2243, + "step": 12074 + }, + { + "epoch": 0.36, + "learning_rate": 3.6762123036978886e-06, + "loss": 1.0485, + "step": 12075 + }, + { + "epoch": 0.36, + "learning_rate": 3.675997061089476e-06, + "loss": 1.1244, + "step": 12076 + }, + { + "epoch": 0.36, + "learning_rate": 3.6757818072861385e-06, + "loss": 1.0787, + "step": 12077 + }, + { + "epoch": 0.36, + "learning_rate": 3.675566542289924e-06, + "loss": 1.1429, + "step": 12078 + }, + { + "epoch": 0.36, + "learning_rate": 3.6753512661028823e-06, + "loss": 1.1419, + "step": 12079 + }, + { + "epoch": 0.36, + "learning_rate": 3.675135978727062e-06, + "loss": 1.1513, + "step": 12080 + }, + { + "epoch": 0.36, + "learning_rate": 3.674920680164514e-06, + "loss": 1.1326, + "step": 12081 + }, + { + "epoch": 0.36, + "learning_rate": 3.674705370417287e-06, + "loss": 1.1227, + "step": 12082 + }, + { + "epoch": 0.36, + "learning_rate": 3.67449004948743e-06, + "loss": 1.1318, + "step": 12083 + }, + { + "epoch": 0.36, + "learning_rate": 3.6742747173769942e-06, + "loss": 1.0804, + "step": 12084 + }, + { + "epoch": 0.36, + "learning_rate": 3.6740593740880282e-06, + "loss": 1.1572, + "step": 12085 + }, + { + "epoch": 0.36, + "learning_rate": 3.6738440196225828e-06, + "loss": 1.0162, + "step": 12086 + }, + { + "epoch": 0.36, + "learning_rate": 3.6736286539827072e-06, + "loss": 1.2227, + "step": 12087 + }, + { + "epoch": 0.36, + "learning_rate": 3.6734132771704523e-06, + "loss": 1.1293, + "step": 12088 + }, + { + "epoch": 0.36, + "learning_rate": 3.6731978891878678e-06, + "loss": 1.1175, + "step": 12089 + }, + { + "epoch": 0.36, + "learning_rate": 3.672982490037005e-06, + "loss": 1.1279, + "step": 12090 + }, + { + "epoch": 0.36, + "learning_rate": 3.672767079719913e-06, + "loss": 1.1292, + "step": 12091 + }, + { + "epoch": 0.36, + "learning_rate": 3.6725516582386435e-06, + "loss": 1.1522, + "step": 12092 + }, + { + "epoch": 0.36, + "learning_rate": 3.6723362255952473e-06, + "loss": 1.0721, + "step": 12093 + }, + { + "epoch": 0.36, + "learning_rate": 3.672120781791774e-06, + "loss": 1.0703, + "step": 12094 + }, + { + "epoch": 0.36, + "learning_rate": 3.671905326830277e-06, + "loss": 1.0893, + "step": 12095 + }, + { + "epoch": 0.36, + "learning_rate": 3.6716898607128045e-06, + "loss": 1.1516, + "step": 12096 + }, + { + "epoch": 0.36, + "learning_rate": 3.671474383441409e-06, + "loss": 1.1382, + "step": 12097 + }, + { + "epoch": 0.36, + "learning_rate": 3.6712588950181417e-06, + "loss": 1.2064, + "step": 12098 + }, + { + "epoch": 0.36, + "learning_rate": 3.6710433954450536e-06, + "loss": 1.113, + "step": 12099 + }, + { + "epoch": 0.36, + "learning_rate": 3.6708278847241962e-06, + "loss": 1.2273, + "step": 12100 + }, + { + "epoch": 0.36, + "learning_rate": 3.670612362857622e-06, + "loss": 1.1591, + "step": 12101 + }, + { + "epoch": 0.36, + "learning_rate": 3.6703968298473814e-06, + "loss": 1.1731, + "step": 12102 + }, + { + "epoch": 0.36, + "learning_rate": 3.670181285695527e-06, + "loss": 1.1196, + "step": 12103 + }, + { + "epoch": 0.36, + "learning_rate": 3.6699657304041097e-06, + "loss": 1.0895, + "step": 12104 + }, + { + "epoch": 0.36, + "learning_rate": 3.6697501639751824e-06, + "loss": 0.9976, + "step": 12105 + }, + { + "epoch": 0.36, + "learning_rate": 3.6695345864107967e-06, + "loss": 1.2487, + "step": 12106 + }, + { + "epoch": 0.36, + "learning_rate": 3.669318997713005e-06, + "loss": 1.218, + "step": 12107 + }, + { + "epoch": 0.36, + "learning_rate": 3.6691033978838603e-06, + "loss": 1.0377, + "step": 12108 + }, + { + "epoch": 0.36, + "learning_rate": 3.6688877869254137e-06, + "loss": 1.1801, + "step": 12109 + }, + { + "epoch": 0.36, + "learning_rate": 3.6686721648397188e-06, + "loss": 1.19, + "step": 12110 + }, + { + "epoch": 0.36, + "learning_rate": 3.668456531628827e-06, + "loss": 1.1859, + "step": 12111 + }, + { + "epoch": 0.36, + "learning_rate": 3.668240887294793e-06, + "loss": 1.2091, + "step": 12112 + }, + { + "epoch": 0.36, + "learning_rate": 3.668025231839667e-06, + "loss": 1.1073, + "step": 12113 + }, + { + "epoch": 0.36, + "learning_rate": 3.6678095652655043e-06, + "loss": 1.0967, + "step": 12114 + }, + { + "epoch": 0.36, + "learning_rate": 3.6675938875743567e-06, + "loss": 1.0527, + "step": 12115 + }, + { + "epoch": 0.36, + "learning_rate": 3.6673781987682777e-06, + "loss": 1.0594, + "step": 12116 + }, + { + "epoch": 0.37, + "learning_rate": 3.6671624988493203e-06, + "loss": 1.2198, + "step": 12117 + }, + { + "epoch": 0.37, + "learning_rate": 3.6669467878195374e-06, + "loss": 1.2333, + "step": 12118 + }, + { + "epoch": 0.37, + "learning_rate": 3.6667310656809847e-06, + "loss": 0.9609, + "step": 12119 + }, + { + "epoch": 0.37, + "learning_rate": 3.6665153324357126e-06, + "loss": 1.1454, + "step": 12120 + }, + { + "epoch": 0.37, + "learning_rate": 3.666299588085777e-06, + "loss": 1.1387, + "step": 12121 + }, + { + "epoch": 0.37, + "learning_rate": 3.666083832633231e-06, + "loss": 1.0291, + "step": 12122 + }, + { + "epoch": 0.37, + "learning_rate": 3.665868066080129e-06, + "loss": 1.1153, + "step": 12123 + }, + { + "epoch": 0.37, + "learning_rate": 3.6656522884285233e-06, + "loss": 1.1566, + "step": 12124 + }, + { + "epoch": 0.37, + "learning_rate": 3.6654364996804703e-06, + "loss": 1.1962, + "step": 12125 + }, + { + "epoch": 0.37, + "learning_rate": 3.6652206998380225e-06, + "loss": 1.2473, + "step": 12126 + }, + { + "epoch": 0.37, + "learning_rate": 3.6650048889032357e-06, + "loss": 1.1757, + "step": 12127 + }, + { + "epoch": 0.37, + "learning_rate": 3.6647890668781627e-06, + "loss": 1.1252, + "step": 12128 + }, + { + "epoch": 0.37, + "learning_rate": 3.6645732337648587e-06, + "loss": 1.0787, + "step": 12129 + }, + { + "epoch": 0.37, + "learning_rate": 3.6643573895653787e-06, + "loss": 1.0829, + "step": 12130 + }, + { + "epoch": 0.37, + "learning_rate": 3.6641415342817777e-06, + "loss": 1.1339, + "step": 12131 + }, + { + "epoch": 0.37, + "learning_rate": 3.663925667916109e-06, + "loss": 1.1903, + "step": 12132 + }, + { + "epoch": 0.37, + "learning_rate": 3.6637097904704284e-06, + "loss": 1.1218, + "step": 12133 + }, + { + "epoch": 0.37, + "learning_rate": 3.6634939019467914e-06, + "loss": 1.2089, + "step": 12134 + }, + { + "epoch": 0.37, + "learning_rate": 3.6632780023472523e-06, + "loss": 1.1068, + "step": 12135 + }, + { + "epoch": 0.37, + "learning_rate": 3.663062091673868e-06, + "loss": 1.2476, + "step": 12136 + }, + { + "epoch": 0.37, + "learning_rate": 3.662846169928692e-06, + "loss": 1.1475, + "step": 12137 + }, + { + "epoch": 0.37, + "learning_rate": 3.6626302371137813e-06, + "loss": 1.1169, + "step": 12138 + }, + { + "epoch": 0.37, + "learning_rate": 3.6624142932311895e-06, + "loss": 1.1588, + "step": 12139 + }, + { + "epoch": 0.37, + "learning_rate": 3.662198338282974e-06, + "loss": 1.0999, + "step": 12140 + }, + { + "epoch": 0.37, + "learning_rate": 3.66198237227119e-06, + "loss": 1.1643, + "step": 12141 + }, + { + "epoch": 0.37, + "learning_rate": 3.6617663951978944e-06, + "loss": 1.3273, + "step": 12142 + }, + { + "epoch": 0.37, + "learning_rate": 3.661550407065141e-06, + "loss": 1.2047, + "step": 12143 + }, + { + "epoch": 0.37, + "learning_rate": 3.661334407874988e-06, + "loss": 1.1976, + "step": 12144 + }, + { + "epoch": 0.37, + "learning_rate": 3.6611183976294896e-06, + "loss": 1.0639, + "step": 12145 + }, + { + "epoch": 0.37, + "learning_rate": 3.660902376330704e-06, + "loss": 1.194, + "step": 12146 + }, + { + "epoch": 0.37, + "learning_rate": 3.6606863439806868e-06, + "loss": 1.1146, + "step": 12147 + }, + { + "epoch": 0.37, + "learning_rate": 3.660470300581494e-06, + "loss": 1.2438, + "step": 12148 + }, + { + "epoch": 0.37, + "learning_rate": 3.660254246135184e-06, + "loss": 1.1953, + "step": 12149 + }, + { + "epoch": 0.37, + "learning_rate": 3.6600381806438116e-06, + "loss": 1.0836, + "step": 12150 + }, + { + "epoch": 0.37, + "learning_rate": 3.659822104109435e-06, + "loss": 1.1903, + "step": 12151 + }, + { + "epoch": 0.37, + "learning_rate": 3.65960601653411e-06, + "loss": 1.1344, + "step": 12152 + }, + { + "epoch": 0.37, + "learning_rate": 3.659389917919895e-06, + "loss": 1.2208, + "step": 12153 + }, + { + "epoch": 0.37, + "learning_rate": 3.6591738082688456e-06, + "loss": 1.1858, + "step": 12154 + }, + { + "epoch": 0.37, + "learning_rate": 3.6589576875830204e-06, + "loss": 1.1972, + "step": 12155 + }, + { + "epoch": 0.37, + "learning_rate": 3.6587415558644758e-06, + "loss": 1.0131, + "step": 12156 + }, + { + "epoch": 0.37, + "learning_rate": 3.6585254131152693e-06, + "loss": 1.1627, + "step": 12157 + }, + { + "epoch": 0.37, + "learning_rate": 3.658309259337459e-06, + "loss": 1.1787, + "step": 12158 + }, + { + "epoch": 0.37, + "learning_rate": 3.658093094533103e-06, + "loss": 1.2565, + "step": 12159 + }, + { + "epoch": 0.37, + "learning_rate": 3.657876918704258e-06, + "loss": 1.1953, + "step": 12160 + }, + { + "epoch": 0.37, + "learning_rate": 3.657660731852982e-06, + "loss": 1.1235, + "step": 12161 + }, + { + "epoch": 0.37, + "learning_rate": 3.6574445339813342e-06, + "loss": 1.1614, + "step": 12162 + }, + { + "epoch": 0.37, + "learning_rate": 3.6572283250913708e-06, + "loss": 1.0684, + "step": 12163 + }, + { + "epoch": 0.37, + "learning_rate": 3.6570121051851526e-06, + "loss": 1.1456, + "step": 12164 + }, + { + "epoch": 0.37, + "learning_rate": 3.6567958742647354e-06, + "loss": 1.1729, + "step": 12165 + }, + { + "epoch": 0.37, + "learning_rate": 3.656579632332179e-06, + "loss": 1.0927, + "step": 12166 + }, + { + "epoch": 0.37, + "learning_rate": 3.6563633793895416e-06, + "loss": 1.1754, + "step": 12167 + }, + { + "epoch": 0.37, + "learning_rate": 3.6561471154388816e-06, + "loss": 1.0781, + "step": 12168 + }, + { + "epoch": 0.37, + "learning_rate": 3.6559308404822574e-06, + "loss": 1.2152, + "step": 12169 + }, + { + "epoch": 0.37, + "learning_rate": 3.655714554521729e-06, + "loss": 1.1526, + "step": 12170 + }, + { + "epoch": 0.37, + "learning_rate": 3.6554982575593546e-06, + "loss": 1.148, + "step": 12171 + }, + { + "epoch": 0.37, + "learning_rate": 3.6552819495971926e-06, + "loss": 1.1469, + "step": 12172 + }, + { + "epoch": 0.37, + "learning_rate": 3.6550656306373034e-06, + "loss": 1.2238, + "step": 12173 + }, + { + "epoch": 0.37, + "learning_rate": 3.6548493006817453e-06, + "loss": 1.135, + "step": 12174 + }, + { + "epoch": 0.37, + "learning_rate": 3.6546329597325784e-06, + "loss": 1.1057, + "step": 12175 + }, + { + "epoch": 0.37, + "learning_rate": 3.6544166077918618e-06, + "loss": 1.1359, + "step": 12176 + }, + { + "epoch": 0.37, + "learning_rate": 3.6542002448616554e-06, + "loss": 1.1411, + "step": 12177 + }, + { + "epoch": 0.37, + "learning_rate": 3.653983870944018e-06, + "loss": 1.146, + "step": 12178 + }, + { + "epoch": 0.37, + "learning_rate": 3.65376748604101e-06, + "loss": 1.0867, + "step": 12179 + }, + { + "epoch": 0.37, + "learning_rate": 3.653551090154691e-06, + "loss": 1.2731, + "step": 12180 + }, + { + "epoch": 0.37, + "learning_rate": 3.653334683287122e-06, + "loss": 1.1625, + "step": 12181 + }, + { + "epoch": 0.37, + "learning_rate": 3.6531182654403617e-06, + "loss": 1.1696, + "step": 12182 + }, + { + "epoch": 0.37, + "learning_rate": 3.6529018366164715e-06, + "loss": 1.0809, + "step": 12183 + }, + { + "epoch": 0.37, + "learning_rate": 3.65268539681751e-06, + "loss": 1.0612, + "step": 12184 + }, + { + "epoch": 0.37, + "learning_rate": 3.65246894604554e-06, + "loss": 1.1229, + "step": 12185 + }, + { + "epoch": 0.37, + "learning_rate": 3.6522524843026196e-06, + "loss": 1.2239, + "step": 12186 + }, + { + "epoch": 0.37, + "learning_rate": 3.6520360115908104e-06, + "loss": 1.0961, + "step": 12187 + }, + { + "epoch": 0.37, + "learning_rate": 3.6518195279121737e-06, + "loss": 1.0964, + "step": 12188 + }, + { + "epoch": 0.37, + "learning_rate": 3.6516030332687693e-06, + "loss": 1.1643, + "step": 12189 + }, + { + "epoch": 0.37, + "learning_rate": 3.651386527662659e-06, + "loss": 1.1407, + "step": 12190 + }, + { + "epoch": 0.37, + "learning_rate": 3.6511700110959036e-06, + "loss": 1.1068, + "step": 12191 + }, + { + "epoch": 0.37, + "learning_rate": 3.6509534835705646e-06, + "loss": 1.1124, + "step": 12192 + }, + { + "epoch": 0.37, + "learning_rate": 3.650736945088702e-06, + "loss": 1.2238, + "step": 12193 + }, + { + "epoch": 0.37, + "learning_rate": 3.6505203956523784e-06, + "loss": 1.1207, + "step": 12194 + }, + { + "epoch": 0.37, + "learning_rate": 3.6503038352636543e-06, + "loss": 1.22, + "step": 12195 + }, + { + "epoch": 0.37, + "learning_rate": 3.650087263924592e-06, + "loss": 1.2013, + "step": 12196 + }, + { + "epoch": 0.37, + "learning_rate": 3.649870681637253e-06, + "loss": 1.1122, + "step": 12197 + }, + { + "epoch": 0.37, + "learning_rate": 3.649654088403699e-06, + "loss": 1.1156, + "step": 12198 + }, + { + "epoch": 0.37, + "learning_rate": 3.649437484225991e-06, + "loss": 1.1447, + "step": 12199 + }, + { + "epoch": 0.37, + "learning_rate": 3.649220869106192e-06, + "loss": 1.0284, + "step": 12200 + }, + { + "epoch": 0.37, + "learning_rate": 3.6490042430463644e-06, + "loss": 1.1149, + "step": 12201 + }, + { + "epoch": 0.37, + "learning_rate": 3.6487876060485687e-06, + "loss": 1.1354, + "step": 12202 + }, + { + "epoch": 0.37, + "learning_rate": 3.6485709581148687e-06, + "loss": 1.083, + "step": 12203 + }, + { + "epoch": 0.37, + "learning_rate": 3.6483542992473264e-06, + "loss": 0.9887, + "step": 12204 + }, + { + "epoch": 0.37, + "learning_rate": 3.6481376294480053e-06, + "loss": 1.2346, + "step": 12205 + }, + { + "epoch": 0.37, + "learning_rate": 3.6479209487189654e-06, + "loss": 1.1793, + "step": 12206 + }, + { + "epoch": 0.37, + "learning_rate": 3.647704257062272e-06, + "loss": 1.1788, + "step": 12207 + }, + { + "epoch": 0.37, + "learning_rate": 3.647487554479986e-06, + "loss": 1.2413, + "step": 12208 + }, + { + "epoch": 0.37, + "learning_rate": 3.647270840974172e-06, + "loss": 1.0497, + "step": 12209 + }, + { + "epoch": 0.37, + "learning_rate": 3.6470541165468913e-06, + "loss": 1.1605, + "step": 12210 + }, + { + "epoch": 0.37, + "learning_rate": 3.646837381200209e-06, + "loss": 1.1663, + "step": 12211 + }, + { + "epoch": 0.37, + "learning_rate": 3.6466206349361853e-06, + "loss": 1.1798, + "step": 12212 + }, + { + "epoch": 0.37, + "learning_rate": 3.6464038777568865e-06, + "loss": 1.1712, + "step": 12213 + }, + { + "epoch": 0.37, + "learning_rate": 3.6461871096643754e-06, + "loss": 1.1076, + "step": 12214 + }, + { + "epoch": 0.37, + "learning_rate": 3.645970330660714e-06, + "loss": 1.0457, + "step": 12215 + }, + { + "epoch": 0.37, + "learning_rate": 3.6457535407479677e-06, + "loss": 1.1397, + "step": 12216 + }, + { + "epoch": 0.37, + "learning_rate": 3.6455367399281987e-06, + "loss": 1.1672, + "step": 12217 + }, + { + "epoch": 0.37, + "learning_rate": 3.645319928203473e-06, + "loss": 1.2368, + "step": 12218 + }, + { + "epoch": 0.37, + "learning_rate": 3.645103105575852e-06, + "loss": 1.1968, + "step": 12219 + }, + { + "epoch": 0.37, + "learning_rate": 3.6448862720474014e-06, + "loss": 1.0892, + "step": 12220 + }, + { + "epoch": 0.37, + "learning_rate": 3.644669427620185e-06, + "loss": 1.1362, + "step": 12221 + }, + { + "epoch": 0.37, + "learning_rate": 3.644452572296267e-06, + "loss": 1.1425, + "step": 12222 + }, + { + "epoch": 0.37, + "learning_rate": 3.644235706077711e-06, + "loss": 1.1555, + "step": 12223 + }, + { + "epoch": 0.37, + "learning_rate": 3.6440188289665835e-06, + "loss": 1.184, + "step": 12224 + }, + { + "epoch": 0.37, + "learning_rate": 3.6438019409649463e-06, + "loss": 1.1549, + "step": 12225 + }, + { + "epoch": 0.37, + "learning_rate": 3.6435850420748657e-06, + "loss": 1.0859, + "step": 12226 + }, + { + "epoch": 0.37, + "learning_rate": 3.6433681322984073e-06, + "loss": 1.114, + "step": 12227 + }, + { + "epoch": 0.37, + "learning_rate": 3.643151211637634e-06, + "loss": 1.2493, + "step": 12228 + }, + { + "epoch": 0.37, + "learning_rate": 3.6429342800946116e-06, + "loss": 1.1893, + "step": 12229 + }, + { + "epoch": 0.37, + "learning_rate": 3.6427173376714053e-06, + "loss": 1.1926, + "step": 12230 + }, + { + "epoch": 0.37, + "learning_rate": 3.6425003843700814e-06, + "loss": 1.19, + "step": 12231 + }, + { + "epoch": 0.37, + "learning_rate": 3.6422834201927032e-06, + "loss": 1.0647, + "step": 12232 + }, + { + "epoch": 0.37, + "learning_rate": 3.642066445141337e-06, + "loss": 1.2833, + "step": 12233 + }, + { + "epoch": 0.37, + "learning_rate": 3.6418494592180487e-06, + "loss": 1.0999, + "step": 12234 + }, + { + "epoch": 0.37, + "learning_rate": 3.6416324624249033e-06, + "loss": 1.2614, + "step": 12235 + }, + { + "epoch": 0.37, + "learning_rate": 3.641415454763967e-06, + "loss": 1.0389, + "step": 12236 + }, + { + "epoch": 0.37, + "learning_rate": 3.641198436237305e-06, + "loss": 1.198, + "step": 12237 + }, + { + "epoch": 0.37, + "learning_rate": 3.640981406846983e-06, + "loss": 1.2281, + "step": 12238 + }, + { + "epoch": 0.37, + "learning_rate": 3.640764366595068e-06, + "loss": 1.1489, + "step": 12239 + }, + { + "epoch": 0.37, + "learning_rate": 3.6405473154836257e-06, + "loss": 1.1187, + "step": 12240 + }, + { + "epoch": 0.37, + "learning_rate": 3.640330253514722e-06, + "loss": 1.0682, + "step": 12241 + }, + { + "epoch": 0.37, + "learning_rate": 3.6401131806904234e-06, + "loss": 1.2128, + "step": 12242 + }, + { + "epoch": 0.37, + "learning_rate": 3.639896097012797e-06, + "loss": 1.21, + "step": 12243 + }, + { + "epoch": 0.37, + "learning_rate": 3.6396790024839077e-06, + "loss": 1.1714, + "step": 12244 + }, + { + "epoch": 0.37, + "learning_rate": 3.6394618971058243e-06, + "loss": 1.1255, + "step": 12245 + }, + { + "epoch": 0.37, + "learning_rate": 3.639244780880612e-06, + "loss": 1.1263, + "step": 12246 + }, + { + "epoch": 0.37, + "learning_rate": 3.6390276538103383e-06, + "loss": 1.1681, + "step": 12247 + }, + { + "epoch": 0.37, + "learning_rate": 3.63881051589707e-06, + "loss": 1.1916, + "step": 12248 + }, + { + "epoch": 0.37, + "learning_rate": 3.6385933671428732e-06, + "loss": 1.1273, + "step": 12249 + }, + { + "epoch": 0.37, + "learning_rate": 3.638376207549817e-06, + "loss": 1.1255, + "step": 12250 + }, + { + "epoch": 0.37, + "learning_rate": 3.6381590371199667e-06, + "loss": 1.0791, + "step": 12251 + }, + { + "epoch": 0.37, + "learning_rate": 3.637941855855391e-06, + "loss": 1.1346, + "step": 12252 + }, + { + "epoch": 0.37, + "learning_rate": 3.6377246637581564e-06, + "loss": 0.9947, + "step": 12253 + }, + { + "epoch": 0.37, + "learning_rate": 3.6375074608303314e-06, + "loss": 1.1168, + "step": 12254 + }, + { + "epoch": 0.37, + "learning_rate": 3.6372902470739834e-06, + "loss": 1.2406, + "step": 12255 + }, + { + "epoch": 0.37, + "learning_rate": 3.6370730224911792e-06, + "loss": 1.1238, + "step": 12256 + }, + { + "epoch": 0.37, + "learning_rate": 3.636855787083988e-06, + "loss": 1.0399, + "step": 12257 + }, + { + "epoch": 0.37, + "learning_rate": 3.6366385408544768e-06, + "loss": 1.0781, + "step": 12258 + }, + { + "epoch": 0.37, + "learning_rate": 3.6364212838047154e-06, + "loss": 1.0507, + "step": 12259 + }, + { + "epoch": 0.37, + "learning_rate": 3.636204015936769e-06, + "loss": 1.1289, + "step": 12260 + }, + { + "epoch": 0.37, + "learning_rate": 3.635986737252709e-06, + "loss": 1.1435, + "step": 12261 + }, + { + "epoch": 0.37, + "learning_rate": 3.635769447754601e-06, + "loss": 1.1508, + "step": 12262 + }, + { + "epoch": 0.37, + "learning_rate": 3.6355521474445167e-06, + "loss": 1.1956, + "step": 12263 + }, + { + "epoch": 0.37, + "learning_rate": 3.635334836324521e-06, + "loss": 1.2203, + "step": 12264 + }, + { + "epoch": 0.37, + "learning_rate": 3.6351175143966854e-06, + "loss": 1.209, + "step": 12265 + }, + { + "epoch": 0.37, + "learning_rate": 3.6349001816630776e-06, + "loss": 1.1381, + "step": 12266 + }, + { + "epoch": 0.37, + "learning_rate": 3.6346828381257665e-06, + "loss": 1.0688, + "step": 12267 + }, + { + "epoch": 0.37, + "learning_rate": 3.6344654837868215e-06, + "loss": 1.2382, + "step": 12268 + }, + { + "epoch": 0.37, + "learning_rate": 3.6342481186483115e-06, + "loss": 1.1426, + "step": 12269 + }, + { + "epoch": 0.37, + "learning_rate": 3.634030742712305e-06, + "loss": 1.2439, + "step": 12270 + }, + { + "epoch": 0.37, + "learning_rate": 3.6338133559808723e-06, + "loss": 1.0554, + "step": 12271 + }, + { + "epoch": 0.37, + "learning_rate": 3.633595958456083e-06, + "loss": 1.0665, + "step": 12272 + }, + { + "epoch": 0.37, + "learning_rate": 3.6333785501400058e-06, + "loss": 1.1827, + "step": 12273 + }, + { + "epoch": 0.37, + "learning_rate": 3.6331611310347113e-06, + "loss": 1.1652, + "step": 12274 + }, + { + "epoch": 0.37, + "learning_rate": 3.6329437011422677e-06, + "loss": 1.0258, + "step": 12275 + }, + { + "epoch": 0.37, + "learning_rate": 3.632726260464746e-06, + "loss": 1.1655, + "step": 12276 + }, + { + "epoch": 0.37, + "learning_rate": 3.632508809004216e-06, + "loss": 1.0211, + "step": 12277 + }, + { + "epoch": 0.37, + "learning_rate": 3.632291346762748e-06, + "loss": 1.1124, + "step": 12278 + }, + { + "epoch": 0.37, + "learning_rate": 3.632073873742411e-06, + "loss": 1.0954, + "step": 12279 + }, + { + "epoch": 0.37, + "learning_rate": 3.6318563899452756e-06, + "loss": 1.1771, + "step": 12280 + }, + { + "epoch": 0.37, + "learning_rate": 3.6316388953734135e-06, + "loss": 1.1286, + "step": 12281 + }, + { + "epoch": 0.37, + "learning_rate": 3.631421390028893e-06, + "loss": 1.1547, + "step": 12282 + }, + { + "epoch": 0.37, + "learning_rate": 3.631203873913787e-06, + "loss": 1.0486, + "step": 12283 + }, + { + "epoch": 0.37, + "learning_rate": 3.6309863470301643e-06, + "loss": 1.1062, + "step": 12284 + }, + { + "epoch": 0.37, + "learning_rate": 3.6307688093800957e-06, + "loss": 1.0222, + "step": 12285 + }, + { + "epoch": 0.37, + "learning_rate": 3.6305512609656534e-06, + "loss": 1.0738, + "step": 12286 + }, + { + "epoch": 0.37, + "learning_rate": 3.6303337017889074e-06, + "loss": 1.1357, + "step": 12287 + }, + { + "epoch": 0.37, + "learning_rate": 3.630116131851929e-06, + "loss": 1.0372, + "step": 12288 + }, + { + "epoch": 0.37, + "learning_rate": 3.6298985511567897e-06, + "loss": 1.1125, + "step": 12289 + }, + { + "epoch": 0.37, + "learning_rate": 3.629680959705559e-06, + "loss": 1.0859, + "step": 12290 + }, + { + "epoch": 0.37, + "learning_rate": 3.629463357500311e-06, + "loss": 1.0981, + "step": 12291 + }, + { + "epoch": 0.37, + "learning_rate": 3.6292457445431157e-06, + "loss": 1.0484, + "step": 12292 + }, + { + "epoch": 0.37, + "learning_rate": 3.6290281208360446e-06, + "loss": 1.1016, + "step": 12293 + }, + { + "epoch": 0.37, + "learning_rate": 3.6288104863811695e-06, + "loss": 1.0958, + "step": 12294 + }, + { + "epoch": 0.37, + "learning_rate": 3.6285928411805616e-06, + "loss": 1.0773, + "step": 12295 + }, + { + "epoch": 0.37, + "learning_rate": 3.6283751852362946e-06, + "loss": 1.2026, + "step": 12296 + }, + { + "epoch": 0.37, + "learning_rate": 3.628157518550438e-06, + "loss": 1.1691, + "step": 12297 + }, + { + "epoch": 0.37, + "learning_rate": 3.627939841125066e-06, + "loss": 1.1084, + "step": 12298 + }, + { + "epoch": 0.37, + "learning_rate": 3.6277221529622497e-06, + "loss": 1.2235, + "step": 12299 + }, + { + "epoch": 0.37, + "learning_rate": 3.627504454064062e-06, + "loss": 1.2161, + "step": 12300 + }, + { + "epoch": 0.37, + "learning_rate": 3.6272867444325744e-06, + "loss": 1.1578, + "step": 12301 + }, + { + "epoch": 0.37, + "learning_rate": 3.62706902406986e-06, + "loss": 1.177, + "step": 12302 + }, + { + "epoch": 0.37, + "learning_rate": 3.6268512929779913e-06, + "loss": 1.0402, + "step": 12303 + }, + { + "epoch": 0.37, + "learning_rate": 3.626633551159041e-06, + "loss": 1.2166, + "step": 12304 + }, + { + "epoch": 0.37, + "learning_rate": 3.6264157986150823e-06, + "loss": 1.1365, + "step": 12305 + }, + { + "epoch": 0.37, + "learning_rate": 3.6261980353481876e-06, + "loss": 1.2209, + "step": 12306 + }, + { + "epoch": 0.37, + "learning_rate": 3.62598026136043e-06, + "loss": 1.0623, + "step": 12307 + }, + { + "epoch": 0.37, + "learning_rate": 3.625762476653882e-06, + "loss": 1.0901, + "step": 12308 + }, + { + "epoch": 0.37, + "learning_rate": 3.6255446812306183e-06, + "loss": 1.1322, + "step": 12309 + }, + { + "epoch": 0.37, + "learning_rate": 3.6253268750927107e-06, + "loss": 1.1544, + "step": 12310 + }, + { + "epoch": 0.37, + "learning_rate": 3.6251090582422326e-06, + "loss": 1.1238, + "step": 12311 + }, + { + "epoch": 0.37, + "learning_rate": 3.624891230681259e-06, + "loss": 1.1094, + "step": 12312 + }, + { + "epoch": 0.37, + "learning_rate": 3.624673392411863e-06, + "loss": 1.14, + "step": 12313 + }, + { + "epoch": 0.37, + "learning_rate": 3.6244555434361173e-06, + "loss": 1.0953, + "step": 12314 + }, + { + "epoch": 0.37, + "learning_rate": 3.6242376837560967e-06, + "loss": 1.0691, + "step": 12315 + }, + { + "epoch": 0.37, + "learning_rate": 3.6240198133738746e-06, + "loss": 1.1116, + "step": 12316 + }, + { + "epoch": 0.37, + "learning_rate": 3.623801932291525e-06, + "loss": 1.2587, + "step": 12317 + }, + { + "epoch": 0.37, + "learning_rate": 3.6235840405111226e-06, + "loss": 1.2123, + "step": 12318 + }, + { + "epoch": 0.37, + "learning_rate": 3.623366138034741e-06, + "loss": 1.1716, + "step": 12319 + }, + { + "epoch": 0.37, + "learning_rate": 3.6231482248644557e-06, + "loss": 1.1, + "step": 12320 + }, + { + "epoch": 0.37, + "learning_rate": 3.6229303010023393e-06, + "loss": 1.0953, + "step": 12321 + }, + { + "epoch": 0.37, + "learning_rate": 3.6227123664504676e-06, + "loss": 1.1802, + "step": 12322 + }, + { + "epoch": 0.37, + "learning_rate": 3.6224944212109146e-06, + "loss": 1.1478, + "step": 12323 + }, + { + "epoch": 0.37, + "learning_rate": 3.6222764652857556e-06, + "loss": 1.0317, + "step": 12324 + }, + { + "epoch": 0.37, + "learning_rate": 3.6220584986770652e-06, + "loss": 1.188, + "step": 12325 + }, + { + "epoch": 0.37, + "learning_rate": 3.621840521386918e-06, + "loss": 1.1674, + "step": 12326 + }, + { + "epoch": 0.37, + "learning_rate": 3.6216225334173895e-06, + "loss": 1.0129, + "step": 12327 + }, + { + "epoch": 0.37, + "learning_rate": 3.621404534770555e-06, + "loss": 1.1494, + "step": 12328 + }, + { + "epoch": 0.37, + "learning_rate": 3.621186525448489e-06, + "loss": 1.1321, + "step": 12329 + }, + { + "epoch": 0.37, + "learning_rate": 3.6209685054532674e-06, + "loss": 1.2148, + "step": 12330 + }, + { + "epoch": 0.37, + "learning_rate": 3.6207504747869654e-06, + "loss": 1.3036, + "step": 12331 + }, + { + "epoch": 0.37, + "learning_rate": 3.6205324334516584e-06, + "loss": 1.0821, + "step": 12332 + }, + { + "epoch": 0.37, + "learning_rate": 3.620314381449423e-06, + "loss": 1.08, + "step": 12333 + }, + { + "epoch": 0.37, + "learning_rate": 3.6200963187823335e-06, + "loss": 1.0784, + "step": 12334 + }, + { + "epoch": 0.37, + "learning_rate": 3.6198782454524672e-06, + "loss": 1.1465, + "step": 12335 + }, + { + "epoch": 0.37, + "learning_rate": 3.6196601614618986e-06, + "loss": 1.1937, + "step": 12336 + }, + { + "epoch": 0.37, + "learning_rate": 3.6194420668127056e-06, + "loss": 1.2167, + "step": 12337 + }, + { + "epoch": 0.37, + "learning_rate": 3.6192239615069623e-06, + "loss": 1.0833, + "step": 12338 + }, + { + "epoch": 0.37, + "learning_rate": 3.6190058455467457e-06, + "loss": 1.181, + "step": 12339 + }, + { + "epoch": 0.37, + "learning_rate": 3.618787718934133e-06, + "loss": 1.1902, + "step": 12340 + }, + { + "epoch": 0.37, + "learning_rate": 3.6185695816712004e-06, + "loss": 1.089, + "step": 12341 + }, + { + "epoch": 0.37, + "learning_rate": 3.6183514337600235e-06, + "loss": 1.1046, + "step": 12342 + }, + { + "epoch": 0.37, + "learning_rate": 3.61813327520268e-06, + "loss": 1.1824, + "step": 12343 + }, + { + "epoch": 0.37, + "learning_rate": 3.6179151060012456e-06, + "loss": 1.1183, + "step": 12344 + }, + { + "epoch": 0.37, + "learning_rate": 3.6176969261577978e-06, + "loss": 1.1425, + "step": 12345 + }, + { + "epoch": 0.37, + "learning_rate": 3.6174787356744145e-06, + "loss": 1.1496, + "step": 12346 + }, + { + "epoch": 0.37, + "learning_rate": 3.617260534553171e-06, + "loss": 1.1011, + "step": 12347 + }, + { + "epoch": 0.37, + "learning_rate": 3.617042322796146e-06, + "loss": 1.0813, + "step": 12348 + }, + { + "epoch": 0.37, + "learning_rate": 3.616824100405415e-06, + "loss": 1.1428, + "step": 12349 + }, + { + "epoch": 0.37, + "learning_rate": 3.616605867383057e-06, + "loss": 1.1527, + "step": 12350 + }, + { + "epoch": 0.37, + "learning_rate": 3.616387623731149e-06, + "loss": 1.0539, + "step": 12351 + }, + { + "epoch": 0.37, + "learning_rate": 3.6161693694517684e-06, + "loss": 1.097, + "step": 12352 + }, + { + "epoch": 0.37, + "learning_rate": 3.615951104546993e-06, + "loss": 1.0858, + "step": 12353 + }, + { + "epoch": 0.37, + "learning_rate": 3.615732829018901e-06, + "loss": 1.0938, + "step": 12354 + }, + { + "epoch": 0.37, + "learning_rate": 3.615514542869569e-06, + "loss": 1.1398, + "step": 12355 + }, + { + "epoch": 0.37, + "learning_rate": 3.6152962461010765e-06, + "loss": 1.0455, + "step": 12356 + }, + { + "epoch": 0.37, + "learning_rate": 3.6150779387155003e-06, + "loss": 1.1075, + "step": 12357 + }, + { + "epoch": 0.37, + "learning_rate": 3.61485962071492e-06, + "loss": 1.1603, + "step": 12358 + }, + { + "epoch": 0.37, + "learning_rate": 3.6146412921014122e-06, + "loss": 1.1244, + "step": 12359 + }, + { + "epoch": 0.37, + "learning_rate": 3.6144229528770564e-06, + "loss": 1.177, + "step": 12360 + }, + { + "epoch": 0.37, + "learning_rate": 3.614204603043931e-06, + "loss": 1.1126, + "step": 12361 + }, + { + "epoch": 0.37, + "learning_rate": 3.613986242604114e-06, + "loss": 1.2108, + "step": 12362 + }, + { + "epoch": 0.37, + "learning_rate": 3.613767871559685e-06, + "loss": 1.2134, + "step": 12363 + }, + { + "epoch": 0.37, + "learning_rate": 3.613549489912722e-06, + "loss": 1.1245, + "step": 12364 + }, + { + "epoch": 0.37, + "learning_rate": 3.613331097665304e-06, + "loss": 1.0144, + "step": 12365 + }, + { + "epoch": 0.37, + "learning_rate": 3.6131126948195106e-06, + "loss": 1.0989, + "step": 12366 + }, + { + "epoch": 0.37, + "learning_rate": 3.6128942813774197e-06, + "loss": 1.3331, + "step": 12367 + }, + { + "epoch": 0.37, + "learning_rate": 3.6126758573411117e-06, + "loss": 1.1478, + "step": 12368 + }, + { + "epoch": 0.37, + "learning_rate": 3.6124574227126656e-06, + "loss": 1.2028, + "step": 12369 + }, + { + "epoch": 0.37, + "learning_rate": 3.61223897749416e-06, + "loss": 1.1877, + "step": 12370 + }, + { + "epoch": 0.37, + "learning_rate": 3.6120205216876757e-06, + "loss": 1.1725, + "step": 12371 + }, + { + "epoch": 0.37, + "learning_rate": 3.6118020552952916e-06, + "loss": 1.1371, + "step": 12372 + }, + { + "epoch": 0.37, + "learning_rate": 3.611583578319087e-06, + "loss": 1.1051, + "step": 12373 + }, + { + "epoch": 0.37, + "learning_rate": 3.6113650907611426e-06, + "loss": 1.1483, + "step": 12374 + }, + { + "epoch": 0.37, + "learning_rate": 3.6111465926235366e-06, + "loss": 1.1085, + "step": 12375 + }, + { + "epoch": 0.37, + "learning_rate": 3.6109280839083517e-06, + "loss": 1.0294, + "step": 12376 + }, + { + "epoch": 0.37, + "learning_rate": 3.6107095646176653e-06, + "loss": 1.0939, + "step": 12377 + }, + { + "epoch": 0.37, + "learning_rate": 3.6104910347535598e-06, + "loss": 1.0613, + "step": 12378 + }, + { + "epoch": 0.37, + "learning_rate": 3.6102724943181133e-06, + "loss": 1.1254, + "step": 12379 + }, + { + "epoch": 0.37, + "learning_rate": 3.610053943313408e-06, + "loss": 1.1762, + "step": 12380 + }, + { + "epoch": 0.37, + "learning_rate": 3.6098353817415236e-06, + "loss": 1.1996, + "step": 12381 + }, + { + "epoch": 0.37, + "learning_rate": 3.6096168096045414e-06, + "loss": 1.0309, + "step": 12382 + }, + { + "epoch": 0.37, + "learning_rate": 3.6093982269045412e-06, + "loss": 1.1242, + "step": 12383 + }, + { + "epoch": 0.37, + "learning_rate": 3.6091796336436047e-06, + "loss": 1.1802, + "step": 12384 + }, + { + "epoch": 0.37, + "learning_rate": 3.6089610298238116e-06, + "loss": 1.1758, + "step": 12385 + }, + { + "epoch": 0.37, + "learning_rate": 3.6087424154472432e-06, + "loss": 1.1704, + "step": 12386 + }, + { + "epoch": 0.37, + "learning_rate": 3.608523790515982e-06, + "loss": 1.2847, + "step": 12387 + }, + { + "epoch": 0.37, + "learning_rate": 3.608305155032108e-06, + "loss": 1.1306, + "step": 12388 + }, + { + "epoch": 0.37, + "learning_rate": 3.6080865089977023e-06, + "loss": 1.1157, + "step": 12389 + }, + { + "epoch": 0.37, + "learning_rate": 3.6078678524148467e-06, + "loss": 1.1677, + "step": 12390 + }, + { + "epoch": 0.37, + "learning_rate": 3.6076491852856233e-06, + "loss": 1.0076, + "step": 12391 + }, + { + "epoch": 0.37, + "learning_rate": 3.607430507612113e-06, + "loss": 1.2226, + "step": 12392 + }, + { + "epoch": 0.37, + "learning_rate": 3.6072118193963968e-06, + "loss": 1.1808, + "step": 12393 + }, + { + "epoch": 0.37, + "learning_rate": 3.606993120640558e-06, + "loss": 1.0797, + "step": 12394 + }, + { + "epoch": 0.37, + "learning_rate": 3.606774411346678e-06, + "loss": 1.1646, + "step": 12395 + }, + { + "epoch": 0.37, + "learning_rate": 3.606555691516838e-06, + "loss": 1.1723, + "step": 12396 + }, + { + "epoch": 0.37, + "learning_rate": 3.6063369611531213e-06, + "loss": 1.087, + "step": 12397 + }, + { + "epoch": 0.37, + "learning_rate": 3.6061182202576095e-06, + "loss": 1.1599, + "step": 12398 + }, + { + "epoch": 0.37, + "learning_rate": 3.6058994688323846e-06, + "loss": 1.1031, + "step": 12399 + }, + { + "epoch": 0.37, + "learning_rate": 3.6056807068795295e-06, + "loss": 1.1719, + "step": 12400 + }, + { + "epoch": 0.37, + "learning_rate": 3.6054619344011267e-06, + "loss": 1.1252, + "step": 12401 + }, + { + "epoch": 0.37, + "learning_rate": 3.6052431513992593e-06, + "loss": 1.2201, + "step": 12402 + }, + { + "epoch": 0.37, + "learning_rate": 3.6050243578760086e-06, + "loss": 1.1695, + "step": 12403 + }, + { + "epoch": 0.37, + "learning_rate": 3.6048055538334587e-06, + "loss": 1.1024, + "step": 12404 + }, + { + "epoch": 0.37, + "learning_rate": 3.6045867392736916e-06, + "loss": 1.0978, + "step": 12405 + }, + { + "epoch": 0.37, + "learning_rate": 3.604367914198791e-06, + "loss": 1.1492, + "step": 12406 + }, + { + "epoch": 0.37, + "learning_rate": 3.60414907861084e-06, + "loss": 1.1241, + "step": 12407 + }, + { + "epoch": 0.37, + "learning_rate": 3.6039302325119208e-06, + "loss": 1.0602, + "step": 12408 + }, + { + "epoch": 0.37, + "learning_rate": 3.6037113759041177e-06, + "loss": 1.0582, + "step": 12409 + }, + { + "epoch": 0.37, + "learning_rate": 3.603492508789514e-06, + "loss": 1.2258, + "step": 12410 + }, + { + "epoch": 0.37, + "learning_rate": 3.6032736311701927e-06, + "loss": 1.1405, + "step": 12411 + }, + { + "epoch": 0.37, + "learning_rate": 3.603054743048238e-06, + "loss": 0.9793, + "step": 12412 + }, + { + "epoch": 0.37, + "learning_rate": 3.602835844425734e-06, + "loss": 1.0823, + "step": 12413 + }, + { + "epoch": 0.37, + "learning_rate": 3.602616935304763e-06, + "loss": 1.1096, + "step": 12414 + }, + { + "epoch": 0.37, + "learning_rate": 3.6023980156874106e-06, + "loss": 1.0665, + "step": 12415 + }, + { + "epoch": 0.37, + "learning_rate": 3.6021790855757595e-06, + "loss": 1.1306, + "step": 12416 + }, + { + "epoch": 0.37, + "learning_rate": 3.6019601449718948e-06, + "loss": 1.1257, + "step": 12417 + }, + { + "epoch": 0.37, + "learning_rate": 3.6017411938779e-06, + "loss": 1.1445, + "step": 12418 + }, + { + "epoch": 0.37, + "learning_rate": 3.60152223229586e-06, + "loss": 1.0715, + "step": 12419 + }, + { + "epoch": 0.37, + "learning_rate": 3.601303260227858e-06, + "loss": 1.1312, + "step": 12420 + }, + { + "epoch": 0.37, + "learning_rate": 3.6010842776759795e-06, + "loss": 1.0476, + "step": 12421 + }, + { + "epoch": 0.37, + "learning_rate": 3.6008652846423093e-06, + "loss": 1.1331, + "step": 12422 + }, + { + "epoch": 0.37, + "learning_rate": 3.6006462811289323e-06, + "loss": 1.1312, + "step": 12423 + }, + { + "epoch": 0.37, + "learning_rate": 3.600427267137932e-06, + "loss": 1.1854, + "step": 12424 + }, + { + "epoch": 0.37, + "learning_rate": 3.600208242671394e-06, + "loss": 1.1505, + "step": 12425 + }, + { + "epoch": 0.37, + "learning_rate": 3.5999892077314042e-06, + "loss": 1.1487, + "step": 12426 + }, + { + "epoch": 0.37, + "learning_rate": 3.5997701623200465e-06, + "loss": 1.1946, + "step": 12427 + }, + { + "epoch": 0.37, + "learning_rate": 3.599551106439407e-06, + "loss": 1.0819, + "step": 12428 + }, + { + "epoch": 0.37, + "learning_rate": 3.5993320400915695e-06, + "loss": 1.1003, + "step": 12429 + }, + { + "epoch": 0.37, + "learning_rate": 3.5991129632786214e-06, + "loss": 1.1302, + "step": 12430 + }, + { + "epoch": 0.37, + "learning_rate": 3.5988938760026463e-06, + "loss": 1.2175, + "step": 12431 + }, + { + "epoch": 0.37, + "learning_rate": 3.5986747782657317e-06, + "loss": 1.2223, + "step": 12432 + }, + { + "epoch": 0.37, + "learning_rate": 3.598455670069962e-06, + "loss": 1.1357, + "step": 12433 + }, + { + "epoch": 0.37, + "learning_rate": 3.598236551417423e-06, + "loss": 1.0928, + "step": 12434 + }, + { + "epoch": 0.37, + "learning_rate": 3.598017422310201e-06, + "loss": 1.1297, + "step": 12435 + }, + { + "epoch": 0.37, + "learning_rate": 3.5977982827503827e-06, + "loss": 1.2681, + "step": 12436 + }, + { + "epoch": 0.37, + "learning_rate": 3.597579132740053e-06, + "loss": 1.0499, + "step": 12437 + }, + { + "epoch": 0.37, + "learning_rate": 3.597359972281298e-06, + "loss": 1.2749, + "step": 12438 + }, + { + "epoch": 0.37, + "learning_rate": 3.5971408013762054e-06, + "loss": 1.287, + "step": 12439 + }, + { + "epoch": 0.37, + "learning_rate": 3.59692162002686e-06, + "loss": 1.1264, + "step": 12440 + }, + { + "epoch": 0.37, + "learning_rate": 3.5967024282353504e-06, + "loss": 1.1444, + "step": 12441 + }, + { + "epoch": 0.37, + "learning_rate": 3.596483226003761e-06, + "loss": 1.0738, + "step": 12442 + }, + { + "epoch": 0.37, + "learning_rate": 3.59626401333418e-06, + "loss": 1.3298, + "step": 12443 + }, + { + "epoch": 0.37, + "learning_rate": 3.596044790228692e-06, + "loss": 1.1602, + "step": 12444 + }, + { + "epoch": 0.37, + "learning_rate": 3.595825556689387e-06, + "loss": 1.1285, + "step": 12445 + }, + { + "epoch": 0.37, + "learning_rate": 3.5956063127183495e-06, + "loss": 1.1315, + "step": 12446 + }, + { + "epoch": 0.37, + "learning_rate": 3.595387058317668e-06, + "loss": 1.0502, + "step": 12447 + }, + { + "epoch": 0.37, + "learning_rate": 3.59516779348943e-06, + "loss": 1.1444, + "step": 12448 + }, + { + "epoch": 0.38, + "learning_rate": 3.594948518235721e-06, + "loss": 1.1342, + "step": 12449 + }, + { + "epoch": 0.38, + "learning_rate": 3.594729232558629e-06, + "loss": 1.1294, + "step": 12450 + }, + { + "epoch": 0.38, + "learning_rate": 3.594509936460243e-06, + "loss": 1.1654, + "step": 12451 + }, + { + "epoch": 0.38, + "learning_rate": 3.5942906299426492e-06, + "loss": 1.178, + "step": 12452 + }, + { + "epoch": 0.38, + "learning_rate": 3.594071313007936e-06, + "loss": 1.0925, + "step": 12453 + }, + { + "epoch": 0.38, + "learning_rate": 3.5938519856581906e-06, + "loss": 1.0681, + "step": 12454 + }, + { + "epoch": 0.38, + "learning_rate": 3.5936326478955007e-06, + "loss": 1.2289, + "step": 12455 + }, + { + "epoch": 0.38, + "learning_rate": 3.5934132997219552e-06, + "loss": 1.1204, + "step": 12456 + }, + { + "epoch": 0.38, + "learning_rate": 3.593193941139641e-06, + "loss": 1.025, + "step": 12457 + }, + { + "epoch": 0.38, + "learning_rate": 3.592974572150648e-06, + "loss": 1.1111, + "step": 12458 + }, + { + "epoch": 0.38, + "learning_rate": 3.592755192757063e-06, + "loss": 1.1743, + "step": 12459 + }, + { + "epoch": 0.38, + "learning_rate": 3.5925358029609745e-06, + "loss": 1.1562, + "step": 12460 + }, + { + "epoch": 0.38, + "learning_rate": 3.592316402764472e-06, + "loss": 1.1683, + "step": 12461 + }, + { + "epoch": 0.38, + "learning_rate": 3.592096992169643e-06, + "loss": 1.2518, + "step": 12462 + }, + { + "epoch": 0.38, + "learning_rate": 3.5918775711785765e-06, + "loss": 1.2887, + "step": 12463 + }, + { + "epoch": 0.38, + "learning_rate": 3.5916581397933613e-06, + "loss": 1.1059, + "step": 12464 + }, + { + "epoch": 0.38, + "learning_rate": 3.591438698016087e-06, + "loss": 1.1776, + "step": 12465 + }, + { + "epoch": 0.38, + "learning_rate": 3.5912192458488416e-06, + "loss": 1.0381, + "step": 12466 + }, + { + "epoch": 0.38, + "learning_rate": 3.5909997832937144e-06, + "loss": 1.1527, + "step": 12467 + }, + { + "epoch": 0.38, + "learning_rate": 3.590780310352795e-06, + "loss": 1.0754, + "step": 12468 + }, + { + "epoch": 0.38, + "learning_rate": 3.590560827028172e-06, + "loss": 1.1879, + "step": 12469 + }, + { + "epoch": 0.38, + "learning_rate": 3.5903413333219357e-06, + "loss": 1.1945, + "step": 12470 + }, + { + "epoch": 0.38, + "learning_rate": 3.5901218292361744e-06, + "loss": 1.0941, + "step": 12471 + }, + { + "epoch": 0.38, + "learning_rate": 3.5899023147729784e-06, + "loss": 1.0605, + "step": 12472 + }, + { + "epoch": 0.38, + "learning_rate": 3.5896827899344377e-06, + "loss": 1.1901, + "step": 12473 + }, + { + "epoch": 0.38, + "learning_rate": 3.5894632547226415e-06, + "loss": 1.0938, + "step": 12474 + }, + { + "epoch": 0.38, + "learning_rate": 3.58924370913968e-06, + "loss": 1.1437, + "step": 12475 + }, + { + "epoch": 0.38, + "learning_rate": 3.5890241531876425e-06, + "loss": 1.1064, + "step": 12476 + }, + { + "epoch": 0.38, + "learning_rate": 3.58880458686862e-06, + "loss": 1.2241, + "step": 12477 + }, + { + "epoch": 0.38, + "learning_rate": 3.5885850101847018e-06, + "loss": 1.1407, + "step": 12478 + }, + { + "epoch": 0.38, + "learning_rate": 3.588365423137978e-06, + "loss": 1.1085, + "step": 12479 + }, + { + "epoch": 0.38, + "learning_rate": 3.5881458257305415e-06, + "loss": 1.194, + "step": 12480 + }, + { + "epoch": 0.38, + "learning_rate": 3.5879262179644793e-06, + "loss": 1.1242, + "step": 12481 + }, + { + "epoch": 0.38, + "learning_rate": 3.5877065998418837e-06, + "loss": 1.0776, + "step": 12482 + }, + { + "epoch": 0.38, + "learning_rate": 3.5874869713648453e-06, + "loss": 1.0767, + "step": 12483 + }, + { + "epoch": 0.38, + "learning_rate": 3.5872673325354544e-06, + "loss": 1.0839, + "step": 12484 + }, + { + "epoch": 0.38, + "learning_rate": 3.5870476833558025e-06, + "loss": 1.187, + "step": 12485 + }, + { + "epoch": 0.38, + "learning_rate": 3.586828023827981e-06, + "loss": 1.1154, + "step": 12486 + }, + { + "epoch": 0.38, + "learning_rate": 3.5866083539540787e-06, + "loss": 1.1383, + "step": 12487 + }, + { + "epoch": 0.38, + "learning_rate": 3.5863886737361885e-06, + "loss": 1.1581, + "step": 12488 + }, + { + "epoch": 0.38, + "learning_rate": 3.5861689831764017e-06, + "loss": 1.2209, + "step": 12489 + }, + { + "epoch": 0.38, + "learning_rate": 3.5859492822768088e-06, + "loss": 1.057, + "step": 12490 + }, + { + "epoch": 0.38, + "learning_rate": 3.5857295710395023e-06, + "loss": 1.0992, + "step": 12491 + }, + { + "epoch": 0.38, + "learning_rate": 3.5855098494665723e-06, + "loss": 1.2119, + "step": 12492 + }, + { + "epoch": 0.38, + "learning_rate": 3.5852901175601122e-06, + "loss": 1.1857, + "step": 12493 + }, + { + "epoch": 0.38, + "learning_rate": 3.5850703753222126e-06, + "loss": 0.991, + "step": 12494 + }, + { + "epoch": 0.38, + "learning_rate": 3.5848506227549664e-06, + "loss": 1.1619, + "step": 12495 + }, + { + "epoch": 0.38, + "learning_rate": 3.584630859860464e-06, + "loss": 1.0284, + "step": 12496 + }, + { + "epoch": 0.38, + "learning_rate": 3.5844110866407983e-06, + "loss": 0.9839, + "step": 12497 + }, + { + "epoch": 0.38, + "learning_rate": 3.5841913030980612e-06, + "loss": 1.175, + "step": 12498 + }, + { + "epoch": 0.38, + "learning_rate": 3.5839715092343454e-06, + "loss": 1.0822, + "step": 12499 + }, + { + "epoch": 0.38, + "learning_rate": 3.583751705051742e-06, + "loss": 1.248, + "step": 12500 + }, + { + "epoch": 0.38, + "learning_rate": 3.5835318905523455e-06, + "loss": 1.1545, + "step": 12501 + }, + { + "epoch": 0.38, + "learning_rate": 3.583312065738247e-06, + "loss": 1.1305, + "step": 12502 + }, + { + "epoch": 0.38, + "learning_rate": 3.5830922306115383e-06, + "loss": 1.1902, + "step": 12503 + }, + { + "epoch": 0.38, + "learning_rate": 3.582872385174314e-06, + "loss": 1.1645, + "step": 12504 + }, + { + "epoch": 0.38, + "learning_rate": 3.5826525294286657e-06, + "loss": 1.0501, + "step": 12505 + }, + { + "epoch": 0.38, + "learning_rate": 3.5824326633766876e-06, + "loss": 1.0857, + "step": 12506 + }, + { + "epoch": 0.38, + "learning_rate": 3.5822127870204716e-06, + "loss": 1.1683, + "step": 12507 + }, + { + "epoch": 0.38, + "learning_rate": 3.5819929003621107e-06, + "loss": 1.1528, + "step": 12508 + }, + { + "epoch": 0.38, + "learning_rate": 3.5817730034036986e-06, + "loss": 1.0998, + "step": 12509 + }, + { + "epoch": 0.38, + "learning_rate": 3.581553096147329e-06, + "loss": 1.0237, + "step": 12510 + }, + { + "epoch": 0.38, + "learning_rate": 3.5813331785950938e-06, + "loss": 1.1207, + "step": 12511 + }, + { + "epoch": 0.38, + "learning_rate": 3.5811132507490887e-06, + "loss": 1.1367, + "step": 12512 + }, + { + "epoch": 0.38, + "learning_rate": 3.5808933126114055e-06, + "loss": 1.0913, + "step": 12513 + }, + { + "epoch": 0.38, + "learning_rate": 3.5806733641841384e-06, + "loss": 1.1518, + "step": 12514 + }, + { + "epoch": 0.38, + "learning_rate": 3.5804534054693817e-06, + "loss": 1.0828, + "step": 12515 + }, + { + "epoch": 0.38, + "learning_rate": 3.5802334364692285e-06, + "loss": 1.1261, + "step": 12516 + }, + { + "epoch": 0.38, + "learning_rate": 3.580013457185774e-06, + "loss": 1.2501, + "step": 12517 + }, + { + "epoch": 0.38, + "learning_rate": 3.5797934676211103e-06, + "loss": 1.219, + "step": 12518 + }, + { + "epoch": 0.38, + "learning_rate": 3.579573467777334e-06, + "loss": 1.1533, + "step": 12519 + }, + { + "epoch": 0.38, + "learning_rate": 3.5793534576565374e-06, + "loss": 1.1279, + "step": 12520 + }, + { + "epoch": 0.38, + "learning_rate": 3.5791334372608165e-06, + "loss": 1.1718, + "step": 12521 + }, + { + "epoch": 0.38, + "learning_rate": 3.578913406592265e-06, + "loss": 1.1394, + "step": 12522 + }, + { + "epoch": 0.38, + "learning_rate": 3.578693365652977e-06, + "loss": 1.1697, + "step": 12523 + }, + { + "epoch": 0.38, + "learning_rate": 3.5784733144450477e-06, + "loss": 1.1714, + "step": 12524 + }, + { + "epoch": 0.38, + "learning_rate": 3.5782532529705722e-06, + "loss": 1.2118, + "step": 12525 + }, + { + "epoch": 0.38, + "learning_rate": 3.5780331812316447e-06, + "loss": 1.1973, + "step": 12526 + }, + { + "epoch": 0.38, + "learning_rate": 3.5778130992303612e-06, + "loss": 1.1554, + "step": 12527 + }, + { + "epoch": 0.38, + "learning_rate": 3.577593006968815e-06, + "loss": 1.0536, + "step": 12528 + }, + { + "epoch": 0.38, + "learning_rate": 3.577372904449103e-06, + "loss": 1.1342, + "step": 12529 + }, + { + "epoch": 0.38, + "learning_rate": 3.5771527916733194e-06, + "loss": 1.1568, + "step": 12530 + }, + { + "epoch": 0.38, + "learning_rate": 3.5769326686435607e-06, + "loss": 1.1064, + "step": 12531 + }, + { + "epoch": 0.38, + "learning_rate": 3.576712535361921e-06, + "loss": 1.1357, + "step": 12532 + }, + { + "epoch": 0.38, + "learning_rate": 3.5764923918304968e-06, + "loss": 1.1164, + "step": 12533 + }, + { + "epoch": 0.38, + "learning_rate": 3.576272238051384e-06, + "loss": 1.1499, + "step": 12534 + }, + { + "epoch": 0.38, + "learning_rate": 3.576052074026677e-06, + "loss": 1.0696, + "step": 12535 + }, + { + "epoch": 0.38, + "learning_rate": 3.575831899758473e-06, + "loss": 1.158, + "step": 12536 + }, + { + "epoch": 0.38, + "learning_rate": 3.5756117152488667e-06, + "loss": 1.0806, + "step": 12537 + }, + { + "epoch": 0.38, + "learning_rate": 3.5753915204999555e-06, + "loss": 1.1331, + "step": 12538 + }, + { + "epoch": 0.38, + "learning_rate": 3.575171315513835e-06, + "loss": 1.0712, + "step": 12539 + }, + { + "epoch": 0.38, + "learning_rate": 3.5749511002926017e-06, + "loss": 1.1085, + "step": 12540 + }, + { + "epoch": 0.38, + "learning_rate": 3.5747308748383515e-06, + "loss": 1.083, + "step": 12541 + }, + { + "epoch": 0.38, + "learning_rate": 3.574510639153181e-06, + "loss": 1.1093, + "step": 12542 + }, + { + "epoch": 0.38, + "learning_rate": 3.574290393239186e-06, + "loss": 1.1823, + "step": 12543 + }, + { + "epoch": 0.38, + "learning_rate": 3.5740701370984644e-06, + "loss": 1.1915, + "step": 12544 + }, + { + "epoch": 0.38, + "learning_rate": 3.5738498707331115e-06, + "loss": 1.1727, + "step": 12545 + }, + { + "epoch": 0.38, + "learning_rate": 3.573629594145226e-06, + "loss": 1.0376, + "step": 12546 + }, + { + "epoch": 0.38, + "learning_rate": 3.5734093073369035e-06, + "loss": 1.0377, + "step": 12547 + }, + { + "epoch": 0.38, + "learning_rate": 3.5731890103102416e-06, + "loss": 1.0861, + "step": 12548 + }, + { + "epoch": 0.38, + "learning_rate": 3.572968703067338e-06, + "loss": 1.099, + "step": 12549 + }, + { + "epoch": 0.38, + "learning_rate": 3.5727483856102874e-06, + "loss": 1.0587, + "step": 12550 + }, + { + "epoch": 0.38, + "learning_rate": 3.57252805794119e-06, + "loss": 1.1573, + "step": 12551 + }, + { + "epoch": 0.38, + "learning_rate": 3.5723077200621414e-06, + "loss": 1.1428, + "step": 12552 + }, + { + "epoch": 0.38, + "learning_rate": 3.5720873719752404e-06, + "loss": 1.2992, + "step": 12553 + }, + { + "epoch": 0.38, + "learning_rate": 3.5718670136825833e-06, + "loss": 1.0422, + "step": 12554 + }, + { + "epoch": 0.38, + "learning_rate": 3.5716466451862693e-06, + "loss": 1.1763, + "step": 12555 + }, + { + "epoch": 0.38, + "learning_rate": 3.5714262664883945e-06, + "loss": 1.0751, + "step": 12556 + }, + { + "epoch": 0.38, + "learning_rate": 3.571205877591058e-06, + "loss": 1.0661, + "step": 12557 + }, + { + "epoch": 0.38, + "learning_rate": 3.5709854784963573e-06, + "loss": 1.1573, + "step": 12558 + }, + { + "epoch": 0.38, + "learning_rate": 3.5707650692063906e-06, + "loss": 1.1988, + "step": 12559 + }, + { + "epoch": 0.38, + "learning_rate": 3.5705446497232565e-06, + "loss": 1.2266, + "step": 12560 + }, + { + "epoch": 0.38, + "learning_rate": 3.5703242200490522e-06, + "loss": 1.1246, + "step": 12561 + }, + { + "epoch": 0.38, + "learning_rate": 3.570103780185878e-06, + "loss": 1.1796, + "step": 12562 + }, + { + "epoch": 0.38, + "learning_rate": 3.5698833301358304e-06, + "loss": 1.0385, + "step": 12563 + }, + { + "epoch": 0.38, + "learning_rate": 3.569662869901009e-06, + "loss": 1.1649, + "step": 12564 + }, + { + "epoch": 0.38, + "learning_rate": 3.569442399483512e-06, + "loss": 1.0692, + "step": 12565 + }, + { + "epoch": 0.38, + "learning_rate": 3.569221918885439e-06, + "loss": 1.1668, + "step": 12566 + }, + { + "epoch": 0.38, + "learning_rate": 3.5690014281088875e-06, + "loss": 1.2339, + "step": 12567 + }, + { + "epoch": 0.38, + "learning_rate": 3.5687809271559582e-06, + "loss": 1.1293, + "step": 12568 + }, + { + "epoch": 0.38, + "learning_rate": 3.568560416028748e-06, + "loss": 1.0173, + "step": 12569 + }, + { + "epoch": 0.38, + "learning_rate": 3.568339894729358e-06, + "loss": 1.0404, + "step": 12570 + }, + { + "epoch": 0.38, + "learning_rate": 3.5681193632598865e-06, + "loss": 1.1588, + "step": 12571 + }, + { + "epoch": 0.38, + "learning_rate": 3.567898821622433e-06, + "loss": 1.0924, + "step": 12572 + }, + { + "epoch": 0.38, + "learning_rate": 3.567678269819097e-06, + "loss": 1.0819, + "step": 12573 + }, + { + "epoch": 0.38, + "learning_rate": 3.5674577078519785e-06, + "loss": 1.1094, + "step": 12574 + }, + { + "epoch": 0.38, + "learning_rate": 3.5672371357231765e-06, + "loss": 1.1172, + "step": 12575 + }, + { + "epoch": 0.38, + "learning_rate": 3.567016553434791e-06, + "loss": 1.1651, + "step": 12576 + }, + { + "epoch": 0.38, + "learning_rate": 3.5667959609889225e-06, + "loss": 1.0901, + "step": 12577 + }, + { + "epoch": 0.38, + "learning_rate": 3.5665753583876692e-06, + "loss": 1.0991, + "step": 12578 + }, + { + "epoch": 0.38, + "learning_rate": 3.5663547456331325e-06, + "loss": 1.1486, + "step": 12579 + }, + { + "epoch": 0.38, + "learning_rate": 3.5661341227274128e-06, + "loss": 1.1891, + "step": 12580 + }, + { + "epoch": 0.38, + "learning_rate": 3.5659134896726087e-06, + "loss": 1.1631, + "step": 12581 + }, + { + "epoch": 0.38, + "learning_rate": 3.5656928464708217e-06, + "loss": 1.2069, + "step": 12582 + }, + { + "epoch": 0.38, + "learning_rate": 3.5654721931241533e-06, + "loss": 1.1671, + "step": 12583 + }, + { + "epoch": 0.38, + "learning_rate": 3.565251529634701e-06, + "loss": 1.0645, + "step": 12584 + }, + { + "epoch": 0.38, + "learning_rate": 3.5650308560045683e-06, + "loss": 1.1855, + "step": 12585 + }, + { + "epoch": 0.38, + "learning_rate": 3.564810172235854e-06, + "loss": 1.1104, + "step": 12586 + }, + { + "epoch": 0.38, + "learning_rate": 3.56458947833066e-06, + "loss": 1.1035, + "step": 12587 + }, + { + "epoch": 0.38, + "learning_rate": 3.5643687742910877e-06, + "loss": 1.0855, + "step": 12588 + }, + { + "epoch": 0.38, + "learning_rate": 3.564148060119236e-06, + "loss": 1.2375, + "step": 12589 + }, + { + "epoch": 0.38, + "learning_rate": 3.563927335817209e-06, + "loss": 1.1848, + "step": 12590 + }, + { + "epoch": 0.38, + "learning_rate": 3.5637066013871046e-06, + "loss": 0.9589, + "step": 12591 + }, + { + "epoch": 0.38, + "learning_rate": 3.563485856831026e-06, + "loss": 1.1115, + "step": 12592 + }, + { + "epoch": 0.38, + "learning_rate": 3.5632651021510743e-06, + "loss": 1.1166, + "step": 12593 + }, + { + "epoch": 0.38, + "learning_rate": 3.5630443373493518e-06, + "loss": 1.1119, + "step": 12594 + }, + { + "epoch": 0.38, + "learning_rate": 3.5628235624279576e-06, + "loss": 1.2274, + "step": 12595 + }, + { + "epoch": 0.38, + "learning_rate": 3.5626027773889967e-06, + "loss": 1.0874, + "step": 12596 + }, + { + "epoch": 0.38, + "learning_rate": 3.562381982234567e-06, + "loss": 1.1082, + "step": 12597 + }, + { + "epoch": 0.38, + "learning_rate": 3.562161176966774e-06, + "loss": 1.1705, + "step": 12598 + }, + { + "epoch": 0.38, + "learning_rate": 3.561940361587718e-06, + "loss": 1.1641, + "step": 12599 + }, + { + "epoch": 0.38, + "learning_rate": 3.5617195360995004e-06, + "loss": 1.0925, + "step": 12600 + }, + { + "epoch": 0.38, + "learning_rate": 3.5614987005042252e-06, + "loss": 1.1354, + "step": 12601 + }, + { + "epoch": 0.38, + "learning_rate": 3.5612778548039927e-06, + "loss": 1.0851, + "step": 12602 + }, + { + "epoch": 0.38, + "learning_rate": 3.5610569990009077e-06, + "loss": 1.0831, + "step": 12603 + }, + { + "epoch": 0.38, + "learning_rate": 3.56083613309707e-06, + "loss": 1.1599, + "step": 12604 + }, + { + "epoch": 0.38, + "learning_rate": 3.5606152570945827e-06, + "loss": 1.121, + "step": 12605 + }, + { + "epoch": 0.38, + "learning_rate": 3.5603943709955495e-06, + "loss": 1.0992, + "step": 12606 + }, + { + "epoch": 0.38, + "learning_rate": 3.5601734748020732e-06, + "loss": 1.1234, + "step": 12607 + }, + { + "epoch": 0.38, + "learning_rate": 3.559952568516255e-06, + "loss": 1.1631, + "step": 12608 + }, + { + "epoch": 0.38, + "learning_rate": 3.5597316521401997e-06, + "loss": 0.9899, + "step": 12609 + }, + { + "epoch": 0.38, + "learning_rate": 3.5595107256760088e-06, + "loss": 1.0768, + "step": 12610 + }, + { + "epoch": 0.38, + "learning_rate": 3.559289789125786e-06, + "loss": 1.0573, + "step": 12611 + }, + { + "epoch": 0.38, + "learning_rate": 3.5590688424916346e-06, + "loss": 1.2432, + "step": 12612 + }, + { + "epoch": 0.38, + "learning_rate": 3.5588478857756586e-06, + "loss": 1.3024, + "step": 12613 + }, + { + "epoch": 0.38, + "learning_rate": 3.55862691897996e-06, + "loss": 1.1677, + "step": 12614 + }, + { + "epoch": 0.38, + "learning_rate": 3.558405942106643e-06, + "loss": 1.1697, + "step": 12615 + }, + { + "epoch": 0.38, + "learning_rate": 3.558184955157812e-06, + "loss": 1.1329, + "step": 12616 + }, + { + "epoch": 0.38, + "learning_rate": 3.557963958135569e-06, + "loss": 1.2333, + "step": 12617 + }, + { + "epoch": 0.38, + "learning_rate": 3.557742951042019e-06, + "loss": 1.0948, + "step": 12618 + }, + { + "epoch": 0.38, + "learning_rate": 3.5575219338792656e-06, + "loss": 1.1879, + "step": 12619 + }, + { + "epoch": 0.38, + "learning_rate": 3.5573009066494125e-06, + "loss": 1.1331, + "step": 12620 + }, + { + "epoch": 0.38, + "learning_rate": 3.5570798693545637e-06, + "loss": 1.145, + "step": 12621 + }, + { + "epoch": 0.38, + "learning_rate": 3.5568588219968246e-06, + "loss": 1.0811, + "step": 12622 + }, + { + "epoch": 0.38, + "learning_rate": 3.556637764578298e-06, + "loss": 1.266, + "step": 12623 + }, + { + "epoch": 0.38, + "learning_rate": 3.556416697101088e-06, + "loss": 1.095, + "step": 12624 + }, + { + "epoch": 0.38, + "learning_rate": 3.556195619567301e-06, + "loss": 1.1003, + "step": 12625 + }, + { + "epoch": 0.38, + "learning_rate": 3.5559745319790396e-06, + "loss": 1.1427, + "step": 12626 + }, + { + "epoch": 0.38, + "learning_rate": 3.5557534343384093e-06, + "loss": 1.116, + "step": 12627 + }, + { + "epoch": 0.38, + "learning_rate": 3.555532326647515e-06, + "loss": 1.1571, + "step": 12628 + }, + { + "epoch": 0.38, + "learning_rate": 3.555311208908462e-06, + "loss": 1.158, + "step": 12629 + }, + { + "epoch": 0.38, + "learning_rate": 3.5550900811233534e-06, + "loss": 1.2047, + "step": 12630 + }, + { + "epoch": 0.38, + "learning_rate": 3.5548689432942962e-06, + "loss": 1.1459, + "step": 12631 + }, + { + "epoch": 0.38, + "learning_rate": 3.5546477954233937e-06, + "loss": 1.137, + "step": 12632 + }, + { + "epoch": 0.38, + "learning_rate": 3.5544266375127533e-06, + "loss": 1.1124, + "step": 12633 + }, + { + "epoch": 0.38, + "learning_rate": 3.5542054695644785e-06, + "loss": 1.1196, + "step": 12634 + }, + { + "epoch": 0.38, + "learning_rate": 3.5539842915806755e-06, + "loss": 1.1188, + "step": 12635 + }, + { + "epoch": 0.38, + "learning_rate": 3.5537631035634496e-06, + "loss": 1.2346, + "step": 12636 + }, + { + "epoch": 0.38, + "learning_rate": 3.553541905514907e-06, + "loss": 1.0797, + "step": 12637 + }, + { + "epoch": 0.38, + "learning_rate": 3.553320697437152e-06, + "loss": 1.0876, + "step": 12638 + }, + { + "epoch": 0.38, + "learning_rate": 3.5530994793322917e-06, + "loss": 1.0064, + "step": 12639 + }, + { + "epoch": 0.38, + "learning_rate": 3.5528782512024306e-06, + "loss": 1.0752, + "step": 12640 + }, + { + "epoch": 0.38, + "learning_rate": 3.552657013049677e-06, + "loss": 1.1032, + "step": 12641 + }, + { + "epoch": 0.38, + "learning_rate": 3.5524357648761355e-06, + "loss": 1.1923, + "step": 12642 + }, + { + "epoch": 0.38, + "learning_rate": 3.5522145066839113e-06, + "loss": 1.0286, + "step": 12643 + }, + { + "epoch": 0.38, + "learning_rate": 3.5519932384751125e-06, + "loss": 1.1705, + "step": 12644 + }, + { + "epoch": 0.38, + "learning_rate": 3.551771960251845e-06, + "loss": 1.1155, + "step": 12645 + }, + { + "epoch": 0.38, + "learning_rate": 3.5515506720162146e-06, + "loss": 1.1541, + "step": 12646 + }, + { + "epoch": 0.38, + "learning_rate": 3.551329373770328e-06, + "loss": 1.1961, + "step": 12647 + }, + { + "epoch": 0.38, + "learning_rate": 3.5511080655162934e-06, + "loss": 1.0679, + "step": 12648 + }, + { + "epoch": 0.38, + "learning_rate": 3.550886747256215e-06, + "loss": 1.1385, + "step": 12649 + }, + { + "epoch": 0.38, + "learning_rate": 3.550665418992201e-06, + "loss": 1.2548, + "step": 12650 + }, + { + "epoch": 0.38, + "learning_rate": 3.5504440807263584e-06, + "loss": 1.1277, + "step": 12651 + }, + { + "epoch": 0.38, + "learning_rate": 3.550222732460794e-06, + "loss": 1.1778, + "step": 12652 + }, + { + "epoch": 0.38, + "learning_rate": 3.550001374197615e-06, + "loss": 1.0812, + "step": 12653 + }, + { + "epoch": 0.38, + "learning_rate": 3.5497800059389285e-06, + "loss": 1.2609, + "step": 12654 + }, + { + "epoch": 0.38, + "learning_rate": 3.5495586276868423e-06, + "loss": 1.1895, + "step": 12655 + }, + { + "epoch": 0.38, + "learning_rate": 3.5493372394434625e-06, + "loss": 1.2906, + "step": 12656 + }, + { + "epoch": 0.38, + "learning_rate": 3.5491158412108987e-06, + "loss": 1.0495, + "step": 12657 + }, + { + "epoch": 0.38, + "learning_rate": 3.5488944329912566e-06, + "loss": 1.1799, + "step": 12658 + }, + { + "epoch": 0.38, + "learning_rate": 3.5486730147866456e-06, + "loss": 1.0574, + "step": 12659 + }, + { + "epoch": 0.38, + "learning_rate": 3.548451586599172e-06, + "loss": 1.1013, + "step": 12660 + }, + { + "epoch": 0.38, + "learning_rate": 3.5482301484309444e-06, + "loss": 1.0745, + "step": 12661 + }, + { + "epoch": 0.38, + "learning_rate": 3.5480087002840702e-06, + "loss": 1.1174, + "step": 12662 + }, + { + "epoch": 0.38, + "learning_rate": 3.5477872421606587e-06, + "loss": 1.2559, + "step": 12663 + }, + { + "epoch": 0.38, + "learning_rate": 3.5475657740628162e-06, + "loss": 1.1161, + "step": 12664 + }, + { + "epoch": 0.38, + "learning_rate": 3.5473442959926525e-06, + "loss": 1.108, + "step": 12665 + }, + { + "epoch": 0.38, + "learning_rate": 3.5471228079522757e-06, + "loss": 1.1876, + "step": 12666 + }, + { + "epoch": 0.38, + "learning_rate": 3.5469013099437936e-06, + "loss": 1.2356, + "step": 12667 + }, + { + "epoch": 0.38, + "learning_rate": 3.546679801969316e-06, + "loss": 1.1219, + "step": 12668 + }, + { + "epoch": 0.38, + "learning_rate": 3.5464582840309503e-06, + "loss": 1.0869, + "step": 12669 + }, + { + "epoch": 0.38, + "learning_rate": 3.546236756130806e-06, + "loss": 1.1838, + "step": 12670 + }, + { + "epoch": 0.38, + "learning_rate": 3.546015218270991e-06, + "loss": 1.1222, + "step": 12671 + }, + { + "epoch": 0.38, + "learning_rate": 3.5457936704536155e-06, + "loss": 1.0813, + "step": 12672 + }, + { + "epoch": 0.38, + "learning_rate": 3.545572112680788e-06, + "loss": 1.147, + "step": 12673 + }, + { + "epoch": 0.38, + "learning_rate": 3.5453505449546177e-06, + "loss": 1.1813, + "step": 12674 + }, + { + "epoch": 0.38, + "learning_rate": 3.545128967277213e-06, + "loss": 1.0887, + "step": 12675 + }, + { + "epoch": 0.38, + "learning_rate": 3.544907379650685e-06, + "loss": 1.097, + "step": 12676 + }, + { + "epoch": 0.38, + "learning_rate": 3.5446857820771406e-06, + "loss": 1.1533, + "step": 12677 + }, + { + "epoch": 0.38, + "learning_rate": 3.5444641745586915e-06, + "loss": 1.0654, + "step": 12678 + }, + { + "epoch": 0.38, + "learning_rate": 3.5442425570974465e-06, + "loss": 1.2966, + "step": 12679 + }, + { + "epoch": 0.38, + "learning_rate": 3.5440209296955147e-06, + "loss": 1.1907, + "step": 12680 + }, + { + "epoch": 0.38, + "learning_rate": 3.543799292355007e-06, + "loss": 1.1561, + "step": 12681 + }, + { + "epoch": 0.38, + "learning_rate": 3.5435776450780324e-06, + "loss": 1.0557, + "step": 12682 + }, + { + "epoch": 0.38, + "learning_rate": 3.543355987866702e-06, + "loss": 1.1025, + "step": 12683 + }, + { + "epoch": 0.38, + "learning_rate": 3.543134320723124e-06, + "loss": 1.1737, + "step": 12684 + }, + { + "epoch": 0.38, + "learning_rate": 3.5429126436494106e-06, + "loss": 1.098, + "step": 12685 + }, + { + "epoch": 0.38, + "learning_rate": 3.5426909566476704e-06, + "loss": 1.1094, + "step": 12686 + }, + { + "epoch": 0.38, + "learning_rate": 3.542469259720015e-06, + "loss": 1.3087, + "step": 12687 + }, + { + "epoch": 0.38, + "learning_rate": 3.5422475528685542e-06, + "loss": 1.1222, + "step": 12688 + }, + { + "epoch": 0.38, + "learning_rate": 3.5420258360953986e-06, + "loss": 1.0912, + "step": 12689 + }, + { + "epoch": 0.38, + "learning_rate": 3.541804109402659e-06, + "loss": 1.155, + "step": 12690 + }, + { + "epoch": 0.38, + "learning_rate": 3.541582372792445e-06, + "loss": 1.171, + "step": 12691 + }, + { + "epoch": 0.38, + "learning_rate": 3.54136062626687e-06, + "loss": 1.1652, + "step": 12692 + }, + { + "epoch": 0.38, + "learning_rate": 3.5411388698280426e-06, + "loss": 1.2458, + "step": 12693 + }, + { + "epoch": 0.38, + "learning_rate": 3.5409171034780744e-06, + "loss": 1.0707, + "step": 12694 + }, + { + "epoch": 0.38, + "learning_rate": 3.5406953272190774e-06, + "loss": 1.0299, + "step": 12695 + }, + { + "epoch": 0.38, + "learning_rate": 3.5404735410531613e-06, + "loss": 1.0509, + "step": 12696 + }, + { + "epoch": 0.38, + "learning_rate": 3.5402517449824384e-06, + "loss": 1.0428, + "step": 12697 + }, + { + "epoch": 0.38, + "learning_rate": 3.5400299390090203e-06, + "loss": 1.0981, + "step": 12698 + }, + { + "epoch": 0.38, + "learning_rate": 3.539808123135018e-06, + "loss": 1.1874, + "step": 12699 + }, + { + "epoch": 0.38, + "learning_rate": 3.5395862973625433e-06, + "loss": 1.2067, + "step": 12700 + }, + { + "epoch": 0.38, + "learning_rate": 3.5393644616937074e-06, + "loss": 1.0221, + "step": 12701 + }, + { + "epoch": 0.38, + "learning_rate": 3.5391426161306224e-06, + "loss": 1.1954, + "step": 12702 + }, + { + "epoch": 0.38, + "learning_rate": 3.5389207606754e-06, + "loss": 1.0615, + "step": 12703 + }, + { + "epoch": 0.38, + "learning_rate": 3.5386988953301527e-06, + "loss": 1.0917, + "step": 12704 + }, + { + "epoch": 0.38, + "learning_rate": 3.538477020096992e-06, + "loss": 1.0591, + "step": 12705 + }, + { + "epoch": 0.38, + "learning_rate": 3.53825513497803e-06, + "loss": 1.1688, + "step": 12706 + }, + { + "epoch": 0.38, + "learning_rate": 3.53803323997538e-06, + "loss": 0.9057, + "step": 12707 + }, + { + "epoch": 0.38, + "learning_rate": 3.5378113350911526e-06, + "loss": 1.1583, + "step": 12708 + }, + { + "epoch": 0.38, + "learning_rate": 3.537589420327461e-06, + "loss": 1.12, + "step": 12709 + }, + { + "epoch": 0.38, + "learning_rate": 3.537367495686418e-06, + "loss": 1.0471, + "step": 12710 + }, + { + "epoch": 0.38, + "learning_rate": 3.5371455611701367e-06, + "loss": 1.0917, + "step": 12711 + }, + { + "epoch": 0.38, + "learning_rate": 3.5369236167807286e-06, + "loss": 1.1197, + "step": 12712 + }, + { + "epoch": 0.38, + "learning_rate": 3.5367016625203076e-06, + "loss": 1.0759, + "step": 12713 + }, + { + "epoch": 0.38, + "learning_rate": 3.5364796983909855e-06, + "loss": 1.173, + "step": 12714 + }, + { + "epoch": 0.38, + "learning_rate": 3.536257724394876e-06, + "loss": 1.1839, + "step": 12715 + }, + { + "epoch": 0.38, + "learning_rate": 3.5360357405340917e-06, + "loss": 1.1812, + "step": 12716 + }, + { + "epoch": 0.38, + "learning_rate": 3.5358137468107467e-06, + "loss": 1.2395, + "step": 12717 + }, + { + "epoch": 0.38, + "learning_rate": 3.535591743226954e-06, + "loss": 1.1613, + "step": 12718 + }, + { + "epoch": 0.38, + "learning_rate": 3.5353697297848254e-06, + "loss": 1.1616, + "step": 12719 + }, + { + "epoch": 0.38, + "learning_rate": 3.535147706486477e-06, + "loss": 1.2064, + "step": 12720 + }, + { + "epoch": 0.38, + "learning_rate": 3.53492567333402e-06, + "loss": 1.0447, + "step": 12721 + }, + { + "epoch": 0.38, + "learning_rate": 3.534703630329569e-06, + "loss": 1.1985, + "step": 12722 + }, + { + "epoch": 0.38, + "learning_rate": 3.534481577475238e-06, + "loss": 1.108, + "step": 12723 + }, + { + "epoch": 0.38, + "learning_rate": 3.5342595147731413e-06, + "loss": 1.2112, + "step": 12724 + }, + { + "epoch": 0.38, + "learning_rate": 3.5340374422253913e-06, + "loss": 1.1881, + "step": 12725 + }, + { + "epoch": 0.38, + "learning_rate": 3.5338153598341037e-06, + "loss": 1.116, + "step": 12726 + }, + { + "epoch": 0.38, + "learning_rate": 3.5335932676013906e-06, + "loss": 0.9906, + "step": 12727 + }, + { + "epoch": 0.38, + "learning_rate": 3.5333711655293683e-06, + "loss": 1.0804, + "step": 12728 + }, + { + "epoch": 0.38, + "learning_rate": 3.53314905362015e-06, + "loss": 1.2641, + "step": 12729 + }, + { + "epoch": 0.38, + "learning_rate": 3.5329269318758508e-06, + "loss": 1.2264, + "step": 12730 + }, + { + "epoch": 0.38, + "learning_rate": 3.5327048002985835e-06, + "loss": 1.0438, + "step": 12731 + }, + { + "epoch": 0.38, + "learning_rate": 3.532482658890464e-06, + "loss": 1.2009, + "step": 12732 + }, + { + "epoch": 0.38, + "learning_rate": 3.5322605076536084e-06, + "loss": 1.1442, + "step": 12733 + }, + { + "epoch": 0.38, + "learning_rate": 3.532038346590128e-06, + "loss": 1.0728, + "step": 12734 + }, + { + "epoch": 0.38, + "learning_rate": 3.531816175702141e-06, + "loss": 1.095, + "step": 12735 + }, + { + "epoch": 0.38, + "learning_rate": 3.5315939949917598e-06, + "loss": 1.1334, + "step": 12736 + }, + { + "epoch": 0.38, + "learning_rate": 3.531371804461101e-06, + "loss": 1.0933, + "step": 12737 + }, + { + "epoch": 0.38, + "learning_rate": 3.5311496041122796e-06, + "loss": 1.0524, + "step": 12738 + }, + { + "epoch": 0.38, + "learning_rate": 3.530927393947411e-06, + "loss": 1.1342, + "step": 12739 + }, + { + "epoch": 0.38, + "learning_rate": 3.5307051739686092e-06, + "loss": 1.2136, + "step": 12740 + }, + { + "epoch": 0.38, + "learning_rate": 3.5304829441779916e-06, + "loss": 1.0613, + "step": 12741 + }, + { + "epoch": 0.38, + "learning_rate": 3.5302607045776715e-06, + "loss": 1.0876, + "step": 12742 + }, + { + "epoch": 0.38, + "learning_rate": 3.5300384551697665e-06, + "loss": 1.1123, + "step": 12743 + }, + { + "epoch": 0.38, + "learning_rate": 3.529816195956391e-06, + "loss": 1.1604, + "step": 12744 + }, + { + "epoch": 0.38, + "learning_rate": 3.5295939269396613e-06, + "loss": 1.1272, + "step": 12745 + }, + { + "epoch": 0.38, + "learning_rate": 3.5293716481216938e-06, + "loss": 1.1642, + "step": 12746 + }, + { + "epoch": 0.38, + "learning_rate": 3.529149359504603e-06, + "loss": 1.1254, + "step": 12747 + }, + { + "epoch": 0.38, + "learning_rate": 3.5289270610905076e-06, + "loss": 1.1977, + "step": 12748 + }, + { + "epoch": 0.38, + "learning_rate": 3.5287047528815212e-06, + "loss": 1.1073, + "step": 12749 + }, + { + "epoch": 0.38, + "learning_rate": 3.5284824348797604e-06, + "loss": 1.2683, + "step": 12750 + }, + { + "epoch": 0.38, + "learning_rate": 3.528260107087342e-06, + "loss": 1.0622, + "step": 12751 + }, + { + "epoch": 0.38, + "learning_rate": 3.528037769506384e-06, + "loss": 1.0687, + "step": 12752 + }, + { + "epoch": 0.38, + "learning_rate": 3.5278154221390004e-06, + "loss": 1.1149, + "step": 12753 + }, + { + "epoch": 0.38, + "learning_rate": 3.5275930649873102e-06, + "loss": 1.0522, + "step": 12754 + }, + { + "epoch": 0.38, + "learning_rate": 3.527370698053428e-06, + "loss": 1.0836, + "step": 12755 + }, + { + "epoch": 0.38, + "learning_rate": 3.527148321339472e-06, + "loss": 1.0834, + "step": 12756 + }, + { + "epoch": 0.38, + "learning_rate": 3.526925934847558e-06, + "loss": 1.0904, + "step": 12757 + }, + { + "epoch": 0.38, + "learning_rate": 3.5267035385798038e-06, + "loss": 1.1833, + "step": 12758 + }, + { + "epoch": 0.38, + "learning_rate": 3.526481132538327e-06, + "loss": 1.1166, + "step": 12759 + }, + { + "epoch": 0.38, + "learning_rate": 3.5262587167252438e-06, + "loss": 1.1075, + "step": 12760 + }, + { + "epoch": 0.38, + "learning_rate": 3.526036291142672e-06, + "loss": 1.1615, + "step": 12761 + }, + { + "epoch": 0.38, + "learning_rate": 3.5258138557927286e-06, + "loss": 1.1931, + "step": 12762 + }, + { + "epoch": 0.38, + "learning_rate": 3.525591410677531e-06, + "loss": 1.1714, + "step": 12763 + }, + { + "epoch": 0.38, + "learning_rate": 3.5253689557991975e-06, + "loss": 1.101, + "step": 12764 + }, + { + "epoch": 0.38, + "learning_rate": 3.525146491159846e-06, + "loss": 0.9733, + "step": 12765 + }, + { + "epoch": 0.38, + "learning_rate": 3.524924016761593e-06, + "loss": 1.212, + "step": 12766 + }, + { + "epoch": 0.38, + "learning_rate": 3.5247015326065577e-06, + "loss": 1.1415, + "step": 12767 + }, + { + "epoch": 0.38, + "learning_rate": 3.5244790386968564e-06, + "loss": 1.0754, + "step": 12768 + }, + { + "epoch": 0.38, + "learning_rate": 3.5242565350346088e-06, + "loss": 1.0306, + "step": 12769 + }, + { + "epoch": 0.38, + "learning_rate": 3.5240340216219315e-06, + "loss": 1.1735, + "step": 12770 + }, + { + "epoch": 0.38, + "learning_rate": 3.523811498460944e-06, + "loss": 1.1417, + "step": 12771 + }, + { + "epoch": 0.38, + "learning_rate": 3.523588965553764e-06, + "loss": 1.1052, + "step": 12772 + }, + { + "epoch": 0.38, + "learning_rate": 3.5233664229025098e-06, + "loss": 1.2075, + "step": 12773 + }, + { + "epoch": 0.38, + "learning_rate": 3.5231438705093013e-06, + "loss": 1.2371, + "step": 12774 + }, + { + "epoch": 0.38, + "learning_rate": 3.522921308376255e-06, + "loss": 0.986, + "step": 12775 + }, + { + "epoch": 0.38, + "learning_rate": 3.52269873650549e-06, + "loss": 1.2732, + "step": 12776 + }, + { + "epoch": 0.38, + "learning_rate": 3.5224761548991253e-06, + "loss": 1.1771, + "step": 12777 + }, + { + "epoch": 0.38, + "learning_rate": 3.5222535635592814e-06, + "loss": 1.1035, + "step": 12778 + }, + { + "epoch": 0.38, + "learning_rate": 3.522030962488075e-06, + "loss": 1.1401, + "step": 12779 + }, + { + "epoch": 0.38, + "learning_rate": 3.5218083516876266e-06, + "loss": 1.1334, + "step": 12780 + }, + { + "epoch": 0.39, + "learning_rate": 3.521585731160055e-06, + "loss": 1.1922, + "step": 12781 + }, + { + "epoch": 0.39, + "learning_rate": 3.5213631009074788e-06, + "loss": 1.1219, + "step": 12782 + }, + { + "epoch": 0.39, + "learning_rate": 3.5211404609320177e-06, + "loss": 1.188, + "step": 12783 + }, + { + "epoch": 0.39, + "learning_rate": 3.520917811235791e-06, + "loss": 1.0478, + "step": 12784 + }, + { + "epoch": 0.39, + "learning_rate": 3.5206951518209192e-06, + "loss": 1.1262, + "step": 12785 + }, + { + "epoch": 0.39, + "learning_rate": 3.5204724826895203e-06, + "loss": 1.0997, + "step": 12786 + }, + { + "epoch": 0.39, + "learning_rate": 3.520249803843716e-06, + "loss": 1.158, + "step": 12787 + }, + { + "epoch": 0.39, + "learning_rate": 3.5200271152856237e-06, + "loss": 1.2258, + "step": 12788 + }, + { + "epoch": 0.39, + "learning_rate": 3.519804417017365e-06, + "loss": 1.1532, + "step": 12789 + }, + { + "epoch": 0.39, + "learning_rate": 3.5195817090410593e-06, + "loss": 1.1434, + "step": 12790 + }, + { + "epoch": 0.39, + "learning_rate": 3.519358991358827e-06, + "loss": 1.1844, + "step": 12791 + }, + { + "epoch": 0.39, + "learning_rate": 3.5191362639727875e-06, + "loss": 1.2716, + "step": 12792 + }, + { + "epoch": 0.39, + "learning_rate": 3.5189135268850626e-06, + "loss": 1.1664, + "step": 12793 + }, + { + "epoch": 0.39, + "learning_rate": 3.5186907800977708e-06, + "loss": 1.2273, + "step": 12794 + }, + { + "epoch": 0.39, + "learning_rate": 3.518468023613034e-06, + "loss": 1.091, + "step": 12795 + }, + { + "epoch": 0.39, + "learning_rate": 3.5182452574329717e-06, + "loss": 1.0894, + "step": 12796 + }, + { + "epoch": 0.39, + "learning_rate": 3.5180224815597047e-06, + "loss": 1.1056, + "step": 12797 + }, + { + "epoch": 0.39, + "learning_rate": 3.5177996959953546e-06, + "loss": 1.174, + "step": 12798 + }, + { + "epoch": 0.39, + "learning_rate": 3.517576900742041e-06, + "loss": 1.0443, + "step": 12799 + }, + { + "epoch": 0.39, + "learning_rate": 3.5173540958018865e-06, + "loss": 1.1282, + "step": 12800 + }, + { + "epoch": 0.39, + "learning_rate": 3.5171312811770096e-06, + "loss": 1.2771, + "step": 12801 + }, + { + "epoch": 0.39, + "learning_rate": 3.516908456869534e-06, + "loss": 1.1516, + "step": 12802 + }, + { + "epoch": 0.39, + "learning_rate": 3.5166856228815786e-06, + "loss": 1.1185, + "step": 12803 + }, + { + "epoch": 0.39, + "learning_rate": 3.516462779215266e-06, + "loss": 1.0839, + "step": 12804 + }, + { + "epoch": 0.39, + "learning_rate": 3.5162399258727177e-06, + "loss": 1.0844, + "step": 12805 + }, + { + "epoch": 0.39, + "learning_rate": 3.516017062856054e-06, + "loss": 1.2119, + "step": 12806 + }, + { + "epoch": 0.39, + "learning_rate": 3.5157941901673976e-06, + "loss": 1.0508, + "step": 12807 + }, + { + "epoch": 0.39, + "learning_rate": 3.5155713078088704e-06, + "loss": 1.1942, + "step": 12808 + }, + { + "epoch": 0.39, + "learning_rate": 3.5153484157825924e-06, + "loss": 1.1257, + "step": 12809 + }, + { + "epoch": 0.39, + "learning_rate": 3.515125514090687e-06, + "loss": 1.0925, + "step": 12810 + }, + { + "epoch": 0.39, + "learning_rate": 3.5149026027352758e-06, + "loss": 1.0437, + "step": 12811 + }, + { + "epoch": 0.39, + "learning_rate": 3.5146796817184803e-06, + "loss": 1.2087, + "step": 12812 + }, + { + "epoch": 0.39, + "learning_rate": 3.514456751042423e-06, + "loss": 1.1509, + "step": 12813 + }, + { + "epoch": 0.39, + "learning_rate": 3.514233810709226e-06, + "loss": 1.1556, + "step": 12814 + }, + { + "epoch": 0.39, + "learning_rate": 3.514010860721012e-06, + "loss": 1.1281, + "step": 12815 + }, + { + "epoch": 0.39, + "learning_rate": 3.5137879010799025e-06, + "loss": 1.1232, + "step": 12816 + }, + { + "epoch": 0.39, + "learning_rate": 3.51356493178802e-06, + "loss": 1.2056, + "step": 12817 + }, + { + "epoch": 0.39, + "learning_rate": 3.513341952847488e-06, + "loss": 1.1411, + "step": 12818 + }, + { + "epoch": 0.39, + "learning_rate": 3.5131189642604292e-06, + "loss": 1.0745, + "step": 12819 + }, + { + "epoch": 0.39, + "learning_rate": 3.5128959660289646e-06, + "loss": 1.0607, + "step": 12820 + }, + { + "epoch": 0.39, + "learning_rate": 3.5126729581552194e-06, + "loss": 1.132, + "step": 12821 + }, + { + "epoch": 0.39, + "learning_rate": 3.5124499406413144e-06, + "loss": 1.0295, + "step": 12822 + }, + { + "epoch": 0.39, + "learning_rate": 3.5122269134893743e-06, + "loss": 1.1774, + "step": 12823 + }, + { + "epoch": 0.39, + "learning_rate": 3.512003876701521e-06, + "loss": 1.1486, + "step": 12824 + }, + { + "epoch": 0.39, + "learning_rate": 3.5117808302798784e-06, + "loss": 1.2402, + "step": 12825 + }, + { + "epoch": 0.39, + "learning_rate": 3.5115577742265694e-06, + "loss": 1.146, + "step": 12826 + }, + { + "epoch": 0.39, + "learning_rate": 3.511334708543718e-06, + "loss": 1.1484, + "step": 12827 + }, + { + "epoch": 0.39, + "learning_rate": 3.5111116332334472e-06, + "loss": 1.0554, + "step": 12828 + }, + { + "epoch": 0.39, + "learning_rate": 3.51088854829788e-06, + "loss": 1.1833, + "step": 12829 + }, + { + "epoch": 0.39, + "learning_rate": 3.5106654537391418e-06, + "loss": 1.1882, + "step": 12830 + }, + { + "epoch": 0.39, + "learning_rate": 3.5104423495593544e-06, + "loss": 1.1888, + "step": 12831 + }, + { + "epoch": 0.39, + "learning_rate": 3.5102192357606422e-06, + "loss": 1.1298, + "step": 12832 + }, + { + "epoch": 0.39, + "learning_rate": 3.5099961123451297e-06, + "loss": 1.1555, + "step": 12833 + }, + { + "epoch": 0.39, + "learning_rate": 3.509772979314941e-06, + "loss": 1.0938, + "step": 12834 + }, + { + "epoch": 0.39, + "learning_rate": 3.5095498366721994e-06, + "loss": 1.043, + "step": 12835 + }, + { + "epoch": 0.39, + "learning_rate": 3.50932668441903e-06, + "loss": 1.1289, + "step": 12836 + }, + { + "epoch": 0.39, + "learning_rate": 3.5091035225575563e-06, + "loss": 1.2224, + "step": 12837 + }, + { + "epoch": 0.39, + "learning_rate": 3.5088803510899028e-06, + "loss": 1.2036, + "step": 12838 + }, + { + "epoch": 0.39, + "learning_rate": 3.5086571700181954e-06, + "loss": 1.1472, + "step": 12839 + }, + { + "epoch": 0.39, + "learning_rate": 3.5084339793445563e-06, + "loss": 1.1525, + "step": 12840 + }, + { + "epoch": 0.39, + "learning_rate": 3.508210779071112e-06, + "loss": 1.0886, + "step": 12841 + }, + { + "epoch": 0.39, + "learning_rate": 3.5079875691999864e-06, + "loss": 1.1331, + "step": 12842 + }, + { + "epoch": 0.39, + "learning_rate": 3.507764349733305e-06, + "loss": 1.1697, + "step": 12843 + }, + { + "epoch": 0.39, + "learning_rate": 3.5075411206731925e-06, + "loss": 1.1791, + "step": 12844 + }, + { + "epoch": 0.39, + "learning_rate": 3.507317882021773e-06, + "loss": 1.2053, + "step": 12845 + }, + { + "epoch": 0.39, + "learning_rate": 3.507094633781173e-06, + "loss": 1.1106, + "step": 12846 + }, + { + "epoch": 0.39, + "learning_rate": 3.5068713759535167e-06, + "loss": 1.1509, + "step": 12847 + }, + { + "epoch": 0.39, + "learning_rate": 3.5066481085409297e-06, + "loss": 1.2367, + "step": 12848 + }, + { + "epoch": 0.39, + "learning_rate": 3.5064248315455383e-06, + "loss": 0.9528, + "step": 12849 + }, + { + "epoch": 0.39, + "learning_rate": 3.5062015449694666e-06, + "loss": 1.2608, + "step": 12850 + }, + { + "epoch": 0.39, + "learning_rate": 3.505978248814841e-06, + "loss": 1.1544, + "step": 12851 + }, + { + "epoch": 0.39, + "learning_rate": 3.5057549430837873e-06, + "loss": 1.1575, + "step": 12852 + }, + { + "epoch": 0.39, + "learning_rate": 3.5055316277784303e-06, + "loss": 1.1855, + "step": 12853 + }, + { + "epoch": 0.39, + "learning_rate": 3.505308302900897e-06, + "loss": 1.1901, + "step": 12854 + }, + { + "epoch": 0.39, + "learning_rate": 3.5050849684533124e-06, + "loss": 1.1942, + "step": 12855 + }, + { + "epoch": 0.39, + "learning_rate": 3.5048616244378036e-06, + "loss": 1.1652, + "step": 12856 + }, + { + "epoch": 0.39, + "learning_rate": 3.504638270856495e-06, + "loss": 1.0707, + "step": 12857 + }, + { + "epoch": 0.39, + "learning_rate": 3.5044149077115147e-06, + "loss": 1.1098, + "step": 12858 + }, + { + "epoch": 0.39, + "learning_rate": 3.5041915350049875e-06, + "loss": 1.1591, + "step": 12859 + }, + { + "epoch": 0.39, + "learning_rate": 3.5039681527390417e-06, + "loss": 1.1727, + "step": 12860 + }, + { + "epoch": 0.39, + "learning_rate": 3.5037447609158016e-06, + "loss": 1.2108, + "step": 12861 + }, + { + "epoch": 0.39, + "learning_rate": 3.503521359537396e-06, + "loss": 1.1376, + "step": 12862 + }, + { + "epoch": 0.39, + "learning_rate": 3.5032979486059493e-06, + "loss": 1.0881, + "step": 12863 + }, + { + "epoch": 0.39, + "learning_rate": 3.5030745281235888e-06, + "loss": 1.2238, + "step": 12864 + }, + { + "epoch": 0.39, + "learning_rate": 3.5028510980924437e-06, + "loss": 1.1534, + "step": 12865 + }, + { + "epoch": 0.39, + "learning_rate": 3.502627658514638e-06, + "loss": 1.1005, + "step": 12866 + }, + { + "epoch": 0.39, + "learning_rate": 3.5024042093923e-06, + "loss": 1.2382, + "step": 12867 + }, + { + "epoch": 0.39, + "learning_rate": 3.5021807507275564e-06, + "loss": 1.1747, + "step": 12868 + }, + { + "epoch": 0.39, + "learning_rate": 3.501957282522536e-06, + "loss": 1.2826, + "step": 12869 + }, + { + "epoch": 0.39, + "learning_rate": 3.501733804779363e-06, + "loss": 1.1226, + "step": 12870 + }, + { + "epoch": 0.39, + "learning_rate": 3.501510317500168e-06, + "loss": 1.1357, + "step": 12871 + }, + { + "epoch": 0.39, + "learning_rate": 3.5012868206870766e-06, + "loss": 1.1573, + "step": 12872 + }, + { + "epoch": 0.39, + "learning_rate": 3.501063314342217e-06, + "loss": 1.1771, + "step": 12873 + }, + { + "epoch": 0.39, + "learning_rate": 3.500839798467716e-06, + "loss": 1.111, + "step": 12874 + }, + { + "epoch": 0.39, + "learning_rate": 3.5006162730657035e-06, + "loss": 1.2794, + "step": 12875 + }, + { + "epoch": 0.39, + "learning_rate": 3.5003927381383045e-06, + "loss": 1.1602, + "step": 12876 + }, + { + "epoch": 0.39, + "learning_rate": 3.500169193687649e-06, + "loss": 1.0966, + "step": 12877 + }, + { + "epoch": 0.39, + "learning_rate": 3.4999456397158655e-06, + "loss": 1.1699, + "step": 12878 + }, + { + "epoch": 0.39, + "learning_rate": 3.49972207622508e-06, + "loss": 1.1322, + "step": 12879 + }, + { + "epoch": 0.39, + "learning_rate": 3.4994985032174222e-06, + "loss": 1.0244, + "step": 12880 + }, + { + "epoch": 0.39, + "learning_rate": 3.49927492069502e-06, + "loss": 1.3572, + "step": 12881 + }, + { + "epoch": 0.39, + "learning_rate": 3.4990513286600027e-06, + "loss": 1.0399, + "step": 12882 + }, + { + "epoch": 0.39, + "learning_rate": 3.4988277271144966e-06, + "loss": 1.0788, + "step": 12883 + }, + { + "epoch": 0.39, + "learning_rate": 3.4986041160606323e-06, + "loss": 1.0488, + "step": 12884 + }, + { + "epoch": 0.39, + "learning_rate": 3.4983804955005367e-06, + "loss": 1.1099, + "step": 12885 + }, + { + "epoch": 0.39, + "learning_rate": 3.4981568654363405e-06, + "loss": 1.1749, + "step": 12886 + }, + { + "epoch": 0.39, + "learning_rate": 3.4979332258701715e-06, + "loss": 1.1776, + "step": 12887 + }, + { + "epoch": 0.39, + "learning_rate": 3.497709576804159e-06, + "loss": 1.2434, + "step": 12888 + }, + { + "epoch": 0.39, + "learning_rate": 3.4974859182404315e-06, + "loss": 1.1525, + "step": 12889 + }, + { + "epoch": 0.39, + "learning_rate": 3.497262250181118e-06, + "loss": 1.1626, + "step": 12890 + }, + { + "epoch": 0.39, + "learning_rate": 3.4970385726283497e-06, + "loss": 1.0375, + "step": 12891 + }, + { + "epoch": 0.39, + "learning_rate": 3.496814885584253e-06, + "loss": 1.251, + "step": 12892 + }, + { + "epoch": 0.39, + "learning_rate": 3.4965911890509594e-06, + "loss": 1.1008, + "step": 12893 + }, + { + "epoch": 0.39, + "learning_rate": 3.4963674830305978e-06, + "loss": 1.0565, + "step": 12894 + }, + { + "epoch": 0.39, + "learning_rate": 3.4961437675252976e-06, + "loss": 1.1668, + "step": 12895 + }, + { + "epoch": 0.39, + "learning_rate": 3.4959200425371874e-06, + "loss": 1.1395, + "step": 12896 + }, + { + "epoch": 0.39, + "learning_rate": 3.4956963080683996e-06, + "loss": 1.1106, + "step": 12897 + }, + { + "epoch": 0.39, + "learning_rate": 3.495472564121061e-06, + "loss": 1.1335, + "step": 12898 + }, + { + "epoch": 0.39, + "learning_rate": 3.4952488106973036e-06, + "loss": 1.1139, + "step": 12899 + }, + { + "epoch": 0.39, + "learning_rate": 3.4950250477992577e-06, + "loss": 1.1984, + "step": 12900 + }, + { + "epoch": 0.39, + "learning_rate": 3.494801275429052e-06, + "loss": 1.1599, + "step": 12901 + }, + { + "epoch": 0.39, + "learning_rate": 3.4945774935888166e-06, + "loss": 1.064, + "step": 12902 + }, + { + "epoch": 0.39, + "learning_rate": 3.494353702280683e-06, + "loss": 1.1275, + "step": 12903 + }, + { + "epoch": 0.39, + "learning_rate": 3.4941299015067807e-06, + "loss": 1.1646, + "step": 12904 + }, + { + "epoch": 0.39, + "learning_rate": 3.493906091269241e-06, + "loss": 1.1263, + "step": 12905 + }, + { + "epoch": 0.39, + "learning_rate": 3.4936822715701945e-06, + "loss": 1.1837, + "step": 12906 + }, + { + "epoch": 0.39, + "learning_rate": 3.49345844241177e-06, + "loss": 1.1188, + "step": 12907 + }, + { + "epoch": 0.39, + "learning_rate": 3.4932346037961006e-06, + "loss": 1.2433, + "step": 12908 + }, + { + "epoch": 0.39, + "learning_rate": 3.4930107557253156e-06, + "loss": 1.1089, + "step": 12909 + }, + { + "epoch": 0.39, + "learning_rate": 3.492786898201547e-06, + "loss": 1.0659, + "step": 12910 + }, + { + "epoch": 0.39, + "learning_rate": 3.4925630312269253e-06, + "loss": 1.0608, + "step": 12911 + }, + { + "epoch": 0.39, + "learning_rate": 3.4923391548035814e-06, + "loss": 1.1425, + "step": 12912 + }, + { + "epoch": 0.39, + "learning_rate": 3.492115268933646e-06, + "loss": 1.1066, + "step": 12913 + }, + { + "epoch": 0.39, + "learning_rate": 3.4918913736192517e-06, + "loss": 1.0202, + "step": 12914 + }, + { + "epoch": 0.39, + "learning_rate": 3.491667468862529e-06, + "loss": 1.0333, + "step": 12915 + }, + { + "epoch": 0.39, + "learning_rate": 3.49144355466561e-06, + "loss": 1.0766, + "step": 12916 + }, + { + "epoch": 0.39, + "learning_rate": 3.491219631030625e-06, + "loss": 1.1796, + "step": 12917 + }, + { + "epoch": 0.39, + "learning_rate": 3.490995697959707e-06, + "loss": 1.1696, + "step": 12918 + }, + { + "epoch": 0.39, + "learning_rate": 3.4907717554549882e-06, + "loss": 1.1546, + "step": 12919 + }, + { + "epoch": 0.39, + "learning_rate": 3.490547803518598e-06, + "loss": 1.1542, + "step": 12920 + }, + { + "epoch": 0.39, + "learning_rate": 3.4903238421526706e-06, + "loss": 1.0907, + "step": 12921 + }, + { + "epoch": 0.39, + "learning_rate": 3.4900998713593367e-06, + "loss": 1.2152, + "step": 12922 + }, + { + "epoch": 0.39, + "learning_rate": 3.489875891140729e-06, + "loss": 1.135, + "step": 12923 + }, + { + "epoch": 0.39, + "learning_rate": 3.48965190149898e-06, + "loss": 1.1099, + "step": 12924 + }, + { + "epoch": 0.39, + "learning_rate": 3.489427902436221e-06, + "loss": 1.1409, + "step": 12925 + }, + { + "epoch": 0.39, + "learning_rate": 3.4892038939545854e-06, + "loss": 1.2159, + "step": 12926 + }, + { + "epoch": 0.39, + "learning_rate": 3.4889798760562043e-06, + "loss": 1.0767, + "step": 12927 + }, + { + "epoch": 0.39, + "learning_rate": 3.4887558487432116e-06, + "loss": 1.1139, + "step": 12928 + }, + { + "epoch": 0.39, + "learning_rate": 3.4885318120177398e-06, + "loss": 1.0987, + "step": 12929 + }, + { + "epoch": 0.39, + "learning_rate": 3.4883077658819204e-06, + "loss": 1.1414, + "step": 12930 + }, + { + "epoch": 0.39, + "learning_rate": 3.4880837103378875e-06, + "loss": 1.2441, + "step": 12931 + }, + { + "epoch": 0.39, + "learning_rate": 3.487859645387774e-06, + "loss": 1.1537, + "step": 12932 + }, + { + "epoch": 0.39, + "learning_rate": 3.4876355710337117e-06, + "loss": 1.186, + "step": 12933 + }, + { + "epoch": 0.39, + "learning_rate": 3.4874114872778345e-06, + "loss": 1.149, + "step": 12934 + }, + { + "epoch": 0.39, + "learning_rate": 3.4871873941222756e-06, + "loss": 1.1317, + "step": 12935 + }, + { + "epoch": 0.39, + "learning_rate": 3.4869632915691686e-06, + "loss": 1.1406, + "step": 12936 + }, + { + "epoch": 0.39, + "learning_rate": 3.4867391796206464e-06, + "loss": 0.973, + "step": 12937 + }, + { + "epoch": 0.39, + "learning_rate": 3.486515058278842e-06, + "loss": 1.1524, + "step": 12938 + }, + { + "epoch": 0.39, + "learning_rate": 3.4862909275458896e-06, + "loss": 1.2191, + "step": 12939 + }, + { + "epoch": 0.39, + "learning_rate": 3.4860667874239225e-06, + "loss": 1.1203, + "step": 12940 + }, + { + "epoch": 0.39, + "learning_rate": 3.485842637915074e-06, + "loss": 1.098, + "step": 12941 + }, + { + "epoch": 0.39, + "learning_rate": 3.485618479021479e-06, + "loss": 1.1069, + "step": 12942 + }, + { + "epoch": 0.39, + "learning_rate": 3.4853943107452704e-06, + "loss": 1.1184, + "step": 12943 + }, + { + "epoch": 0.39, + "learning_rate": 3.4851701330885828e-06, + "loss": 1.1972, + "step": 12944 + }, + { + "epoch": 0.39, + "learning_rate": 3.48494594605355e-06, + "loss": 1.261, + "step": 12945 + }, + { + "epoch": 0.39, + "learning_rate": 3.4847217496423062e-06, + "loss": 1.1406, + "step": 12946 + }, + { + "epoch": 0.39, + "learning_rate": 3.484497543856986e-06, + "loss": 1.1389, + "step": 12947 + }, + { + "epoch": 0.39, + "learning_rate": 3.4842733286997225e-06, + "loss": 1.2441, + "step": 12948 + }, + { + "epoch": 0.39, + "learning_rate": 3.4840491041726514e-06, + "loss": 1.0935, + "step": 12949 + }, + { + "epoch": 0.39, + "learning_rate": 3.4838248702779066e-06, + "loss": 1.0865, + "step": 12950 + }, + { + "epoch": 0.39, + "learning_rate": 3.4836006270176236e-06, + "loss": 1.0657, + "step": 12951 + }, + { + "epoch": 0.39, + "learning_rate": 3.483376374393935e-06, + "loss": 1.0892, + "step": 12952 + }, + { + "epoch": 0.39, + "learning_rate": 3.4831521124089783e-06, + "loss": 1.0846, + "step": 12953 + }, + { + "epoch": 0.39, + "learning_rate": 3.482927841064886e-06, + "loss": 1.09, + "step": 12954 + }, + { + "epoch": 0.39, + "learning_rate": 3.4827035603637942e-06, + "loss": 1.2578, + "step": 12955 + }, + { + "epoch": 0.39, + "learning_rate": 3.482479270307838e-06, + "loss": 1.0939, + "step": 12956 + }, + { + "epoch": 0.39, + "learning_rate": 3.482254970899152e-06, + "loss": 1.0418, + "step": 12957 + }, + { + "epoch": 0.39, + "learning_rate": 3.4820306621398726e-06, + "loss": 1.1382, + "step": 12958 + }, + { + "epoch": 0.39, + "learning_rate": 3.481806344032133e-06, + "loss": 0.9881, + "step": 12959 + }, + { + "epoch": 0.39, + "learning_rate": 3.481582016578071e-06, + "loss": 1.0876, + "step": 12960 + }, + { + "epoch": 0.39, + "learning_rate": 3.4813576797798206e-06, + "loss": 1.2086, + "step": 12961 + }, + { + "epoch": 0.39, + "learning_rate": 3.4811333336395176e-06, + "loss": 1.1804, + "step": 12962 + }, + { + "epoch": 0.39, + "learning_rate": 3.4809089781592974e-06, + "loss": 1.05, + "step": 12963 + }, + { + "epoch": 0.39, + "learning_rate": 3.480684613341297e-06, + "loss": 1.0497, + "step": 12964 + }, + { + "epoch": 0.39, + "learning_rate": 3.4804602391876507e-06, + "loss": 0.9976, + "step": 12965 + }, + { + "epoch": 0.39, + "learning_rate": 3.4802358557004957e-06, + "loss": 1.2047, + "step": 12966 + }, + { + "epoch": 0.39, + "learning_rate": 3.480011462881967e-06, + "loss": 1.1429, + "step": 12967 + }, + { + "epoch": 0.39, + "learning_rate": 3.479787060734201e-06, + "loss": 1.1224, + "step": 12968 + }, + { + "epoch": 0.39, + "learning_rate": 3.4795626492593344e-06, + "loss": 1.1367, + "step": 12969 + }, + { + "epoch": 0.39, + "learning_rate": 3.4793382284595027e-06, + "loss": 1.0373, + "step": 12970 + }, + { + "epoch": 0.39, + "learning_rate": 3.479113798336844e-06, + "loss": 1.1185, + "step": 12971 + }, + { + "epoch": 0.39, + "learning_rate": 3.4788893588934923e-06, + "loss": 1.0435, + "step": 12972 + }, + { + "epoch": 0.39, + "learning_rate": 3.478664910131586e-06, + "loss": 1.1738, + "step": 12973 + }, + { + "epoch": 0.39, + "learning_rate": 3.4784404520532604e-06, + "loss": 1.2348, + "step": 12974 + }, + { + "epoch": 0.39, + "learning_rate": 3.4782159846606535e-06, + "loss": 1.0502, + "step": 12975 + }, + { + "epoch": 0.39, + "learning_rate": 3.477991507955901e-06, + "loss": 1.1012, + "step": 12976 + }, + { + "epoch": 0.39, + "learning_rate": 3.4777670219411414e-06, + "loss": 1.149, + "step": 12977 + }, + { + "epoch": 0.39, + "learning_rate": 3.47754252661851e-06, + "loss": 1.0762, + "step": 12978 + }, + { + "epoch": 0.39, + "learning_rate": 3.477318021990145e-06, + "loss": 1.2213, + "step": 12979 + }, + { + "epoch": 0.39, + "learning_rate": 3.4770935080581826e-06, + "loss": 1.2108, + "step": 12980 + }, + { + "epoch": 0.39, + "learning_rate": 3.47686898482476e-06, + "loss": 1.1461, + "step": 12981 + }, + { + "epoch": 0.39, + "learning_rate": 3.4766444522920157e-06, + "loss": 1.0872, + "step": 12982 + }, + { + "epoch": 0.39, + "learning_rate": 3.4764199104620864e-06, + "loss": 1.2036, + "step": 12983 + }, + { + "epoch": 0.39, + "learning_rate": 3.47619535933711e-06, + "loss": 1.0948, + "step": 12984 + }, + { + "epoch": 0.39, + "learning_rate": 3.4759707989192243e-06, + "loss": 1.059, + "step": 12985 + }, + { + "epoch": 0.39, + "learning_rate": 3.4757462292105664e-06, + "loss": 1.1663, + "step": 12986 + }, + { + "epoch": 0.39, + "learning_rate": 3.4755216502132744e-06, + "loss": 1.1074, + "step": 12987 + }, + { + "epoch": 0.39, + "learning_rate": 3.4752970619294863e-06, + "loss": 1.141, + "step": 12988 + }, + { + "epoch": 0.39, + "learning_rate": 3.4750724643613392e-06, + "loss": 1.1216, + "step": 12989 + }, + { + "epoch": 0.39, + "learning_rate": 3.474847857510973e-06, + "loss": 1.0673, + "step": 12990 + }, + { + "epoch": 0.39, + "learning_rate": 3.4746232413805237e-06, + "loss": 1.0458, + "step": 12991 + }, + { + "epoch": 0.39, + "learning_rate": 3.474398615972131e-06, + "loss": 1.1592, + "step": 12992 + }, + { + "epoch": 0.39, + "learning_rate": 3.474173981287932e-06, + "loss": 1.1157, + "step": 12993 + }, + { + "epoch": 0.39, + "learning_rate": 3.473949337330067e-06, + "loss": 1.2185, + "step": 12994 + }, + { + "epoch": 0.39, + "learning_rate": 3.473724684100672e-06, + "loss": 1.156, + "step": 12995 + }, + { + "epoch": 0.39, + "learning_rate": 3.4735000216018883e-06, + "loss": 1.1496, + "step": 12996 + }, + { + "epoch": 0.39, + "learning_rate": 3.4732753498358522e-06, + "loss": 1.194, + "step": 12997 + }, + { + "epoch": 0.39, + "learning_rate": 3.4730506688047038e-06, + "loss": 1.2562, + "step": 12998 + }, + { + "epoch": 0.39, + "learning_rate": 3.472825978510582e-06, + "loss": 1.2246, + "step": 12999 + }, + { + "epoch": 0.39, + "learning_rate": 3.4726012789556257e-06, + "loss": 1.2668, + "step": 13000 + }, + { + "epoch": 0.39, + "learning_rate": 3.4723765701419732e-06, + "loss": 1.104, + "step": 13001 + }, + { + "epoch": 0.39, + "learning_rate": 3.472151852071764e-06, + "loss": 1.0623, + "step": 13002 + }, + { + "epoch": 0.39, + "learning_rate": 3.471927124747138e-06, + "loss": 1.1057, + "step": 13003 + }, + { + "epoch": 0.39, + "learning_rate": 3.4717023881702332e-06, + "loss": 1.152, + "step": 13004 + }, + { + "epoch": 0.39, + "learning_rate": 3.47147764234319e-06, + "loss": 1.2186, + "step": 13005 + }, + { + "epoch": 0.39, + "learning_rate": 3.4712528872681473e-06, + "loss": 1.1698, + "step": 13006 + }, + { + "epoch": 0.39, + "learning_rate": 3.4710281229472455e-06, + "loss": 1.0957, + "step": 13007 + }, + { + "epoch": 0.39, + "learning_rate": 3.4708033493826226e-06, + "loss": 1.1307, + "step": 13008 + }, + { + "epoch": 0.39, + "learning_rate": 3.4705785665764197e-06, + "loss": 1.2391, + "step": 13009 + }, + { + "epoch": 0.39, + "learning_rate": 3.470353774530776e-06, + "loss": 1.1578, + "step": 13010 + }, + { + "epoch": 0.39, + "learning_rate": 3.470128973247832e-06, + "loss": 1.2556, + "step": 13011 + }, + { + "epoch": 0.39, + "learning_rate": 3.4699041627297283e-06, + "loss": 1.2441, + "step": 13012 + }, + { + "epoch": 0.39, + "learning_rate": 3.4696793429786024e-06, + "loss": 1.1851, + "step": 13013 + }, + { + "epoch": 0.39, + "learning_rate": 3.4694545139965974e-06, + "loss": 1.0704, + "step": 13014 + }, + { + "epoch": 0.39, + "learning_rate": 3.4692296757858525e-06, + "loss": 1.1176, + "step": 13015 + }, + { + "epoch": 0.39, + "learning_rate": 3.4690048283485074e-06, + "loss": 1.1026, + "step": 13016 + }, + { + "epoch": 0.39, + "learning_rate": 3.4687799716867028e-06, + "loss": 1.2176, + "step": 13017 + }, + { + "epoch": 0.39, + "learning_rate": 3.46855510580258e-06, + "loss": 1.1631, + "step": 13018 + }, + { + "epoch": 0.39, + "learning_rate": 3.4683302306982784e-06, + "loss": 1.0754, + "step": 13019 + }, + { + "epoch": 0.39, + "learning_rate": 3.46810534637594e-06, + "loss": 1.1805, + "step": 13020 + }, + { + "epoch": 0.39, + "learning_rate": 3.4678804528377047e-06, + "loss": 1.127, + "step": 13021 + }, + { + "epoch": 0.39, + "learning_rate": 3.4676555500857136e-06, + "loss": 1.0577, + "step": 13022 + }, + { + "epoch": 0.39, + "learning_rate": 3.4674306381221074e-06, + "loss": 1.1419, + "step": 13023 + }, + { + "epoch": 0.39, + "learning_rate": 3.467205716949028e-06, + "loss": 1.128, + "step": 13024 + }, + { + "epoch": 0.39, + "learning_rate": 3.4669807865686157e-06, + "loss": 1.0308, + "step": 13025 + }, + { + "epoch": 0.39, + "learning_rate": 3.466755846983012e-06, + "loss": 1.1111, + "step": 13026 + }, + { + "epoch": 0.39, + "learning_rate": 3.4665308981943583e-06, + "loss": 1.1439, + "step": 13027 + }, + { + "epoch": 0.39, + "learning_rate": 3.466305940204796e-06, + "loss": 1.1375, + "step": 13028 + }, + { + "epoch": 0.39, + "learning_rate": 3.466080973016467e-06, + "loss": 0.9979, + "step": 13029 + }, + { + "epoch": 0.39, + "learning_rate": 3.4658559966315115e-06, + "loss": 1.0165, + "step": 13030 + }, + { + "epoch": 0.39, + "learning_rate": 3.465631011052073e-06, + "loss": 1.2375, + "step": 13031 + }, + { + "epoch": 0.39, + "learning_rate": 3.4654060162802918e-06, + "loss": 1.2238, + "step": 13032 + }, + { + "epoch": 0.39, + "learning_rate": 3.4651810123183104e-06, + "loss": 1.1254, + "step": 13033 + }, + { + "epoch": 0.39, + "learning_rate": 3.4649559991682703e-06, + "loss": 1.0142, + "step": 13034 + }, + { + "epoch": 0.39, + "learning_rate": 3.4647309768323147e-06, + "loss": 1.1145, + "step": 13035 + }, + { + "epoch": 0.39, + "learning_rate": 3.464505945312584e-06, + "loss": 1.0945, + "step": 13036 + }, + { + "epoch": 0.39, + "learning_rate": 3.464280904611221e-06, + "loss": 1.1427, + "step": 13037 + }, + { + "epoch": 0.39, + "learning_rate": 3.4640558547303683e-06, + "loss": 1.0853, + "step": 13038 + }, + { + "epoch": 0.39, + "learning_rate": 3.4638307956721683e-06, + "loss": 1.1553, + "step": 13039 + }, + { + "epoch": 0.39, + "learning_rate": 3.4636057274387642e-06, + "loss": 1.2469, + "step": 13040 + }, + { + "epoch": 0.39, + "learning_rate": 3.4633806500322966e-06, + "loss": 1.1013, + "step": 13041 + }, + { + "epoch": 0.39, + "learning_rate": 3.4631555634549096e-06, + "loss": 1.2518, + "step": 13042 + }, + { + "epoch": 0.39, + "learning_rate": 3.4629304677087455e-06, + "loss": 1.0541, + "step": 13043 + }, + { + "epoch": 0.39, + "learning_rate": 3.462705362795947e-06, + "loss": 1.2051, + "step": 13044 + }, + { + "epoch": 0.39, + "learning_rate": 3.462480248718657e-06, + "loss": 1.1212, + "step": 13045 + }, + { + "epoch": 0.39, + "learning_rate": 3.462255125479019e-06, + "loss": 1.0823, + "step": 13046 + }, + { + "epoch": 0.39, + "learning_rate": 3.4620299930791755e-06, + "loss": 1.2076, + "step": 13047 + }, + { + "epoch": 0.39, + "learning_rate": 3.4618048515212704e-06, + "loss": 1.0881, + "step": 13048 + }, + { + "epoch": 0.39, + "learning_rate": 3.4615797008074452e-06, + "loss": 1.1683, + "step": 13049 + }, + { + "epoch": 0.39, + "learning_rate": 3.4613545409398447e-06, + "loss": 1.1501, + "step": 13050 + }, + { + "epoch": 0.39, + "learning_rate": 3.461129371920612e-06, + "loss": 1.1521, + "step": 13051 + }, + { + "epoch": 0.39, + "learning_rate": 3.4609041937518904e-06, + "loss": 1.1057, + "step": 13052 + }, + { + "epoch": 0.39, + "learning_rate": 3.4606790064358243e-06, + "loss": 1.2153, + "step": 13053 + }, + { + "epoch": 0.39, + "learning_rate": 3.460453809974556e-06, + "loss": 1.114, + "step": 13054 + }, + { + "epoch": 0.39, + "learning_rate": 3.4602286043702304e-06, + "loss": 1.0911, + "step": 13055 + }, + { + "epoch": 0.39, + "learning_rate": 3.4600033896249907e-06, + "loss": 1.0635, + "step": 13056 + }, + { + "epoch": 0.39, + "learning_rate": 3.4597781657409817e-06, + "loss": 1.1529, + "step": 13057 + }, + { + "epoch": 0.39, + "learning_rate": 3.4595529327203463e-06, + "loss": 1.0875, + "step": 13058 + }, + { + "epoch": 0.39, + "learning_rate": 3.4593276905652297e-06, + "loss": 1.0488, + "step": 13059 + }, + { + "epoch": 0.39, + "learning_rate": 3.459102439277775e-06, + "loss": 1.2125, + "step": 13060 + }, + { + "epoch": 0.39, + "learning_rate": 3.4588771788601273e-06, + "loss": 1.0454, + "step": 13061 + }, + { + "epoch": 0.39, + "learning_rate": 3.45865190931443e-06, + "loss": 1.0284, + "step": 13062 + }, + { + "epoch": 0.39, + "learning_rate": 3.458426630642828e-06, + "loss": 1.1139, + "step": 13063 + }, + { + "epoch": 0.39, + "learning_rate": 3.458201342847467e-06, + "loss": 1.1198, + "step": 13064 + }, + { + "epoch": 0.39, + "learning_rate": 3.4579760459304903e-06, + "loss": 1.1648, + "step": 13065 + }, + { + "epoch": 0.39, + "learning_rate": 3.4577507398940436e-06, + "loss": 1.1305, + "step": 13066 + }, + { + "epoch": 0.39, + "learning_rate": 3.45752542474027e-06, + "loss": 1.1758, + "step": 13067 + }, + { + "epoch": 0.39, + "learning_rate": 3.457300100471317e-06, + "loss": 1.1464, + "step": 13068 + }, + { + "epoch": 0.39, + "learning_rate": 3.4570747670893268e-06, + "loss": 1.1947, + "step": 13069 + }, + { + "epoch": 0.39, + "learning_rate": 3.456849424596446e-06, + "loss": 1.0255, + "step": 13070 + }, + { + "epoch": 0.39, + "learning_rate": 3.4566240729948196e-06, + "loss": 1.1669, + "step": 13071 + }, + { + "epoch": 0.39, + "learning_rate": 3.4563987122865936e-06, + "loss": 1.0193, + "step": 13072 + }, + { + "epoch": 0.39, + "learning_rate": 3.4561733424739112e-06, + "loss": 1.1205, + "step": 13073 + }, + { + "epoch": 0.39, + "learning_rate": 3.45594796355892e-06, + "loss": 1.3475, + "step": 13074 + }, + { + "epoch": 0.39, + "learning_rate": 3.455722575543764e-06, + "loss": 1.2115, + "step": 13075 + }, + { + "epoch": 0.39, + "learning_rate": 3.4554971784305895e-06, + "loss": 1.2199, + "step": 13076 + }, + { + "epoch": 0.39, + "learning_rate": 3.455271772221542e-06, + "loss": 1.1525, + "step": 13077 + }, + { + "epoch": 0.39, + "learning_rate": 3.4550463569187677e-06, + "loss": 1.1382, + "step": 13078 + }, + { + "epoch": 0.39, + "learning_rate": 3.454820932524412e-06, + "loss": 1.1647, + "step": 13079 + }, + { + "epoch": 0.39, + "learning_rate": 3.4545954990406205e-06, + "loss": 1.1359, + "step": 13080 + }, + { + "epoch": 0.39, + "learning_rate": 3.4543700564695397e-06, + "loss": 1.2172, + "step": 13081 + }, + { + "epoch": 0.39, + "learning_rate": 3.4541446048133152e-06, + "loss": 1.2517, + "step": 13082 + }, + { + "epoch": 0.39, + "learning_rate": 3.4539191440740947e-06, + "loss": 1.1028, + "step": 13083 + }, + { + "epoch": 0.39, + "learning_rate": 3.453693674254023e-06, + "loss": 1.0032, + "step": 13084 + }, + { + "epoch": 0.39, + "learning_rate": 3.4534681953552464e-06, + "loss": 1.1021, + "step": 13085 + }, + { + "epoch": 0.39, + "learning_rate": 3.453242707379912e-06, + "loss": 1.2041, + "step": 13086 + }, + { + "epoch": 0.39, + "learning_rate": 3.4530172103301664e-06, + "loss": 1.1219, + "step": 13087 + }, + { + "epoch": 0.39, + "learning_rate": 3.4527917042081556e-06, + "loss": 1.1642, + "step": 13088 + }, + { + "epoch": 0.39, + "learning_rate": 3.452566189016026e-06, + "loss": 1.1605, + "step": 13089 + }, + { + "epoch": 0.39, + "learning_rate": 3.4523406647559266e-06, + "loss": 1.1141, + "step": 13090 + }, + { + "epoch": 0.39, + "learning_rate": 3.4521151314300017e-06, + "loss": 1.1785, + "step": 13091 + }, + { + "epoch": 0.39, + "learning_rate": 3.451889589040399e-06, + "loss": 1.2239, + "step": 13092 + }, + { + "epoch": 0.39, + "learning_rate": 3.4516640375892662e-06, + "loss": 1.1445, + "step": 13093 + }, + { + "epoch": 0.39, + "learning_rate": 3.45143847707875e-06, + "loss": 1.1456, + "step": 13094 + }, + { + "epoch": 0.39, + "learning_rate": 3.451212907510998e-06, + "loss": 1.1757, + "step": 13095 + }, + { + "epoch": 0.39, + "learning_rate": 3.450987328888158e-06, + "loss": 1.129, + "step": 13096 + }, + { + "epoch": 0.39, + "learning_rate": 3.450761741212375e-06, + "loss": 1.1645, + "step": 13097 + }, + { + "epoch": 0.39, + "learning_rate": 3.4505361444857997e-06, + "loss": 1.0592, + "step": 13098 + }, + { + "epoch": 0.39, + "learning_rate": 3.4503105387105773e-06, + "loss": 1.165, + "step": 13099 + }, + { + "epoch": 0.39, + "learning_rate": 3.4500849238888567e-06, + "loss": 1.2172, + "step": 13100 + }, + { + "epoch": 0.39, + "learning_rate": 3.4498593000227843e-06, + "loss": 1.1033, + "step": 13101 + }, + { + "epoch": 0.39, + "learning_rate": 3.4496336671145098e-06, + "loss": 1.1747, + "step": 13102 + }, + { + "epoch": 0.39, + "learning_rate": 3.449408025166179e-06, + "loss": 1.0286, + "step": 13103 + }, + { + "epoch": 0.39, + "learning_rate": 3.4491823741799417e-06, + "loss": 1.1921, + "step": 13104 + }, + { + "epoch": 0.39, + "learning_rate": 3.4489567141579456e-06, + "loss": 1.1152, + "step": 13105 + }, + { + "epoch": 0.39, + "learning_rate": 3.448731045102338e-06, + "loss": 1.0801, + "step": 13106 + }, + { + "epoch": 0.39, + "learning_rate": 3.4485053670152684e-06, + "loss": 1.2043, + "step": 13107 + }, + { + "epoch": 0.39, + "learning_rate": 3.4482796798988842e-06, + "loss": 1.084, + "step": 13108 + }, + { + "epoch": 0.39, + "learning_rate": 3.448053983755335e-06, + "loss": 1.1263, + "step": 13109 + }, + { + "epoch": 0.39, + "learning_rate": 3.4478282785867674e-06, + "loss": 1.072, + "step": 13110 + }, + { + "epoch": 0.39, + "learning_rate": 3.4476025643953317e-06, + "loss": 1.2198, + "step": 13111 + }, + { + "epoch": 0.39, + "learning_rate": 3.4473768411831755e-06, + "loss": 1.2976, + "step": 13112 + }, + { + "epoch": 0.4, + "learning_rate": 3.4471511089524486e-06, + "loss": 1.2669, + "step": 13113 + }, + { + "epoch": 0.4, + "learning_rate": 3.4469253677052983e-06, + "loss": 1.1429, + "step": 13114 + }, + { + "epoch": 0.4, + "learning_rate": 3.446699617443876e-06, + "loss": 1.1858, + "step": 13115 + }, + { + "epoch": 0.4, + "learning_rate": 3.4464738581703284e-06, + "loss": 1.1018, + "step": 13116 + }, + { + "epoch": 0.4, + "learning_rate": 3.446248089886805e-06, + "loss": 1.0948, + "step": 13117 + }, + { + "epoch": 0.4, + "learning_rate": 3.4460223125954563e-06, + "loss": 1.2131, + "step": 13118 + }, + { + "epoch": 0.4, + "learning_rate": 3.4457965262984305e-06, + "loss": 1.1304, + "step": 13119 + }, + { + "epoch": 0.4, + "learning_rate": 3.445570730997877e-06, + "loss": 1.1656, + "step": 13120 + }, + { + "epoch": 0.4, + "learning_rate": 3.445344926695946e-06, + "loss": 1.1423, + "step": 13121 + }, + { + "epoch": 0.4, + "learning_rate": 3.445119113394787e-06, + "loss": 1.0006, + "step": 13122 + }, + { + "epoch": 0.4, + "learning_rate": 3.4448932910965484e-06, + "loss": 1.0903, + "step": 13123 + }, + { + "epoch": 0.4, + "learning_rate": 3.444667459803381e-06, + "loss": 1.2366, + "step": 13124 + }, + { + "epoch": 0.4, + "learning_rate": 3.4444416195174345e-06, + "loss": 1.1622, + "step": 13125 + }, + { + "epoch": 0.4, + "learning_rate": 3.444215770240859e-06, + "loss": 1.2274, + "step": 13126 + }, + { + "epoch": 0.4, + "learning_rate": 3.4439899119758035e-06, + "loss": 1.0807, + "step": 13127 + }, + { + "epoch": 0.4, + "learning_rate": 3.443764044724419e-06, + "loss": 1.0544, + "step": 13128 + }, + { + "epoch": 0.4, + "learning_rate": 3.4435381684888554e-06, + "loss": 1.0768, + "step": 13129 + }, + { + "epoch": 0.4, + "learning_rate": 3.443312283271262e-06, + "loss": 1.0817, + "step": 13130 + }, + { + "epoch": 0.4, + "learning_rate": 3.4430863890737907e-06, + "loss": 1.1063, + "step": 13131 + }, + { + "epoch": 0.4, + "learning_rate": 3.4428604858985916e-06, + "loss": 1.1633, + "step": 13132 + }, + { + "epoch": 0.4, + "learning_rate": 3.442634573747814e-06, + "loss": 1.1807, + "step": 13133 + }, + { + "epoch": 0.4, + "learning_rate": 3.442408652623609e-06, + "loss": 1.1333, + "step": 13134 + }, + { + "epoch": 0.4, + "learning_rate": 3.4421827225281285e-06, + "loss": 1.2164, + "step": 13135 + }, + { + "epoch": 0.4, + "learning_rate": 3.4419567834635213e-06, + "loss": 1.2023, + "step": 13136 + }, + { + "epoch": 0.4, + "learning_rate": 3.44173083543194e-06, + "loss": 1.1967, + "step": 13137 + }, + { + "epoch": 0.4, + "learning_rate": 3.4415048784355343e-06, + "loss": 1.1603, + "step": 13138 + }, + { + "epoch": 0.4, + "learning_rate": 3.441278912476456e-06, + "loss": 1.0486, + "step": 13139 + }, + { + "epoch": 0.4, + "learning_rate": 3.441052937556856e-06, + "loss": 1.1155, + "step": 13140 + }, + { + "epoch": 0.4, + "learning_rate": 3.4408269536788846e-06, + "loss": 1.1486, + "step": 13141 + }, + { + "epoch": 0.4, + "learning_rate": 3.4406009608446933e-06, + "loss": 1.1292, + "step": 13142 + }, + { + "epoch": 0.4, + "learning_rate": 3.4403749590564344e-06, + "loss": 1.036, + "step": 13143 + }, + { + "epoch": 0.4, + "learning_rate": 3.4401489483162592e-06, + "loss": 1.1167, + "step": 13144 + }, + { + "epoch": 0.4, + "learning_rate": 3.4399229286263182e-06, + "loss": 1.0782, + "step": 13145 + }, + { + "epoch": 0.4, + "learning_rate": 3.4396968999887637e-06, + "loss": 1.1484, + "step": 13146 + }, + { + "epoch": 0.4, + "learning_rate": 3.4394708624057472e-06, + "loss": 1.1242, + "step": 13147 + }, + { + "epoch": 0.4, + "learning_rate": 3.439244815879421e-06, + "loss": 1.1725, + "step": 13148 + }, + { + "epoch": 0.4, + "learning_rate": 3.439018760411936e-06, + "loss": 1.2198, + "step": 13149 + }, + { + "epoch": 0.4, + "learning_rate": 3.4387926960054453e-06, + "loss": 1.0642, + "step": 13150 + }, + { + "epoch": 0.4, + "learning_rate": 3.4385666226620996e-06, + "loss": 1.1615, + "step": 13151 + }, + { + "epoch": 0.4, + "learning_rate": 3.4383405403840526e-06, + "loss": 1.0474, + "step": 13152 + }, + { + "epoch": 0.4, + "learning_rate": 3.4381144491734545e-06, + "loss": 1.1432, + "step": 13153 + }, + { + "epoch": 0.4, + "learning_rate": 3.4378883490324593e-06, + "loss": 1.0725, + "step": 13154 + }, + { + "epoch": 0.4, + "learning_rate": 3.437662239963219e-06, + "loss": 1.0368, + "step": 13155 + }, + { + "epoch": 0.4, + "learning_rate": 3.437436121967884e-06, + "loss": 1.2119, + "step": 13156 + }, + { + "epoch": 0.4, + "learning_rate": 3.4372099950486106e-06, + "loss": 1.1141, + "step": 13157 + }, + { + "epoch": 0.4, + "learning_rate": 3.4369838592075488e-06, + "loss": 1.1111, + "step": 13158 + }, + { + "epoch": 0.4, + "learning_rate": 3.4367577144468522e-06, + "loss": 1.0104, + "step": 13159 + }, + { + "epoch": 0.4, + "learning_rate": 3.4365315607686724e-06, + "loss": 1.1858, + "step": 13160 + }, + { + "epoch": 0.4, + "learning_rate": 3.436305398175164e-06, + "loss": 1.0375, + "step": 13161 + }, + { + "epoch": 0.4, + "learning_rate": 3.4360792266684782e-06, + "loss": 1.2441, + "step": 13162 + }, + { + "epoch": 0.4, + "learning_rate": 3.43585304625077e-06, + "loss": 1.1212, + "step": 13163 + }, + { + "epoch": 0.4, + "learning_rate": 3.4356268569241915e-06, + "loss": 1.1213, + "step": 13164 + }, + { + "epoch": 0.4, + "learning_rate": 3.4354006586908954e-06, + "loss": 1.2471, + "step": 13165 + }, + { + "epoch": 0.4, + "learning_rate": 3.435174451553036e-06, + "loss": 1.1146, + "step": 13166 + }, + { + "epoch": 0.4, + "learning_rate": 3.4349482355127663e-06, + "loss": 1.1023, + "step": 13167 + }, + { + "epoch": 0.4, + "learning_rate": 3.434722010572239e-06, + "loss": 1.2612, + "step": 13168 + }, + { + "epoch": 0.4, + "learning_rate": 3.4344957767336083e-06, + "loss": 1.2133, + "step": 13169 + }, + { + "epoch": 0.4, + "learning_rate": 3.434269533999029e-06, + "loss": 1.0122, + "step": 13170 + }, + { + "epoch": 0.4, + "learning_rate": 3.4340432823706525e-06, + "loss": 1.1226, + "step": 13171 + }, + { + "epoch": 0.4, + "learning_rate": 3.4338170218506344e-06, + "loss": 1.1879, + "step": 13172 + }, + { + "epoch": 0.4, + "learning_rate": 3.4335907524411275e-06, + "loss": 1.1154, + "step": 13173 + }, + { + "epoch": 0.4, + "learning_rate": 3.4333644741442867e-06, + "loss": 1.1706, + "step": 13174 + }, + { + "epoch": 0.4, + "learning_rate": 3.4331381869622655e-06, + "loss": 1.2142, + "step": 13175 + }, + { + "epoch": 0.4, + "learning_rate": 3.4329118908972187e-06, + "loss": 1.2493, + "step": 13176 + }, + { + "epoch": 0.4, + "learning_rate": 3.432685585951299e-06, + "loss": 1.0624, + "step": 13177 + }, + { + "epoch": 0.4, + "learning_rate": 3.4324592721266626e-06, + "loss": 1.0806, + "step": 13178 + }, + { + "epoch": 0.4, + "learning_rate": 3.4322329494254625e-06, + "loss": 1.09, + "step": 13179 + }, + { + "epoch": 0.4, + "learning_rate": 3.4320066178498545e-06, + "loss": 1.1607, + "step": 13180 + }, + { + "epoch": 0.4, + "learning_rate": 3.4317802774019915e-06, + "loss": 1.0251, + "step": 13181 + }, + { + "epoch": 0.4, + "learning_rate": 3.431553928084029e-06, + "loss": 1.1533, + "step": 13182 + }, + { + "epoch": 0.4, + "learning_rate": 3.4313275698981226e-06, + "loss": 1.1762, + "step": 13183 + }, + { + "epoch": 0.4, + "learning_rate": 3.431101202846425e-06, + "loss": 1.1212, + "step": 13184 + }, + { + "epoch": 0.4, + "learning_rate": 3.4308748269310938e-06, + "loss": 1.0188, + "step": 13185 + }, + { + "epoch": 0.4, + "learning_rate": 3.430648442154282e-06, + "loss": 1.2032, + "step": 13186 + }, + { + "epoch": 0.4, + "learning_rate": 3.4304220485181446e-06, + "loss": 1.1606, + "step": 13187 + }, + { + "epoch": 0.4, + "learning_rate": 3.4301956460248374e-06, + "loss": 1.0953, + "step": 13188 + }, + { + "epoch": 0.4, + "learning_rate": 3.429969234676517e-06, + "loss": 1.0743, + "step": 13189 + }, + { + "epoch": 0.4, + "learning_rate": 3.4297428144753363e-06, + "loss": 1.1816, + "step": 13190 + }, + { + "epoch": 0.4, + "learning_rate": 3.429516385423452e-06, + "loss": 1.2112, + "step": 13191 + }, + { + "epoch": 0.4, + "learning_rate": 3.429289947523019e-06, + "loss": 1.0394, + "step": 13192 + }, + { + "epoch": 0.4, + "learning_rate": 3.429063500776194e-06, + "loss": 1.2973, + "step": 13193 + }, + { + "epoch": 0.4, + "learning_rate": 3.4288370451851315e-06, + "loss": 1.1227, + "step": 13194 + }, + { + "epoch": 0.4, + "learning_rate": 3.428610580751988e-06, + "loss": 1.0471, + "step": 13195 + }, + { + "epoch": 0.4, + "learning_rate": 3.428384107478919e-06, + "loss": 1.2012, + "step": 13196 + }, + { + "epoch": 0.4, + "learning_rate": 3.42815762536808e-06, + "loss": 1.1338, + "step": 13197 + }, + { + "epoch": 0.4, + "learning_rate": 3.4279311344216275e-06, + "loss": 1.165, + "step": 13198 + }, + { + "epoch": 0.4, + "learning_rate": 3.4277046346417176e-06, + "loss": 1.0981, + "step": 13199 + }, + { + "epoch": 0.4, + "learning_rate": 3.4274781260305066e-06, + "loss": 1.1855, + "step": 13200 + }, + { + "epoch": 0.4, + "learning_rate": 3.4272516085901503e-06, + "loss": 1.0825, + "step": 13201 + }, + { + "epoch": 0.4, + "learning_rate": 3.4270250823228052e-06, + "loss": 1.1985, + "step": 13202 + }, + { + "epoch": 0.4, + "learning_rate": 3.4267985472306275e-06, + "loss": 1.038, + "step": 13203 + }, + { + "epoch": 0.4, + "learning_rate": 3.4265720033157744e-06, + "loss": 1.266, + "step": 13204 + }, + { + "epoch": 0.4, + "learning_rate": 3.4263454505804023e-06, + "loss": 1.1946, + "step": 13205 + }, + { + "epoch": 0.4, + "learning_rate": 3.426118889026668e-06, + "loss": 1.0734, + "step": 13206 + }, + { + "epoch": 0.4, + "learning_rate": 3.4258923186567266e-06, + "loss": 1.1881, + "step": 13207 + }, + { + "epoch": 0.4, + "learning_rate": 3.4256657394727376e-06, + "loss": 1.1572, + "step": 13208 + }, + { + "epoch": 0.4, + "learning_rate": 3.425439151476856e-06, + "loss": 1.186, + "step": 13209 + }, + { + "epoch": 0.4, + "learning_rate": 3.4252125546712387e-06, + "loss": 1.1165, + "step": 13210 + }, + { + "epoch": 0.4, + "learning_rate": 3.4249859490580446e-06, + "loss": 1.2418, + "step": 13211 + }, + { + "epoch": 0.4, + "learning_rate": 3.4247593346394293e-06, + "loss": 1.1401, + "step": 13212 + }, + { + "epoch": 0.4, + "learning_rate": 3.424532711417551e-06, + "loss": 1.173, + "step": 13213 + }, + { + "epoch": 0.4, + "learning_rate": 3.4243060793945654e-06, + "loss": 1.2389, + "step": 13214 + }, + { + "epoch": 0.4, + "learning_rate": 3.4240794385726317e-06, + "loss": 1.1887, + "step": 13215 + }, + { + "epoch": 0.4, + "learning_rate": 3.4238527889539063e-06, + "loss": 1.1698, + "step": 13216 + }, + { + "epoch": 0.4, + "learning_rate": 3.4236261305405483e-06, + "loss": 1.2107, + "step": 13217 + }, + { + "epoch": 0.4, + "learning_rate": 3.4233994633347135e-06, + "loss": 1.2339, + "step": 13218 + }, + { + "epoch": 0.4, + "learning_rate": 3.4231727873385614e-06, + "loss": 1.1454, + "step": 13219 + }, + { + "epoch": 0.4, + "learning_rate": 3.422946102554248e-06, + "loss": 1.1583, + "step": 13220 + }, + { + "epoch": 0.4, + "learning_rate": 3.4227194089839333e-06, + "loss": 1.1323, + "step": 13221 + }, + { + "epoch": 0.4, + "learning_rate": 3.422492706629773e-06, + "loss": 1.0919, + "step": 13222 + }, + { + "epoch": 0.4, + "learning_rate": 3.4222659954939276e-06, + "loss": 1.1846, + "step": 13223 + }, + { + "epoch": 0.4, + "learning_rate": 3.4220392755785534e-06, + "loss": 1.2834, + "step": 13224 + }, + { + "epoch": 0.4, + "learning_rate": 3.4218125468858093e-06, + "loss": 1.0615, + "step": 13225 + }, + { + "epoch": 0.4, + "learning_rate": 3.4215858094178546e-06, + "loss": 1.1252, + "step": 13226 + }, + { + "epoch": 0.4, + "learning_rate": 3.4213590631768455e-06, + "loss": 1.0986, + "step": 13227 + }, + { + "epoch": 0.4, + "learning_rate": 3.4211323081649428e-06, + "loss": 1.1603, + "step": 13228 + }, + { + "epoch": 0.4, + "learning_rate": 3.420905544384303e-06, + "loss": 0.9957, + "step": 13229 + }, + { + "epoch": 0.4, + "learning_rate": 3.420678771837088e-06, + "loss": 1.3405, + "step": 13230 + }, + { + "epoch": 0.4, + "learning_rate": 3.420451990525453e-06, + "loss": 1.1025, + "step": 13231 + }, + { + "epoch": 0.4, + "learning_rate": 3.4202252004515586e-06, + "loss": 1.0943, + "step": 13232 + }, + { + "epoch": 0.4, + "learning_rate": 3.4199984016175636e-06, + "loss": 1.157, + "step": 13233 + }, + { + "epoch": 0.4, + "learning_rate": 3.419771594025627e-06, + "loss": 1.1241, + "step": 13234 + }, + { + "epoch": 0.4, + "learning_rate": 3.4195447776779077e-06, + "loss": 1.0722, + "step": 13235 + }, + { + "epoch": 0.4, + "learning_rate": 3.4193179525765647e-06, + "loss": 1.1823, + "step": 13236 + }, + { + "epoch": 0.4, + "learning_rate": 3.419091118723758e-06, + "loss": 1.2811, + "step": 13237 + }, + { + "epoch": 0.4, + "learning_rate": 3.4188642761216462e-06, + "loss": 1.1704, + "step": 13238 + }, + { + "epoch": 0.4, + "learning_rate": 3.41863742477239e-06, + "loss": 1.1491, + "step": 13239 + }, + { + "epoch": 0.4, + "learning_rate": 3.4184105646781464e-06, + "loss": 1.1528, + "step": 13240 + }, + { + "epoch": 0.4, + "learning_rate": 3.4181836958410774e-06, + "loss": 1.031, + "step": 13241 + }, + { + "epoch": 0.4, + "learning_rate": 3.4179568182633417e-06, + "loss": 1.1808, + "step": 13242 + }, + { + "epoch": 0.4, + "learning_rate": 3.417729931947099e-06, + "loss": 1.0583, + "step": 13243 + }, + { + "epoch": 0.4, + "learning_rate": 3.4175030368945095e-06, + "loss": 1.1576, + "step": 13244 + }, + { + "epoch": 0.4, + "learning_rate": 3.4172761331077333e-06, + "loss": 1.1506, + "step": 13245 + }, + { + "epoch": 0.4, + "learning_rate": 3.4170492205889296e-06, + "loss": 1.0964, + "step": 13246 + }, + { + "epoch": 0.4, + "learning_rate": 3.416822299340259e-06, + "loss": 1.168, + "step": 13247 + }, + { + "epoch": 0.4, + "learning_rate": 3.416595369363882e-06, + "loss": 1.144, + "step": 13248 + }, + { + "epoch": 0.4, + "learning_rate": 3.4163684306619576e-06, + "loss": 1.1993, + "step": 13249 + }, + { + "epoch": 0.4, + "learning_rate": 3.4161414832366483e-06, + "loss": 1.078, + "step": 13250 + }, + { + "epoch": 0.4, + "learning_rate": 3.415914527090113e-06, + "loss": 1.1087, + "step": 13251 + }, + { + "epoch": 0.4, + "learning_rate": 3.415687562224512e-06, + "loss": 1.0286, + "step": 13252 + }, + { + "epoch": 0.4, + "learning_rate": 3.415460588642007e-06, + "loss": 1.1291, + "step": 13253 + }, + { + "epoch": 0.4, + "learning_rate": 3.415233606344758e-06, + "loss": 1.1265, + "step": 13254 + }, + { + "epoch": 0.4, + "learning_rate": 3.415006615334926e-06, + "loss": 1.1765, + "step": 13255 + }, + { + "epoch": 0.4, + "learning_rate": 3.414779615614671e-06, + "loss": 1.1163, + "step": 13256 + }, + { + "epoch": 0.4, + "learning_rate": 3.4145526071861546e-06, + "loss": 1.0082, + "step": 13257 + }, + { + "epoch": 0.4, + "learning_rate": 3.414325590051539e-06, + "loss": 1.1179, + "step": 13258 + }, + { + "epoch": 0.4, + "learning_rate": 3.414098564212983e-06, + "loss": 1.0811, + "step": 13259 + }, + { + "epoch": 0.4, + "learning_rate": 3.41387152967265e-06, + "loss": 1.0844, + "step": 13260 + }, + { + "epoch": 0.4, + "learning_rate": 3.4136444864326988e-06, + "loss": 1.2817, + "step": 13261 + }, + { + "epoch": 0.4, + "learning_rate": 3.413417434495293e-06, + "loss": 1.1396, + "step": 13262 + }, + { + "epoch": 0.4, + "learning_rate": 3.4131903738625933e-06, + "loss": 1.145, + "step": 13263 + }, + { + "epoch": 0.4, + "learning_rate": 3.4129633045367606e-06, + "loss": 1.1012, + "step": 13264 + }, + { + "epoch": 0.4, + "learning_rate": 3.412736226519957e-06, + "loss": 1.0554, + "step": 13265 + }, + { + "epoch": 0.4, + "learning_rate": 3.4125091398143444e-06, + "loss": 1.209, + "step": 13266 + }, + { + "epoch": 0.4, + "learning_rate": 3.4122820444220846e-06, + "loss": 1.1269, + "step": 13267 + }, + { + "epoch": 0.4, + "learning_rate": 3.412054940345338e-06, + "loss": 1.0817, + "step": 13268 + }, + { + "epoch": 0.4, + "learning_rate": 3.4118278275862683e-06, + "loss": 1.0325, + "step": 13269 + }, + { + "epoch": 0.4, + "learning_rate": 3.4116007061470363e-06, + "loss": 1.0875, + "step": 13270 + }, + { + "epoch": 0.4, + "learning_rate": 3.4113735760298057e-06, + "loss": 1.1835, + "step": 13271 + }, + { + "epoch": 0.4, + "learning_rate": 3.4111464372367364e-06, + "loss": 1.1092, + "step": 13272 + }, + { + "epoch": 0.4, + "learning_rate": 3.4109192897699926e-06, + "loss": 1.14, + "step": 13273 + }, + { + "epoch": 0.4, + "learning_rate": 3.4106921336317358e-06, + "loss": 1.2495, + "step": 13274 + }, + { + "epoch": 0.4, + "learning_rate": 3.410464968824128e-06, + "loss": 1.0733, + "step": 13275 + }, + { + "epoch": 0.4, + "learning_rate": 3.4102377953493324e-06, + "loss": 1.0828, + "step": 13276 + }, + { + "epoch": 0.4, + "learning_rate": 3.4100106132095117e-06, + "loss": 1.0531, + "step": 13277 + }, + { + "epoch": 0.4, + "learning_rate": 3.4097834224068284e-06, + "loss": 1.1855, + "step": 13278 + }, + { + "epoch": 0.4, + "learning_rate": 3.409556222943444e-06, + "loss": 1.2194, + "step": 13279 + }, + { + "epoch": 0.4, + "learning_rate": 3.4093290148215243e-06, + "loss": 1.2396, + "step": 13280 + }, + { + "epoch": 0.4, + "learning_rate": 3.4091017980432284e-06, + "loss": 1.1202, + "step": 13281 + }, + { + "epoch": 0.4, + "learning_rate": 3.4088745726107224e-06, + "loss": 0.9875, + "step": 13282 + }, + { + "epoch": 0.4, + "learning_rate": 3.4086473385261674e-06, + "loss": 1.0741, + "step": 13283 + }, + { + "epoch": 0.4, + "learning_rate": 3.408420095791728e-06, + "loss": 1.1942, + "step": 13284 + }, + { + "epoch": 0.4, + "learning_rate": 3.4081928444095664e-06, + "loss": 1.138, + "step": 13285 + }, + { + "epoch": 0.4, + "learning_rate": 3.4079655843818466e-06, + "loss": 1.2538, + "step": 13286 + }, + { + "epoch": 0.4, + "learning_rate": 3.407738315710731e-06, + "loss": 1.0142, + "step": 13287 + }, + { + "epoch": 0.4, + "learning_rate": 3.407511038398385e-06, + "loss": 1.1654, + "step": 13288 + }, + { + "epoch": 0.4, + "learning_rate": 3.4072837524469703e-06, + "loss": 1.0969, + "step": 13289 + }, + { + "epoch": 0.4, + "learning_rate": 3.407056457858651e-06, + "loss": 1.162, + "step": 13290 + }, + { + "epoch": 0.4, + "learning_rate": 3.4068291546355917e-06, + "loss": 1.1261, + "step": 13291 + }, + { + "epoch": 0.4, + "learning_rate": 3.4066018427799554e-06, + "loss": 1.2355, + "step": 13292 + }, + { + "epoch": 0.4, + "learning_rate": 3.4063745222939067e-06, + "loss": 1.1506, + "step": 13293 + }, + { + "epoch": 0.4, + "learning_rate": 3.406147193179608e-06, + "loss": 1.1123, + "step": 13294 + }, + { + "epoch": 0.4, + "learning_rate": 3.405919855439225e-06, + "loss": 1.1639, + "step": 13295 + }, + { + "epoch": 0.4, + "learning_rate": 3.4056925090749214e-06, + "loss": 1.1317, + "step": 13296 + }, + { + "epoch": 0.4, + "learning_rate": 3.4054651540888604e-06, + "loss": 1.2368, + "step": 13297 + }, + { + "epoch": 0.4, + "learning_rate": 3.405237790483208e-06, + "loss": 1.2747, + "step": 13298 + }, + { + "epoch": 0.4, + "learning_rate": 3.405010418260128e-06, + "loss": 1.1825, + "step": 13299 + }, + { + "epoch": 0.4, + "learning_rate": 3.4047830374217845e-06, + "loss": 1.1375, + "step": 13300 + }, + { + "epoch": 0.4, + "learning_rate": 3.4045556479703424e-06, + "loss": 1.1425, + "step": 13301 + }, + { + "epoch": 0.4, + "learning_rate": 3.4043282499079656e-06, + "loss": 1.0815, + "step": 13302 + }, + { + "epoch": 0.4, + "learning_rate": 3.4041008432368193e-06, + "loss": 1.0814, + "step": 13303 + }, + { + "epoch": 0.4, + "learning_rate": 3.4038734279590696e-06, + "loss": 1.1367, + "step": 13304 + }, + { + "epoch": 0.4, + "learning_rate": 3.403646004076879e-06, + "loss": 1.0855, + "step": 13305 + }, + { + "epoch": 0.4, + "learning_rate": 3.4034185715924144e-06, + "loss": 1.19, + "step": 13306 + }, + { + "epoch": 0.4, + "learning_rate": 3.4031911305078395e-06, + "loss": 0.9985, + "step": 13307 + }, + { + "epoch": 0.4, + "learning_rate": 3.4029636808253208e-06, + "loss": 1.1305, + "step": 13308 + }, + { + "epoch": 0.4, + "learning_rate": 3.402736222547022e-06, + "loss": 1.1645, + "step": 13309 + }, + { + "epoch": 0.4, + "learning_rate": 3.402508755675109e-06, + "loss": 1.1346, + "step": 13310 + }, + { + "epoch": 0.4, + "learning_rate": 3.402281280211748e-06, + "loss": 1.1606, + "step": 13311 + }, + { + "epoch": 0.4, + "learning_rate": 3.402053796159104e-06, + "loss": 1.2241, + "step": 13312 + }, + { + "epoch": 0.4, + "learning_rate": 3.401826303519341e-06, + "loss": 1.084, + "step": 13313 + }, + { + "epoch": 0.4, + "learning_rate": 3.401598802294627e-06, + "loss": 1.1565, + "step": 13314 + }, + { + "epoch": 0.4, + "learning_rate": 3.4013712924871263e-06, + "loss": 1.0405, + "step": 13315 + }, + { + "epoch": 0.4, + "learning_rate": 3.401143774099005e-06, + "loss": 1.0034, + "step": 13316 + }, + { + "epoch": 0.4, + "learning_rate": 3.400916247132429e-06, + "loss": 1.1282, + "step": 13317 + }, + { + "epoch": 0.4, + "learning_rate": 3.4006887115895643e-06, + "loss": 1.0906, + "step": 13318 + }, + { + "epoch": 0.4, + "learning_rate": 3.4004611674725768e-06, + "loss": 1.0854, + "step": 13319 + }, + { + "epoch": 0.4, + "learning_rate": 3.4002336147836324e-06, + "loss": 1.0949, + "step": 13320 + }, + { + "epoch": 0.4, + "learning_rate": 3.400006053524898e-06, + "loss": 1.1213, + "step": 13321 + }, + { + "epoch": 0.4, + "learning_rate": 3.399778483698539e-06, + "loss": 1.0303, + "step": 13322 + }, + { + "epoch": 0.4, + "learning_rate": 3.3995509053067226e-06, + "loss": 1.1136, + "step": 13323 + }, + { + "epoch": 0.4, + "learning_rate": 3.399323318351615e-06, + "loss": 1.1439, + "step": 13324 + }, + { + "epoch": 0.4, + "learning_rate": 3.3990957228353817e-06, + "loss": 1.0303, + "step": 13325 + }, + { + "epoch": 0.4, + "learning_rate": 3.398868118760191e-06, + "loss": 1.0635, + "step": 13326 + }, + { + "epoch": 0.4, + "learning_rate": 3.398640506128208e-06, + "loss": 1.0492, + "step": 13327 + }, + { + "epoch": 0.4, + "learning_rate": 3.3984128849416005e-06, + "loss": 1.1901, + "step": 13328 + }, + { + "epoch": 0.4, + "learning_rate": 3.3981852552025352e-06, + "loss": 1.2225, + "step": 13329 + }, + { + "epoch": 0.4, + "learning_rate": 3.397957616913179e-06, + "loss": 1.0745, + "step": 13330 + }, + { + "epoch": 0.4, + "learning_rate": 3.397729970075698e-06, + "loss": 1.1536, + "step": 13331 + }, + { + "epoch": 0.4, + "learning_rate": 3.3975023146922608e-06, + "loss": 1.1691, + "step": 13332 + }, + { + "epoch": 0.4, + "learning_rate": 3.397274650765033e-06, + "loss": 1.2017, + "step": 13333 + }, + { + "epoch": 0.4, + "learning_rate": 3.3970469782961835e-06, + "loss": 1.0998, + "step": 13334 + }, + { + "epoch": 0.4, + "learning_rate": 3.3968192972878784e-06, + "loss": 1.1387, + "step": 13335 + }, + { + "epoch": 0.4, + "learning_rate": 3.3965916077422863e-06, + "loss": 1.3058, + "step": 13336 + }, + { + "epoch": 0.4, + "learning_rate": 3.396363909661573e-06, + "loss": 1.1462, + "step": 13337 + }, + { + "epoch": 0.4, + "learning_rate": 3.3961362030479066e-06, + "loss": 1.1739, + "step": 13338 + }, + { + "epoch": 0.4, + "learning_rate": 3.3959084879034554e-06, + "loss": 1.0863, + "step": 13339 + }, + { + "epoch": 0.4, + "learning_rate": 3.395680764230388e-06, + "loss": 1.1124, + "step": 13340 + }, + { + "epoch": 0.4, + "learning_rate": 3.39545303203087e-06, + "loss": 1.1901, + "step": 13341 + }, + { + "epoch": 0.4, + "learning_rate": 3.3952252913070703e-06, + "loss": 1.2205, + "step": 13342 + }, + { + "epoch": 0.4, + "learning_rate": 3.3949975420611573e-06, + "loss": 1.2812, + "step": 13343 + }, + { + "epoch": 0.4, + "learning_rate": 3.3947697842952987e-06, + "loss": 1.1754, + "step": 13344 + }, + { + "epoch": 0.4, + "learning_rate": 3.3945420180116632e-06, + "loss": 1.0326, + "step": 13345 + }, + { + "epoch": 0.4, + "learning_rate": 3.394314243212418e-06, + "loss": 1.0891, + "step": 13346 + }, + { + "epoch": 0.4, + "learning_rate": 3.3940864598997323e-06, + "loss": 1.1075, + "step": 13347 + }, + { + "epoch": 0.4, + "learning_rate": 3.393858668075774e-06, + "loss": 1.0717, + "step": 13348 + }, + { + "epoch": 0.4, + "learning_rate": 3.3936308677427122e-06, + "loss": 1.2943, + "step": 13349 + }, + { + "epoch": 0.4, + "learning_rate": 3.3934030589027134e-06, + "loss": 1.0706, + "step": 13350 + }, + { + "epoch": 0.4, + "learning_rate": 3.393175241557949e-06, + "loss": 1.1583, + "step": 13351 + }, + { + "epoch": 0.4, + "learning_rate": 3.3929474157105856e-06, + "loss": 1.0883, + "step": 13352 + }, + { + "epoch": 0.4, + "learning_rate": 3.3927195813627934e-06, + "loss": 1.1519, + "step": 13353 + }, + { + "epoch": 0.4, + "learning_rate": 3.3924917385167405e-06, + "loss": 1.1126, + "step": 13354 + }, + { + "epoch": 0.4, + "learning_rate": 3.392263887174596e-06, + "loss": 1.1887, + "step": 13355 + }, + { + "epoch": 0.4, + "learning_rate": 3.39203602733853e-06, + "loss": 1.1735, + "step": 13356 + }, + { + "epoch": 0.4, + "learning_rate": 3.39180815901071e-06, + "loss": 1.0269, + "step": 13357 + }, + { + "epoch": 0.4, + "learning_rate": 3.3915802821933057e-06, + "loss": 1.1639, + "step": 13358 + }, + { + "epoch": 0.4, + "learning_rate": 3.3913523968884867e-06, + "loss": 1.1789, + "step": 13359 + }, + { + "epoch": 0.4, + "learning_rate": 3.391124503098422e-06, + "loss": 1.1574, + "step": 13360 + }, + { + "epoch": 0.4, + "learning_rate": 3.3908966008252807e-06, + "loss": 1.2255, + "step": 13361 + }, + { + "epoch": 0.4, + "learning_rate": 3.390668690071234e-06, + "loss": 1.1923, + "step": 13362 + }, + { + "epoch": 0.4, + "learning_rate": 3.3904407708384496e-06, + "loss": 1.1597, + "step": 13363 + }, + { + "epoch": 0.4, + "learning_rate": 3.3902128431290983e-06, + "loss": 1.2268, + "step": 13364 + }, + { + "epoch": 0.4, + "learning_rate": 3.3899849069453496e-06, + "loss": 1.0294, + "step": 13365 + }, + { + "epoch": 0.4, + "learning_rate": 3.3897569622893724e-06, + "loss": 1.0811, + "step": 13366 + }, + { + "epoch": 0.4, + "learning_rate": 3.3895290091633376e-06, + "loss": 1.0883, + "step": 13367 + }, + { + "epoch": 0.4, + "learning_rate": 3.389301047569415e-06, + "loss": 1.1575, + "step": 13368 + }, + { + "epoch": 0.4, + "learning_rate": 3.3890730775097753e-06, + "loss": 1.212, + "step": 13369 + }, + { + "epoch": 0.4, + "learning_rate": 3.3888450989865875e-06, + "loss": 1.044, + "step": 13370 + }, + { + "epoch": 0.4, + "learning_rate": 3.3886171120020234e-06, + "loss": 1.1609, + "step": 13371 + }, + { + "epoch": 0.4, + "learning_rate": 3.388389116558252e-06, + "loss": 1.0839, + "step": 13372 + }, + { + "epoch": 0.4, + "learning_rate": 3.3881611126574432e-06, + "loss": 1.2251, + "step": 13373 + }, + { + "epoch": 0.4, + "learning_rate": 3.387933100301769e-06, + "loss": 1.1084, + "step": 13374 + }, + { + "epoch": 0.4, + "learning_rate": 3.3877050794933997e-06, + "loss": 1.2268, + "step": 13375 + }, + { + "epoch": 0.4, + "learning_rate": 3.387477050234505e-06, + "loss": 1.1581, + "step": 13376 + }, + { + "epoch": 0.4, + "learning_rate": 3.3872490125272567e-06, + "loss": 1.2279, + "step": 13377 + }, + { + "epoch": 0.4, + "learning_rate": 3.3870209663738244e-06, + "loss": 1.0444, + "step": 13378 + }, + { + "epoch": 0.4, + "learning_rate": 3.38679291177638e-06, + "loss": 1.1555, + "step": 13379 + }, + { + "epoch": 0.4, + "learning_rate": 3.386564848737094e-06, + "loss": 1.0876, + "step": 13380 + }, + { + "epoch": 0.4, + "learning_rate": 3.3863367772581384e-06, + "loss": 1.111, + "step": 13381 + }, + { + "epoch": 0.4, + "learning_rate": 3.386108697341683e-06, + "loss": 1.1911, + "step": 13382 + }, + { + "epoch": 0.4, + "learning_rate": 3.3858806089898995e-06, + "loss": 1.1381, + "step": 13383 + }, + { + "epoch": 0.4, + "learning_rate": 3.3856525122049593e-06, + "loss": 1.1522, + "step": 13384 + }, + { + "epoch": 0.4, + "learning_rate": 3.3854244069890342e-06, + "loss": 0.9037, + "step": 13385 + }, + { + "epoch": 0.4, + "learning_rate": 3.385196293344295e-06, + "loss": 1.1574, + "step": 13386 + }, + { + "epoch": 0.4, + "learning_rate": 3.384968171272913e-06, + "loss": 1.1324, + "step": 13387 + }, + { + "epoch": 0.4, + "learning_rate": 3.3847400407770603e-06, + "loss": 1.2072, + "step": 13388 + }, + { + "epoch": 0.4, + "learning_rate": 3.384511901858909e-06, + "loss": 1.1722, + "step": 13389 + }, + { + "epoch": 0.4, + "learning_rate": 3.3842837545206297e-06, + "loss": 1.0923, + "step": 13390 + }, + { + "epoch": 0.4, + "learning_rate": 3.384055598764395e-06, + "loss": 1.071, + "step": 13391 + }, + { + "epoch": 0.4, + "learning_rate": 3.383827434592377e-06, + "loss": 1.2811, + "step": 13392 + }, + { + "epoch": 0.4, + "learning_rate": 3.3835992620067476e-06, + "loss": 1.1524, + "step": 13393 + }, + { + "epoch": 0.4, + "learning_rate": 3.3833710810096787e-06, + "loss": 1.1885, + "step": 13394 + }, + { + "epoch": 0.4, + "learning_rate": 3.3831428916033425e-06, + "loss": 1.0879, + "step": 13395 + }, + { + "epoch": 0.4, + "learning_rate": 3.3829146937899117e-06, + "loss": 1.1008, + "step": 13396 + }, + { + "epoch": 0.4, + "learning_rate": 3.382686487571558e-06, + "loss": 1.1545, + "step": 13397 + }, + { + "epoch": 0.4, + "learning_rate": 3.382458272950454e-06, + "loss": 1.046, + "step": 13398 + }, + { + "epoch": 0.4, + "learning_rate": 3.3822300499287725e-06, + "loss": 1.1893, + "step": 13399 + }, + { + "epoch": 0.4, + "learning_rate": 3.3820018185086852e-06, + "loss": 1.079, + "step": 13400 + }, + { + "epoch": 0.4, + "learning_rate": 3.381773578692366e-06, + "loss": 1.142, + "step": 13401 + }, + { + "epoch": 0.4, + "learning_rate": 3.3815453304819868e-06, + "loss": 1.1209, + "step": 13402 + }, + { + "epoch": 0.4, + "learning_rate": 3.381317073879721e-06, + "loss": 1.0624, + "step": 13403 + }, + { + "epoch": 0.4, + "learning_rate": 3.3810888088877403e-06, + "loss": 1.2266, + "step": 13404 + }, + { + "epoch": 0.4, + "learning_rate": 3.3808605355082187e-06, + "loss": 1.0762, + "step": 13405 + }, + { + "epoch": 0.4, + "learning_rate": 3.380632253743329e-06, + "loss": 1.1876, + "step": 13406 + }, + { + "epoch": 0.4, + "learning_rate": 3.3804039635952447e-06, + "loss": 1.2363, + "step": 13407 + }, + { + "epoch": 0.4, + "learning_rate": 3.3801756650661384e-06, + "loss": 1.1154, + "step": 13408 + }, + { + "epoch": 0.4, + "learning_rate": 3.379947358158183e-06, + "loss": 1.0851, + "step": 13409 + }, + { + "epoch": 0.4, + "learning_rate": 3.3797190428735542e-06, + "loss": 1.2532, + "step": 13410 + }, + { + "epoch": 0.4, + "learning_rate": 3.379490719214423e-06, + "loss": 1.2546, + "step": 13411 + }, + { + "epoch": 0.4, + "learning_rate": 3.379262387182964e-06, + "loss": 1.2504, + "step": 13412 + }, + { + "epoch": 0.4, + "learning_rate": 3.37903404678135e-06, + "loss": 1.2216, + "step": 13413 + }, + { + "epoch": 0.4, + "learning_rate": 3.3788056980117554e-06, + "loss": 1.2076, + "step": 13414 + }, + { + "epoch": 0.4, + "learning_rate": 3.378577340876354e-06, + "loss": 1.2679, + "step": 13415 + }, + { + "epoch": 0.4, + "learning_rate": 3.3783489753773195e-06, + "loss": 1.0724, + "step": 13416 + }, + { + "epoch": 0.4, + "learning_rate": 3.3781206015168256e-06, + "loss": 1.1436, + "step": 13417 + }, + { + "epoch": 0.4, + "learning_rate": 3.3778922192970465e-06, + "loss": 1.1007, + "step": 13418 + }, + { + "epoch": 0.4, + "learning_rate": 3.3776638287201562e-06, + "loss": 1.1931, + "step": 13419 + }, + { + "epoch": 0.4, + "learning_rate": 3.3774354297883286e-06, + "loss": 1.1165, + "step": 13420 + }, + { + "epoch": 0.4, + "learning_rate": 3.377207022503739e-06, + "loss": 1.1268, + "step": 13421 + }, + { + "epoch": 0.4, + "learning_rate": 3.3769786068685604e-06, + "loss": 1.0305, + "step": 13422 + }, + { + "epoch": 0.4, + "learning_rate": 3.3767501828849685e-06, + "loss": 1.1814, + "step": 13423 + }, + { + "epoch": 0.4, + "learning_rate": 3.3765217505551366e-06, + "loss": 1.1679, + "step": 13424 + }, + { + "epoch": 0.4, + "learning_rate": 3.37629330988124e-06, + "loss": 1.1333, + "step": 13425 + }, + { + "epoch": 0.4, + "learning_rate": 3.3760648608654535e-06, + "loss": 1.2, + "step": 13426 + }, + { + "epoch": 0.4, + "learning_rate": 3.375836403509951e-06, + "loss": 1.122, + "step": 13427 + }, + { + "epoch": 0.4, + "learning_rate": 3.3756079378169076e-06, + "loss": 1.1411, + "step": 13428 + }, + { + "epoch": 0.4, + "learning_rate": 3.375379463788499e-06, + "loss": 0.9943, + "step": 13429 + }, + { + "epoch": 0.4, + "learning_rate": 3.375150981426899e-06, + "loss": 1.1017, + "step": 13430 + }, + { + "epoch": 0.4, + "learning_rate": 3.3749224907342837e-06, + "loss": 1.1968, + "step": 13431 + }, + { + "epoch": 0.4, + "learning_rate": 3.3746939917128265e-06, + "loss": 1.0461, + "step": 13432 + }, + { + "epoch": 0.4, + "learning_rate": 3.3744654843647042e-06, + "loss": 1.1428, + "step": 13433 + }, + { + "epoch": 0.4, + "learning_rate": 3.3742369686920916e-06, + "loss": 1.1072, + "step": 13434 + }, + { + "epoch": 0.4, + "learning_rate": 3.3740084446971644e-06, + "loss": 1.2136, + "step": 13435 + }, + { + "epoch": 0.4, + "learning_rate": 3.373779912382098e-06, + "loss": 1.1401, + "step": 13436 + }, + { + "epoch": 0.4, + "learning_rate": 3.3735513717490677e-06, + "loss": 1.1107, + "step": 13437 + }, + { + "epoch": 0.4, + "learning_rate": 3.3733228228002483e-06, + "loss": 1.093, + "step": 13438 + }, + { + "epoch": 0.4, + "learning_rate": 3.373094265537817e-06, + "loss": 1.1361, + "step": 13439 + }, + { + "epoch": 0.4, + "learning_rate": 3.3728656999639486e-06, + "loss": 1.1077, + "step": 13440 + }, + { + "epoch": 0.4, + "learning_rate": 3.3726371260808187e-06, + "loss": 1.2507, + "step": 13441 + }, + { + "epoch": 0.4, + "learning_rate": 3.372408543890604e-06, + "loss": 1.0823, + "step": 13442 + }, + { + "epoch": 0.4, + "learning_rate": 3.3721799533954802e-06, + "loss": 1.1115, + "step": 13443 + }, + { + "epoch": 0.41, + "learning_rate": 3.3719513545976233e-06, + "loss": 1.0919, + "step": 13444 + }, + { + "epoch": 0.41, + "learning_rate": 3.3717227474992093e-06, + "loss": 1.1293, + "step": 13445 + }, + { + "epoch": 0.41, + "learning_rate": 3.371494132102414e-06, + "loss": 1.1711, + "step": 13446 + }, + { + "epoch": 0.41, + "learning_rate": 3.3712655084094155e-06, + "loss": 1.0965, + "step": 13447 + }, + { + "epoch": 0.41, + "learning_rate": 3.371036876422388e-06, + "loss": 1.1512, + "step": 13448 + }, + { + "epoch": 0.41, + "learning_rate": 3.370808236143509e-06, + "loss": 1.2038, + "step": 13449 + }, + { + "epoch": 0.41, + "learning_rate": 3.370579587574955e-06, + "loss": 1.1855, + "step": 13450 + }, + { + "epoch": 0.41, + "learning_rate": 3.3703509307189036e-06, + "loss": 1.1822, + "step": 13451 + }, + { + "epoch": 0.41, + "learning_rate": 3.3701222655775294e-06, + "loss": 1.1879, + "step": 13452 + }, + { + "epoch": 0.41, + "learning_rate": 3.369893592153011e-06, + "loss": 1.2003, + "step": 13453 + }, + { + "epoch": 0.41, + "learning_rate": 3.3696649104475244e-06, + "loss": 1.0402, + "step": 13454 + }, + { + "epoch": 0.41, + "learning_rate": 3.369436220463247e-06, + "loss": 1.167, + "step": 13455 + }, + { + "epoch": 0.41, + "learning_rate": 3.3692075222023547e-06, + "loss": 1.1839, + "step": 13456 + }, + { + "epoch": 0.41, + "learning_rate": 3.368978815667026e-06, + "loss": 1.0717, + "step": 13457 + }, + { + "epoch": 0.41, + "learning_rate": 3.368750100859437e-06, + "loss": 1.114, + "step": 13458 + }, + { + "epoch": 0.41, + "learning_rate": 3.368521377781766e-06, + "loss": 1.1646, + "step": 13459 + }, + { + "epoch": 0.41, + "learning_rate": 3.368292646436189e-06, + "loss": 1.2875, + "step": 13460 + }, + { + "epoch": 0.41, + "learning_rate": 3.368063906824885e-06, + "loss": 1.2069, + "step": 13461 + }, + { + "epoch": 0.41, + "learning_rate": 3.36783515895003e-06, + "loss": 1.2393, + "step": 13462 + }, + { + "epoch": 0.41, + "learning_rate": 3.367606402813802e-06, + "loss": 1.1746, + "step": 13463 + }, + { + "epoch": 0.41, + "learning_rate": 3.36737763841838e-06, + "loss": 1.0947, + "step": 13464 + }, + { + "epoch": 0.41, + "learning_rate": 3.36714886576594e-06, + "loss": 1.1276, + "step": 13465 + }, + { + "epoch": 0.41, + "learning_rate": 3.3669200848586613e-06, + "loss": 1.1703, + "step": 13466 + }, + { + "epoch": 0.41, + "learning_rate": 3.3666912956987198e-06, + "loss": 1.2055, + "step": 13467 + }, + { + "epoch": 0.41, + "learning_rate": 3.3664624982882953e-06, + "loss": 1.2019, + "step": 13468 + }, + { + "epoch": 0.41, + "learning_rate": 3.3662336926295647e-06, + "loss": 1.1453, + "step": 13469 + }, + { + "epoch": 0.41, + "learning_rate": 3.3660048787247067e-06, + "loss": 1.1703, + "step": 13470 + }, + { + "epoch": 0.41, + "learning_rate": 3.365776056575899e-06, + "loss": 1.1131, + "step": 13471 + }, + { + "epoch": 0.41, + "learning_rate": 3.3655472261853213e-06, + "loss": 1.0697, + "step": 13472 + }, + { + "epoch": 0.41, + "learning_rate": 3.3653183875551497e-06, + "loss": 1.0984, + "step": 13473 + }, + { + "epoch": 0.41, + "learning_rate": 3.3650895406875637e-06, + "loss": 1.114, + "step": 13474 + }, + { + "epoch": 0.41, + "learning_rate": 3.364860685584742e-06, + "loss": 1.1841, + "step": 13475 + }, + { + "epoch": 0.41, + "learning_rate": 3.3646318222488633e-06, + "loss": 1.0691, + "step": 13476 + }, + { + "epoch": 0.41, + "learning_rate": 3.364402950682107e-06, + "loss": 0.996, + "step": 13477 + }, + { + "epoch": 0.41, + "learning_rate": 3.36417407088665e-06, + "loss": 1.0586, + "step": 13478 + }, + { + "epoch": 0.41, + "learning_rate": 3.3639451828646723e-06, + "loss": 1.1009, + "step": 13479 + }, + { + "epoch": 0.41, + "learning_rate": 3.363716286618352e-06, + "loss": 1.2298, + "step": 13480 + }, + { + "epoch": 0.41, + "learning_rate": 3.3634873821498696e-06, + "loss": 1.2118, + "step": 13481 + }, + { + "epoch": 0.41, + "learning_rate": 3.363258469461402e-06, + "loss": 1.01, + "step": 13482 + }, + { + "epoch": 0.41, + "learning_rate": 3.3630295485551313e-06, + "loss": 1.1282, + "step": 13483 + }, + { + "epoch": 0.41, + "learning_rate": 3.3628006194332337e-06, + "loss": 1.1766, + "step": 13484 + }, + { + "epoch": 0.41, + "learning_rate": 3.3625716820978897e-06, + "loss": 1.2213, + "step": 13485 + }, + { + "epoch": 0.41, + "learning_rate": 3.362342736551279e-06, + "loss": 1.1365, + "step": 13486 + }, + { + "epoch": 0.41, + "learning_rate": 3.36211378279558e-06, + "loss": 1.223, + "step": 13487 + }, + { + "epoch": 0.41, + "learning_rate": 3.3618848208329747e-06, + "loss": 1.1477, + "step": 13488 + }, + { + "epoch": 0.41, + "learning_rate": 3.3616558506656392e-06, + "loss": 1.0653, + "step": 13489 + }, + { + "epoch": 0.41, + "learning_rate": 3.3614268722957553e-06, + "loss": 1.1066, + "step": 13490 + }, + { + "epoch": 0.41, + "learning_rate": 3.3611978857255036e-06, + "loss": 1.1211, + "step": 13491 + }, + { + "epoch": 0.41, + "learning_rate": 3.3609688909570622e-06, + "loss": 1.1057, + "step": 13492 + }, + { + "epoch": 0.41, + "learning_rate": 3.360739887992611e-06, + "loss": 1.0656, + "step": 13493 + }, + { + "epoch": 0.41, + "learning_rate": 3.360510876834332e-06, + "loss": 1.1227, + "step": 13494 + }, + { + "epoch": 0.41, + "learning_rate": 3.3602818574844024e-06, + "loss": 1.0872, + "step": 13495 + }, + { + "epoch": 0.41, + "learning_rate": 3.3600528299450047e-06, + "loss": 1.1631, + "step": 13496 + }, + { + "epoch": 0.41, + "learning_rate": 3.3598237942183182e-06, + "loss": 1.0946, + "step": 13497 + }, + { + "epoch": 0.41, + "learning_rate": 3.3595947503065236e-06, + "loss": 0.9503, + "step": 13498 + }, + { + "epoch": 0.41, + "learning_rate": 3.3593656982118e-06, + "loss": 1.02, + "step": 13499 + }, + { + "epoch": 0.41, + "learning_rate": 3.35913663793633e-06, + "loss": 1.1342, + "step": 13500 + }, + { + "epoch": 0.41, + "learning_rate": 3.3589075694822916e-06, + "loss": 1.1108, + "step": 13501 + }, + { + "epoch": 0.41, + "learning_rate": 3.3586784928518674e-06, + "loss": 1.127, + "step": 13502 + }, + { + "epoch": 0.41, + "learning_rate": 3.3584494080472373e-06, + "loss": 1.0761, + "step": 13503 + }, + { + "epoch": 0.41, + "learning_rate": 3.358220315070583e-06, + "loss": 1.0953, + "step": 13504 + }, + { + "epoch": 0.41, + "learning_rate": 3.3579912139240846e-06, + "loss": 1.155, + "step": 13505 + }, + { + "epoch": 0.41, + "learning_rate": 3.3577621046099218e-06, + "loss": 1.0305, + "step": 13506 + }, + { + "epoch": 0.41, + "learning_rate": 3.3575329871302787e-06, + "loss": 1.2662, + "step": 13507 + }, + { + "epoch": 0.41, + "learning_rate": 3.357303861487333e-06, + "loss": 1.0782, + "step": 13508 + }, + { + "epoch": 0.41, + "learning_rate": 3.3570747276832684e-06, + "loss": 1.1178, + "step": 13509 + }, + { + "epoch": 0.41, + "learning_rate": 3.3568455857202646e-06, + "loss": 1.1706, + "step": 13510 + }, + { + "epoch": 0.41, + "learning_rate": 3.356616435600504e-06, + "loss": 1.1923, + "step": 13511 + }, + { + "epoch": 0.41, + "learning_rate": 3.3563872773261675e-06, + "loss": 1.1638, + "step": 13512 + }, + { + "epoch": 0.41, + "learning_rate": 3.356158110899437e-06, + "loss": 1.1497, + "step": 13513 + }, + { + "epoch": 0.41, + "learning_rate": 3.3559289363224924e-06, + "loss": 1.2426, + "step": 13514 + }, + { + "epoch": 0.41, + "learning_rate": 3.3556997535975167e-06, + "loss": 1.1464, + "step": 13515 + }, + { + "epoch": 0.41, + "learning_rate": 3.3554705627266916e-06, + "loss": 1.1197, + "step": 13516 + }, + { + "epoch": 0.41, + "learning_rate": 3.3552413637121987e-06, + "loss": 1.0822, + "step": 13517 + }, + { + "epoch": 0.41, + "learning_rate": 3.3550121565562204e-06, + "loss": 1.2084, + "step": 13518 + }, + { + "epoch": 0.41, + "learning_rate": 3.3547829412609377e-06, + "loss": 1.1492, + "step": 13519 + }, + { + "epoch": 0.41, + "learning_rate": 3.3545537178285343e-06, + "loss": 1.1205, + "step": 13520 + }, + { + "epoch": 0.41, + "learning_rate": 3.3543244862611897e-06, + "loss": 1.059, + "step": 13521 + }, + { + "epoch": 0.41, + "learning_rate": 3.3540952465610883e-06, + "loss": 1.2195, + "step": 13522 + }, + { + "epoch": 0.41, + "learning_rate": 3.353865998730411e-06, + "loss": 1.0473, + "step": 13523 + }, + { + "epoch": 0.41, + "learning_rate": 3.353636742771341e-06, + "loss": 1.1906, + "step": 13524 + }, + { + "epoch": 0.41, + "learning_rate": 3.353407478686059e-06, + "loss": 1.0538, + "step": 13525 + }, + { + "epoch": 0.41, + "learning_rate": 3.353178206476751e-06, + "loss": 1.1283, + "step": 13526 + }, + { + "epoch": 0.41, + "learning_rate": 3.352948926145596e-06, + "loss": 1.2272, + "step": 13527 + }, + { + "epoch": 0.41, + "learning_rate": 3.352719637694778e-06, + "loss": 1.1738, + "step": 13528 + }, + { + "epoch": 0.41, + "learning_rate": 3.3524903411264803e-06, + "loss": 1.1375, + "step": 13529 + }, + { + "epoch": 0.41, + "learning_rate": 3.352261036442884e-06, + "loss": 1.2032, + "step": 13530 + }, + { + "epoch": 0.41, + "learning_rate": 3.352031723646174e-06, + "loss": 1.0922, + "step": 13531 + }, + { + "epoch": 0.41, + "learning_rate": 3.351802402738532e-06, + "loss": 1.0819, + "step": 13532 + }, + { + "epoch": 0.41, + "learning_rate": 3.351573073722142e-06, + "loss": 1.1781, + "step": 13533 + }, + { + "epoch": 0.41, + "learning_rate": 3.3513437365991863e-06, + "loss": 1.159, + "step": 13534 + }, + { + "epoch": 0.41, + "learning_rate": 3.351114391371848e-06, + "loss": 1.1426, + "step": 13535 + }, + { + "epoch": 0.41, + "learning_rate": 3.3508850380423107e-06, + "loss": 1.1613, + "step": 13536 + }, + { + "epoch": 0.41, + "learning_rate": 3.3506556766127577e-06, + "loss": 1.0342, + "step": 13537 + }, + { + "epoch": 0.41, + "learning_rate": 3.350426307085372e-06, + "loss": 1.0474, + "step": 13538 + }, + { + "epoch": 0.41, + "learning_rate": 3.350196929462338e-06, + "loss": 1.101, + "step": 13539 + }, + { + "epoch": 0.41, + "learning_rate": 3.3499675437458386e-06, + "loss": 1.184, + "step": 13540 + }, + { + "epoch": 0.41, + "learning_rate": 3.3497381499380565e-06, + "loss": 1.173, + "step": 13541 + }, + { + "epoch": 0.41, + "learning_rate": 3.349508748041178e-06, + "loss": 1.0352, + "step": 13542 + }, + { + "epoch": 0.41, + "learning_rate": 3.349279338057384e-06, + "loss": 1.2174, + "step": 13543 + }, + { + "epoch": 0.41, + "learning_rate": 3.3490499199888605e-06, + "loss": 1.059, + "step": 13544 + }, + { + "epoch": 0.41, + "learning_rate": 3.3488204938377907e-06, + "loss": 1.1484, + "step": 13545 + }, + { + "epoch": 0.41, + "learning_rate": 3.3485910596063586e-06, + "loss": 1.1479, + "step": 13546 + }, + { + "epoch": 0.41, + "learning_rate": 3.3483616172967474e-06, + "loss": 1.0712, + "step": 13547 + }, + { + "epoch": 0.41, + "learning_rate": 3.3481321669111434e-06, + "loss": 1.1406, + "step": 13548 + }, + { + "epoch": 0.41, + "learning_rate": 3.347902708451729e-06, + "loss": 1.195, + "step": 13549 + }, + { + "epoch": 0.41, + "learning_rate": 3.3476732419206896e-06, + "loss": 1.1292, + "step": 13550 + }, + { + "epoch": 0.41, + "learning_rate": 3.3474437673202085e-06, + "loss": 1.0306, + "step": 13551 + }, + { + "epoch": 0.41, + "learning_rate": 3.3472142846524725e-06, + "loss": 1.145, + "step": 13552 + }, + { + "epoch": 0.41, + "learning_rate": 3.346984793919663e-06, + "loss": 1.1001, + "step": 13553 + }, + { + "epoch": 0.41, + "learning_rate": 3.3467552951239667e-06, + "loss": 1.138, + "step": 13554 + }, + { + "epoch": 0.41, + "learning_rate": 3.346525788267567e-06, + "loss": 1.1459, + "step": 13555 + }, + { + "epoch": 0.41, + "learning_rate": 3.3462962733526507e-06, + "loss": 1.1909, + "step": 13556 + }, + { + "epoch": 0.41, + "learning_rate": 3.3460667503814e-06, + "loss": 1.1926, + "step": 13557 + }, + { + "epoch": 0.41, + "learning_rate": 3.3458372193560023e-06, + "loss": 1.1949, + "step": 13558 + }, + { + "epoch": 0.41, + "learning_rate": 3.3456076802786418e-06, + "loss": 1.1543, + "step": 13559 + }, + { + "epoch": 0.41, + "learning_rate": 3.3453781331515032e-06, + "loss": 1.1672, + "step": 13560 + }, + { + "epoch": 0.41, + "learning_rate": 3.3451485779767724e-06, + "loss": 1.1769, + "step": 13561 + }, + { + "epoch": 0.41, + "learning_rate": 3.3449190147566334e-06, + "loss": 1.1567, + "step": 13562 + }, + { + "epoch": 0.41, + "learning_rate": 3.344689443493273e-06, + "loss": 1.1207, + "step": 13563 + }, + { + "epoch": 0.41, + "learning_rate": 3.3444598641888752e-06, + "loss": 1.0082, + "step": 13564 + }, + { + "epoch": 0.41, + "learning_rate": 3.344230276845627e-06, + "loss": 1.0852, + "step": 13565 + }, + { + "epoch": 0.41, + "learning_rate": 3.344000681465712e-06, + "loss": 1.1243, + "step": 13566 + }, + { + "epoch": 0.41, + "learning_rate": 3.3437710780513183e-06, + "loss": 1.2344, + "step": 13567 + }, + { + "epoch": 0.41, + "learning_rate": 3.3435414666046296e-06, + "loss": 1.2616, + "step": 13568 + }, + { + "epoch": 0.41, + "learning_rate": 3.3433118471278326e-06, + "loss": 1.2651, + "step": 13569 + }, + { + "epoch": 0.41, + "learning_rate": 3.343082219623113e-06, + "loss": 1.1456, + "step": 13570 + }, + { + "epoch": 0.41, + "learning_rate": 3.3428525840926562e-06, + "loss": 1.1747, + "step": 13571 + }, + { + "epoch": 0.41, + "learning_rate": 3.342622940538649e-06, + "loss": 1.1849, + "step": 13572 + }, + { + "epoch": 0.41, + "learning_rate": 3.342393288963277e-06, + "loss": 1.1105, + "step": 13573 + }, + { + "epoch": 0.41, + "learning_rate": 3.3421636293687275e-06, + "loss": 1.2181, + "step": 13574 + }, + { + "epoch": 0.41, + "learning_rate": 3.341933961757185e-06, + "loss": 1.1926, + "step": 13575 + }, + { + "epoch": 0.41, + "learning_rate": 3.3417042861308376e-06, + "loss": 1.095, + "step": 13576 + }, + { + "epoch": 0.41, + "learning_rate": 3.34147460249187e-06, + "loss": 1.1272, + "step": 13577 + }, + { + "epoch": 0.41, + "learning_rate": 3.3412449108424695e-06, + "loss": 1.1195, + "step": 13578 + }, + { + "epoch": 0.41, + "learning_rate": 3.3410152111848227e-06, + "loss": 1.1477, + "step": 13579 + }, + { + "epoch": 0.41, + "learning_rate": 3.340785503521116e-06, + "loss": 1.004, + "step": 13580 + }, + { + "epoch": 0.41, + "learning_rate": 3.3405557878535365e-06, + "loss": 1.2321, + "step": 13581 + }, + { + "epoch": 0.41, + "learning_rate": 3.3403260641842704e-06, + "loss": 1.1039, + "step": 13582 + }, + { + "epoch": 0.41, + "learning_rate": 3.3400963325155058e-06, + "loss": 1.0716, + "step": 13583 + }, + { + "epoch": 0.41, + "learning_rate": 3.3398665928494274e-06, + "loss": 0.9949, + "step": 13584 + }, + { + "epoch": 0.41, + "learning_rate": 3.3396368451882237e-06, + "loss": 1.1141, + "step": 13585 + }, + { + "epoch": 0.41, + "learning_rate": 3.3394070895340817e-06, + "loss": 1.2484, + "step": 13586 + }, + { + "epoch": 0.41, + "learning_rate": 3.3391773258891897e-06, + "loss": 1.2073, + "step": 13587 + }, + { + "epoch": 0.41, + "learning_rate": 3.3389475542557326e-06, + "loss": 1.0826, + "step": 13588 + }, + { + "epoch": 0.41, + "learning_rate": 3.3387177746358988e-06, + "loss": 1.0333, + "step": 13589 + }, + { + "epoch": 0.41, + "learning_rate": 3.3384879870318764e-06, + "loss": 1.1254, + "step": 13590 + }, + { + "epoch": 0.41, + "learning_rate": 3.3382581914458522e-06, + "loss": 0.9973, + "step": 13591 + }, + { + "epoch": 0.41, + "learning_rate": 3.338028387880013e-06, + "loss": 1.2757, + "step": 13592 + }, + { + "epoch": 0.41, + "learning_rate": 3.3377985763365477e-06, + "loss": 1.0663, + "step": 13593 + }, + { + "epoch": 0.41, + "learning_rate": 3.337568756817643e-06, + "loss": 0.9921, + "step": 13594 + }, + { + "epoch": 0.41, + "learning_rate": 3.337338929325487e-06, + "loss": 1.1827, + "step": 13595 + }, + { + "epoch": 0.41, + "learning_rate": 3.3371090938622686e-06, + "loss": 1.1663, + "step": 13596 + }, + { + "epoch": 0.41, + "learning_rate": 3.336879250430174e-06, + "loss": 1.1044, + "step": 13597 + }, + { + "epoch": 0.41, + "learning_rate": 3.336649399031392e-06, + "loss": 1.1277, + "step": 13598 + }, + { + "epoch": 0.41, + "learning_rate": 3.336419539668111e-06, + "loss": 1.1132, + "step": 13599 + }, + { + "epoch": 0.41, + "learning_rate": 3.336189672342519e-06, + "loss": 1.1026, + "step": 13600 + }, + { + "epoch": 0.41, + "learning_rate": 3.335959797056804e-06, + "loss": 1.1508, + "step": 13601 + }, + { + "epoch": 0.41, + "learning_rate": 3.335729913813154e-06, + "loss": 1.197, + "step": 13602 + }, + { + "epoch": 0.41, + "learning_rate": 3.3355000226137575e-06, + "loss": 1.1175, + "step": 13603 + }, + { + "epoch": 0.41, + "learning_rate": 3.3352701234608035e-06, + "loss": 1.164, + "step": 13604 + }, + { + "epoch": 0.41, + "learning_rate": 3.3350402163564798e-06, + "loss": 1.0899, + "step": 13605 + }, + { + "epoch": 0.41, + "learning_rate": 3.3348103013029763e-06, + "loss": 1.1204, + "step": 13606 + }, + { + "epoch": 0.41, + "learning_rate": 3.33458037830248e-06, + "loss": 1.2388, + "step": 13607 + }, + { + "epoch": 0.41, + "learning_rate": 3.334350447357181e-06, + "loss": 1.139, + "step": 13608 + }, + { + "epoch": 0.41, + "learning_rate": 3.3341205084692675e-06, + "loss": 1.1727, + "step": 13609 + }, + { + "epoch": 0.41, + "learning_rate": 3.3338905616409277e-06, + "loss": 1.1639, + "step": 13610 + }, + { + "epoch": 0.41, + "learning_rate": 3.3336606068743523e-06, + "loss": 1.1589, + "step": 13611 + }, + { + "epoch": 0.41, + "learning_rate": 3.333430644171729e-06, + "loss": 1.122, + "step": 13612 + }, + { + "epoch": 0.41, + "learning_rate": 3.3332006735352472e-06, + "loss": 1.1958, + "step": 13613 + }, + { + "epoch": 0.41, + "learning_rate": 3.3329706949670964e-06, + "loss": 1.0426, + "step": 13614 + }, + { + "epoch": 0.41, + "learning_rate": 3.3327407084694665e-06, + "loss": 1.1425, + "step": 13615 + }, + { + "epoch": 0.41, + "learning_rate": 3.332510714044545e-06, + "loss": 1.0942, + "step": 13616 + }, + { + "epoch": 0.41, + "learning_rate": 3.3322807116945233e-06, + "loss": 1.1105, + "step": 13617 + }, + { + "epoch": 0.41, + "learning_rate": 3.3320507014215895e-06, + "loss": 1.1187, + "step": 13618 + }, + { + "epoch": 0.41, + "learning_rate": 3.3318206832279342e-06, + "loss": 1.136, + "step": 13619 + }, + { + "epoch": 0.41, + "learning_rate": 3.3315906571157465e-06, + "loss": 1.0947, + "step": 13620 + }, + { + "epoch": 0.41, + "learning_rate": 3.331360623087216e-06, + "loss": 1.1441, + "step": 13621 + }, + { + "epoch": 0.41, + "learning_rate": 3.331130581144533e-06, + "loss": 1.1425, + "step": 13622 + }, + { + "epoch": 0.41, + "learning_rate": 3.330900531289887e-06, + "loss": 1.2042, + "step": 13623 + }, + { + "epoch": 0.41, + "learning_rate": 3.3306704735254684e-06, + "loss": 1.1824, + "step": 13624 + }, + { + "epoch": 0.41, + "learning_rate": 3.330440407853467e-06, + "loss": 1.0788, + "step": 13625 + }, + { + "epoch": 0.41, + "learning_rate": 3.3302103342760717e-06, + "loss": 1.2662, + "step": 13626 + }, + { + "epoch": 0.41, + "learning_rate": 3.329980252795475e-06, + "loss": 1.1013, + "step": 13627 + }, + { + "epoch": 0.41, + "learning_rate": 3.3297501634138663e-06, + "loss": 1.0694, + "step": 13628 + }, + { + "epoch": 0.41, + "learning_rate": 3.329520066133435e-06, + "loss": 1.1138, + "step": 13629 + }, + { + "epoch": 0.41, + "learning_rate": 3.3292899609563722e-06, + "loss": 0.9988, + "step": 13630 + }, + { + "epoch": 0.41, + "learning_rate": 3.3290598478848684e-06, + "loss": 1.1514, + "step": 13631 + }, + { + "epoch": 0.41, + "learning_rate": 3.3288297269211147e-06, + "loss": 1.1294, + "step": 13632 + }, + { + "epoch": 0.41, + "learning_rate": 3.3285995980673004e-06, + "loss": 1.1084, + "step": 13633 + }, + { + "epoch": 0.41, + "learning_rate": 3.3283694613256167e-06, + "loss": 1.1257, + "step": 13634 + }, + { + "epoch": 0.41, + "learning_rate": 3.3281393166982557e-06, + "loss": 1.1463, + "step": 13635 + }, + { + "epoch": 0.41, + "learning_rate": 3.3279091641874066e-06, + "loss": 1.1675, + "step": 13636 + }, + { + "epoch": 0.41, + "learning_rate": 3.3276790037952624e-06, + "loss": 1.1917, + "step": 13637 + }, + { + "epoch": 0.41, + "learning_rate": 3.327448835524011e-06, + "loss": 1.1004, + "step": 13638 + }, + { + "epoch": 0.41, + "learning_rate": 3.3272186593758456e-06, + "loss": 1.244, + "step": 13639 + }, + { + "epoch": 0.41, + "learning_rate": 3.326988475352957e-06, + "loss": 1.0873, + "step": 13640 + }, + { + "epoch": 0.41, + "learning_rate": 3.3267582834575363e-06, + "loss": 1.1903, + "step": 13641 + }, + { + "epoch": 0.41, + "learning_rate": 3.3265280836917754e-06, + "loss": 1.1769, + "step": 13642 + }, + { + "epoch": 0.41, + "learning_rate": 3.3262978760578652e-06, + "loss": 1.0928, + "step": 13643 + }, + { + "epoch": 0.41, + "learning_rate": 3.3260676605579967e-06, + "loss": 1.1235, + "step": 13644 + }, + { + "epoch": 0.41, + "learning_rate": 3.3258374371943625e-06, + "loss": 1.1172, + "step": 13645 + }, + { + "epoch": 0.41, + "learning_rate": 3.325607205969153e-06, + "loss": 1.0901, + "step": 13646 + }, + { + "epoch": 0.41, + "learning_rate": 3.325376966884561e-06, + "loss": 1.0919, + "step": 13647 + }, + { + "epoch": 0.41, + "learning_rate": 3.3251467199427772e-06, + "loss": 1.2144, + "step": 13648 + }, + { + "epoch": 0.41, + "learning_rate": 3.3249164651459942e-06, + "loss": 1.169, + "step": 13649 + }, + { + "epoch": 0.41, + "learning_rate": 3.3246862024964043e-06, + "loss": 1.271, + "step": 13650 + }, + { + "epoch": 0.41, + "learning_rate": 3.324455931996199e-06, + "loss": 1.1308, + "step": 13651 + }, + { + "epoch": 0.41, + "learning_rate": 3.324225653647569e-06, + "loss": 1.1581, + "step": 13652 + }, + { + "epoch": 0.41, + "learning_rate": 3.323995367452709e-06, + "loss": 1.1112, + "step": 13653 + }, + { + "epoch": 0.41, + "learning_rate": 3.32376507341381e-06, + "loss": 1.1279, + "step": 13654 + }, + { + "epoch": 0.41, + "learning_rate": 3.3235347715330633e-06, + "loss": 1.165, + "step": 13655 + }, + { + "epoch": 0.41, + "learning_rate": 3.323304461812663e-06, + "loss": 1.1489, + "step": 13656 + }, + { + "epoch": 0.41, + "learning_rate": 3.3230741442548004e-06, + "loss": 1.0748, + "step": 13657 + }, + { + "epoch": 0.41, + "learning_rate": 3.3228438188616685e-06, + "loss": 1.1227, + "step": 13658 + }, + { + "epoch": 0.41, + "learning_rate": 3.3226134856354596e-06, + "loss": 1.1476, + "step": 13659 + }, + { + "epoch": 0.41, + "learning_rate": 3.3223831445783672e-06, + "loss": 1.1823, + "step": 13660 + }, + { + "epoch": 0.41, + "learning_rate": 3.3221527956925825e-06, + "loss": 1.1268, + "step": 13661 + }, + { + "epoch": 0.41, + "learning_rate": 3.321922438980299e-06, + "loss": 1.1316, + "step": 13662 + }, + { + "epoch": 0.41, + "learning_rate": 3.3216920744437103e-06, + "loss": 1.0075, + "step": 13663 + }, + { + "epoch": 0.41, + "learning_rate": 3.3214617020850087e-06, + "loss": 1.1555, + "step": 13664 + }, + { + "epoch": 0.41, + "learning_rate": 3.3212313219063876e-06, + "loss": 1.1906, + "step": 13665 + }, + { + "epoch": 0.41, + "learning_rate": 3.321000933910039e-06, + "loss": 1.1473, + "step": 13666 + }, + { + "epoch": 0.41, + "learning_rate": 3.320770538098157e-06, + "loss": 1.1308, + "step": 13667 + }, + { + "epoch": 0.41, + "learning_rate": 3.320540134472935e-06, + "loss": 1.1985, + "step": 13668 + }, + { + "epoch": 0.41, + "learning_rate": 3.3203097230365664e-06, + "loss": 1.0612, + "step": 13669 + }, + { + "epoch": 0.41, + "learning_rate": 3.320079303791244e-06, + "loss": 1.2013, + "step": 13670 + }, + { + "epoch": 0.41, + "learning_rate": 3.3198488767391623e-06, + "loss": 1.0778, + "step": 13671 + }, + { + "epoch": 0.41, + "learning_rate": 3.3196184418825133e-06, + "loss": 1.1794, + "step": 13672 + }, + { + "epoch": 0.41, + "learning_rate": 3.3193879992234923e-06, + "loss": 1.0818, + "step": 13673 + }, + { + "epoch": 0.41, + "learning_rate": 3.3191575487642915e-06, + "loss": 1.1843, + "step": 13674 + }, + { + "epoch": 0.41, + "learning_rate": 3.3189270905071054e-06, + "loss": 1.1674, + "step": 13675 + }, + { + "epoch": 0.41, + "learning_rate": 3.318696624454128e-06, + "loss": 1.1201, + "step": 13676 + }, + { + "epoch": 0.41, + "learning_rate": 3.318466150607553e-06, + "loss": 1.1459, + "step": 13677 + }, + { + "epoch": 0.41, + "learning_rate": 3.3182356689695745e-06, + "loss": 1.1093, + "step": 13678 + }, + { + "epoch": 0.41, + "learning_rate": 3.318005179542386e-06, + "loss": 1.0835, + "step": 13679 + }, + { + "epoch": 0.41, + "learning_rate": 3.3177746823281826e-06, + "loss": 1.3038, + "step": 13680 + }, + { + "epoch": 0.41, + "learning_rate": 3.317544177329158e-06, + "loss": 1.0217, + "step": 13681 + }, + { + "epoch": 0.41, + "learning_rate": 3.317313664547507e-06, + "loss": 1.0784, + "step": 13682 + }, + { + "epoch": 0.41, + "learning_rate": 3.3170831439854224e-06, + "loss": 1.1624, + "step": 13683 + }, + { + "epoch": 0.41, + "learning_rate": 3.316852615645101e-06, + "loss": 1.1458, + "step": 13684 + }, + { + "epoch": 0.41, + "learning_rate": 3.316622079528735e-06, + "loss": 1.1046, + "step": 13685 + }, + { + "epoch": 0.41, + "learning_rate": 3.3163915356385214e-06, + "loss": 1.2263, + "step": 13686 + }, + { + "epoch": 0.41, + "learning_rate": 3.316160983976653e-06, + "loss": 1.1105, + "step": 13687 + }, + { + "epoch": 0.41, + "learning_rate": 3.3159304245453246e-06, + "loss": 1.1241, + "step": 13688 + }, + { + "epoch": 0.41, + "learning_rate": 3.3156998573467318e-06, + "loss": 1.0848, + "step": 13689 + }, + { + "epoch": 0.41, + "learning_rate": 3.3154692823830694e-06, + "loss": 1.1055, + "step": 13690 + }, + { + "epoch": 0.41, + "learning_rate": 3.315238699656532e-06, + "loss": 1.1706, + "step": 13691 + }, + { + "epoch": 0.41, + "learning_rate": 3.3150081091693152e-06, + "loss": 1.1014, + "step": 13692 + }, + { + "epoch": 0.41, + "learning_rate": 3.3147775109236136e-06, + "loss": 1.2067, + "step": 13693 + }, + { + "epoch": 0.41, + "learning_rate": 3.3145469049216223e-06, + "loss": 1.236, + "step": 13694 + }, + { + "epoch": 0.41, + "learning_rate": 3.314316291165537e-06, + "loss": 1.1801, + "step": 13695 + }, + { + "epoch": 0.41, + "learning_rate": 3.314085669657552e-06, + "loss": 1.0527, + "step": 13696 + }, + { + "epoch": 0.41, + "learning_rate": 3.313855040399865e-06, + "loss": 1.0903, + "step": 13697 + }, + { + "epoch": 0.41, + "learning_rate": 3.3136244033946687e-06, + "loss": 1.3207, + "step": 13698 + }, + { + "epoch": 0.41, + "learning_rate": 3.3133937586441604e-06, + "loss": 1.1545, + "step": 13699 + }, + { + "epoch": 0.41, + "learning_rate": 3.3131631061505352e-06, + "loss": 1.0759, + "step": 13700 + }, + { + "epoch": 0.41, + "learning_rate": 3.3129324459159886e-06, + "loss": 1.1086, + "step": 13701 + }, + { + "epoch": 0.41, + "learning_rate": 3.3127017779427172e-06, + "loss": 1.1605, + "step": 13702 + }, + { + "epoch": 0.41, + "learning_rate": 3.312471102232916e-06, + "loss": 1.1088, + "step": 13703 + }, + { + "epoch": 0.41, + "learning_rate": 3.3122404187887813e-06, + "loss": 1.0797, + "step": 13704 + }, + { + "epoch": 0.41, + "learning_rate": 3.3120097276125086e-06, + "loss": 1.1015, + "step": 13705 + }, + { + "epoch": 0.41, + "learning_rate": 3.311779028706295e-06, + "loss": 1.1368, + "step": 13706 + }, + { + "epoch": 0.41, + "learning_rate": 3.3115483220723355e-06, + "loss": 1.0693, + "step": 13707 + }, + { + "epoch": 0.41, + "learning_rate": 3.311317607712827e-06, + "loss": 1.1619, + "step": 13708 + }, + { + "epoch": 0.41, + "learning_rate": 3.3110868856299648e-06, + "loss": 1.065, + "step": 13709 + }, + { + "epoch": 0.41, + "learning_rate": 3.3108561558259476e-06, + "loss": 1.1396, + "step": 13710 + }, + { + "epoch": 0.41, + "learning_rate": 3.3106254183029695e-06, + "loss": 1.1796, + "step": 13711 + }, + { + "epoch": 0.41, + "learning_rate": 3.3103946730632286e-06, + "loss": 1.0057, + "step": 13712 + }, + { + "epoch": 0.41, + "learning_rate": 3.3101639201089196e-06, + "loss": 1.0549, + "step": 13713 + }, + { + "epoch": 0.41, + "learning_rate": 3.30993315944224e-06, + "loss": 1.1332, + "step": 13714 + }, + { + "epoch": 0.41, + "learning_rate": 3.309702391065388e-06, + "loss": 1.0016, + "step": 13715 + }, + { + "epoch": 0.41, + "learning_rate": 3.3094716149805588e-06, + "loss": 1.1519, + "step": 13716 + }, + { + "epoch": 0.41, + "learning_rate": 3.3092408311899497e-06, + "loss": 1.0935, + "step": 13717 + }, + { + "epoch": 0.41, + "learning_rate": 3.3090100396957576e-06, + "loss": 1.2168, + "step": 13718 + }, + { + "epoch": 0.41, + "learning_rate": 3.3087792405001802e-06, + "loss": 1.0977, + "step": 13719 + }, + { + "epoch": 0.41, + "learning_rate": 3.308548433605413e-06, + "loss": 1.1832, + "step": 13720 + }, + { + "epoch": 0.41, + "learning_rate": 3.308317619013654e-06, + "loss": 1.0873, + "step": 13721 + }, + { + "epoch": 0.41, + "learning_rate": 3.308086796727101e-06, + "loss": 1.0966, + "step": 13722 + }, + { + "epoch": 0.41, + "learning_rate": 3.307855966747951e-06, + "loss": 1.1636, + "step": 13723 + }, + { + "epoch": 0.41, + "learning_rate": 3.3076251290784004e-06, + "loss": 1.1019, + "step": 13724 + }, + { + "epoch": 0.41, + "learning_rate": 3.3073942837206484e-06, + "loss": 1.1126, + "step": 13725 + }, + { + "epoch": 0.41, + "learning_rate": 3.307163430676892e-06, + "loss": 1.1389, + "step": 13726 + }, + { + "epoch": 0.41, + "learning_rate": 3.3069325699493278e-06, + "loss": 1.1224, + "step": 13727 + }, + { + "epoch": 0.41, + "learning_rate": 3.3067017015401544e-06, + "loss": 0.9437, + "step": 13728 + }, + { + "epoch": 0.41, + "learning_rate": 3.3064708254515693e-06, + "loss": 1.2087, + "step": 13729 + }, + { + "epoch": 0.41, + "learning_rate": 3.3062399416857703e-06, + "loss": 1.1324, + "step": 13730 + }, + { + "epoch": 0.41, + "learning_rate": 3.3060090502449554e-06, + "loss": 1.2092, + "step": 13731 + }, + { + "epoch": 0.41, + "learning_rate": 3.3057781511313225e-06, + "loss": 1.1822, + "step": 13732 + }, + { + "epoch": 0.41, + "learning_rate": 3.30554724434707e-06, + "loss": 1.0439, + "step": 13733 + }, + { + "epoch": 0.41, + "learning_rate": 3.3053163298943946e-06, + "loss": 1.1251, + "step": 13734 + }, + { + "epoch": 0.41, + "learning_rate": 3.305085407775497e-06, + "loss": 1.2143, + "step": 13735 + }, + { + "epoch": 0.41, + "learning_rate": 3.3048544779925734e-06, + "loss": 1.1759, + "step": 13736 + }, + { + "epoch": 0.41, + "learning_rate": 3.3046235405478227e-06, + "loss": 1.1177, + "step": 13737 + }, + { + "epoch": 0.41, + "learning_rate": 3.3043925954434438e-06, + "loss": 1.1713, + "step": 13738 + }, + { + "epoch": 0.41, + "learning_rate": 3.304161642681634e-06, + "loss": 1.0344, + "step": 13739 + }, + { + "epoch": 0.41, + "learning_rate": 3.303930682264594e-06, + "loss": 1.0723, + "step": 13740 + }, + { + "epoch": 0.41, + "learning_rate": 3.3036997141945197e-06, + "loss": 1.1417, + "step": 13741 + }, + { + "epoch": 0.41, + "learning_rate": 3.303468738473612e-06, + "loss": 1.0917, + "step": 13742 + }, + { + "epoch": 0.41, + "learning_rate": 3.303237755104069e-06, + "loss": 1.161, + "step": 13743 + }, + { + "epoch": 0.41, + "learning_rate": 3.303006764088089e-06, + "loss": 1.1276, + "step": 13744 + }, + { + "epoch": 0.41, + "learning_rate": 3.3027757654278715e-06, + "loss": 1.2436, + "step": 13745 + }, + { + "epoch": 0.41, + "learning_rate": 3.3025447591256154e-06, + "loss": 1.0299, + "step": 13746 + }, + { + "epoch": 0.41, + "learning_rate": 3.3023137451835198e-06, + "loss": 1.065, + "step": 13747 + }, + { + "epoch": 0.41, + "learning_rate": 3.3020827236037835e-06, + "loss": 1.0447, + "step": 13748 + }, + { + "epoch": 0.41, + "learning_rate": 3.301851694388606e-06, + "loss": 1.12, + "step": 13749 + }, + { + "epoch": 0.41, + "learning_rate": 3.301620657540186e-06, + "loss": 1.1693, + "step": 13750 + }, + { + "epoch": 0.41, + "learning_rate": 3.3013896130607244e-06, + "loss": 1.1627, + "step": 13751 + }, + { + "epoch": 0.41, + "learning_rate": 3.301158560952419e-06, + "loss": 0.9606, + "step": 13752 + }, + { + "epoch": 0.41, + "learning_rate": 3.3009275012174704e-06, + "loss": 1.007, + "step": 13753 + }, + { + "epoch": 0.41, + "learning_rate": 3.300696433858077e-06, + "loss": 1.1345, + "step": 13754 + }, + { + "epoch": 0.41, + "learning_rate": 3.3004653588764397e-06, + "loss": 1.2297, + "step": 13755 + }, + { + "epoch": 0.41, + "learning_rate": 3.300234276274758e-06, + "loss": 1.0969, + "step": 13756 + }, + { + "epoch": 0.41, + "learning_rate": 3.3000031860552313e-06, + "loss": 1.1589, + "step": 13757 + }, + { + "epoch": 0.41, + "learning_rate": 3.2997720882200597e-06, + "loss": 1.0482, + "step": 13758 + }, + { + "epoch": 0.41, + "learning_rate": 3.299540982771442e-06, + "loss": 1.1629, + "step": 13759 + }, + { + "epoch": 0.41, + "learning_rate": 3.2993098697115805e-06, + "loss": 1.118, + "step": 13760 + }, + { + "epoch": 0.41, + "learning_rate": 3.299078749042673e-06, + "loss": 1.2317, + "step": 13761 + }, + { + "epoch": 0.41, + "learning_rate": 3.2988476207669206e-06, + "loss": 1.2063, + "step": 13762 + }, + { + "epoch": 0.41, + "learning_rate": 3.2986164848865243e-06, + "loss": 1.1521, + "step": 13763 + }, + { + "epoch": 0.41, + "learning_rate": 3.2983853414036838e-06, + "loss": 1.2281, + "step": 13764 + }, + { + "epoch": 0.41, + "learning_rate": 3.2981541903205982e-06, + "loss": 1.0627, + "step": 13765 + }, + { + "epoch": 0.41, + "learning_rate": 3.2979230316394705e-06, + "loss": 1.2043, + "step": 13766 + }, + { + "epoch": 0.41, + "learning_rate": 3.297691865362499e-06, + "loss": 1.1003, + "step": 13767 + }, + { + "epoch": 0.41, + "learning_rate": 3.297460691491885e-06, + "loss": 1.1392, + "step": 13768 + }, + { + "epoch": 0.41, + "learning_rate": 3.29722951002983e-06, + "loss": 1.2401, + "step": 13769 + }, + { + "epoch": 0.41, + "learning_rate": 3.2969983209785337e-06, + "loss": 1.1727, + "step": 13770 + }, + { + "epoch": 0.41, + "learning_rate": 3.2967671243401978e-06, + "loss": 1.064, + "step": 13771 + }, + { + "epoch": 0.41, + "learning_rate": 3.296535920117022e-06, + "loss": 1.1916, + "step": 13772 + }, + { + "epoch": 0.41, + "learning_rate": 3.2963047083112078e-06, + "loss": 1.05, + "step": 13773 + }, + { + "epoch": 0.41, + "learning_rate": 3.296073488924956e-06, + "loss": 1.1381, + "step": 13774 + }, + { + "epoch": 0.41, + "learning_rate": 3.2958422619604678e-06, + "loss": 1.1453, + "step": 13775 + }, + { + "epoch": 0.42, + "learning_rate": 3.295611027419946e-06, + "loss": 1.2476, + "step": 13776 + }, + { + "epoch": 0.42, + "learning_rate": 3.2953797853055892e-06, + "loss": 1.1042, + "step": 13777 + }, + { + "epoch": 0.42, + "learning_rate": 3.2951485356196e-06, + "loss": 1.0844, + "step": 13778 + }, + { + "epoch": 0.42, + "learning_rate": 3.2949172783641803e-06, + "loss": 1.1296, + "step": 13779 + }, + { + "epoch": 0.42, + "learning_rate": 3.2946860135415306e-06, + "loss": 1.2281, + "step": 13780 + }, + { + "epoch": 0.42, + "learning_rate": 3.2944547411538517e-06, + "loss": 1.1001, + "step": 13781 + }, + { + "epoch": 0.42, + "learning_rate": 3.294223461203348e-06, + "loss": 1.1024, + "step": 13782 + }, + { + "epoch": 0.42, + "learning_rate": 3.2939921736922186e-06, + "loss": 1.1458, + "step": 13783 + }, + { + "epoch": 0.42, + "learning_rate": 3.2937608786226665e-06, + "loss": 1.0988, + "step": 13784 + }, + { + "epoch": 0.42, + "learning_rate": 3.293529575996893e-06, + "loss": 1.124, + "step": 13785 + }, + { + "epoch": 0.42, + "learning_rate": 3.2932982658171003e-06, + "loss": 1.2455, + "step": 13786 + }, + { + "epoch": 0.42, + "learning_rate": 3.29306694808549e-06, + "loss": 1.1589, + "step": 13787 + }, + { + "epoch": 0.42, + "learning_rate": 3.2928356228042644e-06, + "loss": 1.289, + "step": 13788 + }, + { + "epoch": 0.42, + "learning_rate": 3.292604289975625e-06, + "loss": 1.0418, + "step": 13789 + }, + { + "epoch": 0.42, + "learning_rate": 3.2923729496017746e-06, + "loss": 1.1246, + "step": 13790 + }, + { + "epoch": 0.42, + "learning_rate": 3.2921416016849157e-06, + "loss": 1.1846, + "step": 13791 + }, + { + "epoch": 0.42, + "learning_rate": 3.29191024622725e-06, + "loss": 1.2372, + "step": 13792 + }, + { + "epoch": 0.42, + "learning_rate": 3.2916788832309803e-06, + "loss": 1.219, + "step": 13793 + }, + { + "epoch": 0.42, + "learning_rate": 3.2914475126983087e-06, + "loss": 1.0831, + "step": 13794 + }, + { + "epoch": 0.42, + "learning_rate": 3.2912161346314387e-06, + "loss": 1.2308, + "step": 13795 + }, + { + "epoch": 0.42, + "learning_rate": 3.2909847490325713e-06, + "loss": 1.1187, + "step": 13796 + }, + { + "epoch": 0.42, + "learning_rate": 3.2907533559039106e-06, + "loss": 1.1421, + "step": 13797 + }, + { + "epoch": 0.42, + "learning_rate": 3.2905219552476587e-06, + "loss": 1.1304, + "step": 13798 + }, + { + "epoch": 0.42, + "learning_rate": 3.2902905470660184e-06, + "loss": 1.1917, + "step": 13799 + }, + { + "epoch": 0.42, + "learning_rate": 3.2900591313611924e-06, + "loss": 1.1331, + "step": 13800 + }, + { + "epoch": 0.42, + "learning_rate": 3.2898277081353846e-06, + "loss": 1.1, + "step": 13801 + }, + { + "epoch": 0.42, + "learning_rate": 3.289596277390797e-06, + "loss": 1.0553, + "step": 13802 + }, + { + "epoch": 0.42, + "learning_rate": 3.2893648391296327e-06, + "loss": 1.2032, + "step": 13803 + }, + { + "epoch": 0.42, + "learning_rate": 3.289133393354096e-06, + "loss": 1.1746, + "step": 13804 + }, + { + "epoch": 0.42, + "learning_rate": 3.288901940066389e-06, + "loss": 1.0004, + "step": 13805 + }, + { + "epoch": 0.42, + "learning_rate": 3.288670479268716e-06, + "loss": 1.155, + "step": 13806 + }, + { + "epoch": 0.42, + "learning_rate": 3.2884390109632793e-06, + "loss": 1.1624, + "step": 13807 + }, + { + "epoch": 0.42, + "learning_rate": 3.2882075351522834e-06, + "loss": 1.1169, + "step": 13808 + }, + { + "epoch": 0.42, + "learning_rate": 3.2879760518379313e-06, + "loss": 1.1384, + "step": 13809 + }, + { + "epoch": 0.42, + "learning_rate": 3.287744561022427e-06, + "loss": 1.0988, + "step": 13810 + }, + { + "epoch": 0.42, + "learning_rate": 3.287513062707973e-06, + "loss": 1.2103, + "step": 13811 + }, + { + "epoch": 0.42, + "learning_rate": 3.287281556896775e-06, + "loss": 1.233, + "step": 13812 + }, + { + "epoch": 0.42, + "learning_rate": 3.2870500435910346e-06, + "loss": 1.2034, + "step": 13813 + }, + { + "epoch": 0.42, + "learning_rate": 3.2868185227929576e-06, + "loss": 1.127, + "step": 13814 + }, + { + "epoch": 0.42, + "learning_rate": 3.286586994504747e-06, + "loss": 1.0066, + "step": 13815 + }, + { + "epoch": 0.42, + "learning_rate": 3.2863554587286067e-06, + "loss": 1.009, + "step": 13816 + }, + { + "epoch": 0.42, + "learning_rate": 3.2861239154667416e-06, + "loss": 1.0598, + "step": 13817 + }, + { + "epoch": 0.42, + "learning_rate": 3.2858923647213553e-06, + "loss": 1.1949, + "step": 13818 + }, + { + "epoch": 0.42, + "learning_rate": 3.285660806494652e-06, + "loss": 0.9948, + "step": 13819 + }, + { + "epoch": 0.42, + "learning_rate": 3.285429240788836e-06, + "loss": 1.1487, + "step": 13820 + }, + { + "epoch": 0.42, + "learning_rate": 3.2851976676061127e-06, + "loss": 1.1069, + "step": 13821 + }, + { + "epoch": 0.42, + "learning_rate": 3.2849660869486853e-06, + "loss": 1.1035, + "step": 13822 + }, + { + "epoch": 0.42, + "learning_rate": 3.284734498818759e-06, + "loss": 1.1915, + "step": 13823 + }, + { + "epoch": 0.42, + "learning_rate": 3.2845029032185384e-06, + "loss": 1.1411, + "step": 13824 + }, + { + "epoch": 0.42, + "learning_rate": 3.284271300150228e-06, + "loss": 1.0331, + "step": 13825 + }, + { + "epoch": 0.42, + "learning_rate": 3.284039689616032e-06, + "loss": 1.2944, + "step": 13826 + }, + { + "epoch": 0.42, + "learning_rate": 3.2838080716181566e-06, + "loss": 1.1814, + "step": 13827 + }, + { + "epoch": 0.42, + "learning_rate": 3.283576446158805e-06, + "loss": 1.226, + "step": 13828 + }, + { + "epoch": 0.42, + "learning_rate": 3.2833448132401836e-06, + "loss": 1.1192, + "step": 13829 + }, + { + "epoch": 0.42, + "learning_rate": 3.283113172864496e-06, + "loss": 1.1959, + "step": 13830 + }, + { + "epoch": 0.42, + "learning_rate": 3.2828815250339484e-06, + "loss": 1.2065, + "step": 13831 + }, + { + "epoch": 0.42, + "learning_rate": 3.2826498697507457e-06, + "loss": 1.0792, + "step": 13832 + }, + { + "epoch": 0.42, + "learning_rate": 3.282418207017094e-06, + "loss": 1.1633, + "step": 13833 + }, + { + "epoch": 0.42, + "learning_rate": 3.282186536835197e-06, + "loss": 1.1077, + "step": 13834 + }, + { + "epoch": 0.42, + "learning_rate": 3.281954859207261e-06, + "loss": 1.1507, + "step": 13835 + }, + { + "epoch": 0.42, + "learning_rate": 3.2817231741354917e-06, + "loss": 1.0428, + "step": 13836 + }, + { + "epoch": 0.42, + "learning_rate": 3.2814914816220938e-06, + "loss": 1.2111, + "step": 13837 + }, + { + "epoch": 0.42, + "learning_rate": 3.281259781669274e-06, + "loss": 1.2024, + "step": 13838 + }, + { + "epoch": 0.42, + "learning_rate": 3.2810280742792367e-06, + "loss": 1.1454, + "step": 13839 + }, + { + "epoch": 0.42, + "learning_rate": 3.2807963594541893e-06, + "loss": 1.1187, + "step": 13840 + }, + { + "epoch": 0.42, + "learning_rate": 3.280564637196336e-06, + "loss": 1.1686, + "step": 13841 + }, + { + "epoch": 0.42, + "learning_rate": 3.280332907507883e-06, + "loss": 1.0681, + "step": 13842 + }, + { + "epoch": 0.42, + "learning_rate": 3.280101170391037e-06, + "loss": 1.1874, + "step": 13843 + }, + { + "epoch": 0.42, + "learning_rate": 3.2798694258480025e-06, + "loss": 1.1526, + "step": 13844 + }, + { + "epoch": 0.42, + "learning_rate": 3.2796376738809876e-06, + "loss": 1.0212, + "step": 13845 + }, + { + "epoch": 0.42, + "learning_rate": 3.2794059144921977e-06, + "loss": 1.1208, + "step": 13846 + }, + { + "epoch": 0.42, + "learning_rate": 3.279174147683838e-06, + "loss": 1.0827, + "step": 13847 + }, + { + "epoch": 0.42, + "learning_rate": 3.278942373458116e-06, + "loss": 1.1055, + "step": 13848 + }, + { + "epoch": 0.42, + "learning_rate": 3.2787105918172386e-06, + "loss": 1.2328, + "step": 13849 + }, + { + "epoch": 0.42, + "learning_rate": 3.2784788027634105e-06, + "loss": 1.1387, + "step": 13850 + }, + { + "epoch": 0.42, + "learning_rate": 3.27824700629884e-06, + "loss": 1.0402, + "step": 13851 + }, + { + "epoch": 0.42, + "learning_rate": 3.2780152024257316e-06, + "loss": 1.1561, + "step": 13852 + }, + { + "epoch": 0.42, + "learning_rate": 3.2777833911462942e-06, + "loss": 1.0251, + "step": 13853 + }, + { + "epoch": 0.42, + "learning_rate": 3.2775515724627327e-06, + "loss": 1.1055, + "step": 13854 + }, + { + "epoch": 0.42, + "learning_rate": 3.2773197463772556e-06, + "loss": 1.1989, + "step": 13855 + }, + { + "epoch": 0.42, + "learning_rate": 3.2770879128920685e-06, + "loss": 1.1075, + "step": 13856 + }, + { + "epoch": 0.42, + "learning_rate": 3.2768560720093786e-06, + "loss": 1.1351, + "step": 13857 + }, + { + "epoch": 0.42, + "learning_rate": 3.2766242237313926e-06, + "loss": 1.0368, + "step": 13858 + }, + { + "epoch": 0.42, + "learning_rate": 3.276392368060319e-06, + "loss": 1.1259, + "step": 13859 + }, + { + "epoch": 0.42, + "learning_rate": 3.276160504998363e-06, + "loss": 1.1285, + "step": 13860 + }, + { + "epoch": 0.42, + "learning_rate": 3.275928634547733e-06, + "loss": 1.2323, + "step": 13861 + }, + { + "epoch": 0.42, + "learning_rate": 3.275696756710637e-06, + "loss": 1.0825, + "step": 13862 + }, + { + "epoch": 0.42, + "learning_rate": 3.2754648714892805e-06, + "loss": 1.0646, + "step": 13863 + }, + { + "epoch": 0.42, + "learning_rate": 3.2752329788858728e-06, + "loss": 1.1639, + "step": 13864 + }, + { + "epoch": 0.42, + "learning_rate": 3.2750010789026194e-06, + "loss": 1.0489, + "step": 13865 + }, + { + "epoch": 0.42, + "learning_rate": 3.27476917154173e-06, + "loss": 1.1508, + "step": 13866 + }, + { + "epoch": 0.42, + "learning_rate": 3.274537256805411e-06, + "loss": 1.1083, + "step": 13867 + }, + { + "epoch": 0.42, + "learning_rate": 3.2743053346958696e-06, + "loss": 1.1479, + "step": 13868 + }, + { + "epoch": 0.42, + "learning_rate": 3.274073405215315e-06, + "loss": 1.1049, + "step": 13869 + }, + { + "epoch": 0.42, + "learning_rate": 3.2738414683659546e-06, + "loss": 1.1503, + "step": 13870 + }, + { + "epoch": 0.42, + "learning_rate": 3.2736095241499953e-06, + "loss": 1.1375, + "step": 13871 + }, + { + "epoch": 0.42, + "learning_rate": 3.2733775725696464e-06, + "loss": 1.0598, + "step": 13872 + }, + { + "epoch": 0.42, + "learning_rate": 3.2731456136271155e-06, + "loss": 1.0958, + "step": 13873 + }, + { + "epoch": 0.42, + "learning_rate": 3.2729136473246102e-06, + "loss": 1.1516, + "step": 13874 + }, + { + "epoch": 0.42, + "learning_rate": 3.27268167366434e-06, + "loss": 1.2678, + "step": 13875 + }, + { + "epoch": 0.42, + "learning_rate": 3.2724496926485118e-06, + "loss": 1.1888, + "step": 13876 + }, + { + "epoch": 0.42, + "learning_rate": 3.272217704279335e-06, + "loss": 1.134, + "step": 13877 + }, + { + "epoch": 0.42, + "learning_rate": 3.271985708559017e-06, + "loss": 1.0716, + "step": 13878 + }, + { + "epoch": 0.42, + "learning_rate": 3.271753705489768e-06, + "loss": 1.1605, + "step": 13879 + }, + { + "epoch": 0.42, + "learning_rate": 3.2715216950737947e-06, + "loss": 1.0585, + "step": 13880 + }, + { + "epoch": 0.42, + "learning_rate": 3.271289677313307e-06, + "loss": 1.1019, + "step": 13881 + }, + { + "epoch": 0.42, + "learning_rate": 3.271057652210512e-06, + "loss": 1.2464, + "step": 13882 + }, + { + "epoch": 0.42, + "learning_rate": 3.27082561976762e-06, + "loss": 1.0909, + "step": 13883 + }, + { + "epoch": 0.42, + "learning_rate": 3.2705935799868393e-06, + "loss": 1.1013, + "step": 13884 + }, + { + "epoch": 0.42, + "learning_rate": 3.2703615328703787e-06, + "loss": 1.1637, + "step": 13885 + }, + { + "epoch": 0.42, + "learning_rate": 3.2701294784204475e-06, + "loss": 1.1079, + "step": 13886 + }, + { + "epoch": 0.42, + "learning_rate": 3.269897416639254e-06, + "loss": 1.2158, + "step": 13887 + }, + { + "epoch": 0.42, + "learning_rate": 3.2696653475290085e-06, + "loss": 1.171, + "step": 13888 + }, + { + "epoch": 0.42, + "learning_rate": 3.2694332710919197e-06, + "loss": 1.0838, + "step": 13889 + }, + { + "epoch": 0.42, + "learning_rate": 3.2692011873301965e-06, + "loss": 1.2168, + "step": 13890 + }, + { + "epoch": 0.42, + "learning_rate": 3.2689690962460483e-06, + "loss": 1.1741, + "step": 13891 + }, + { + "epoch": 0.42, + "learning_rate": 3.2687369978416856e-06, + "loss": 1.2181, + "step": 13892 + }, + { + "epoch": 0.42, + "learning_rate": 3.2685048921193157e-06, + "loss": 1.1622, + "step": 13893 + }, + { + "epoch": 0.42, + "learning_rate": 3.26827277908115e-06, + "loss": 1.1461, + "step": 13894 + }, + { + "epoch": 0.42, + "learning_rate": 3.268040658729397e-06, + "loss": 1.1615, + "step": 13895 + }, + { + "epoch": 0.42, + "learning_rate": 3.2678085310662676e-06, + "loss": 1.0565, + "step": 13896 + }, + { + "epoch": 0.42, + "learning_rate": 3.2675763960939705e-06, + "loss": 1.1094, + "step": 13897 + }, + { + "epoch": 0.42, + "learning_rate": 3.2673442538147148e-06, + "loss": 1.1349, + "step": 13898 + }, + { + "epoch": 0.42, + "learning_rate": 3.2671121042307126e-06, + "loss": 1.1786, + "step": 13899 + }, + { + "epoch": 0.42, + "learning_rate": 3.266879947344172e-06, + "loss": 1.1794, + "step": 13900 + }, + { + "epoch": 0.42, + "learning_rate": 3.266647783157304e-06, + "loss": 1.0725, + "step": 13901 + }, + { + "epoch": 0.42, + "learning_rate": 3.2664156116723177e-06, + "loss": 1.0756, + "step": 13902 + }, + { + "epoch": 0.42, + "learning_rate": 3.266183432891425e-06, + "loss": 1.1404, + "step": 13903 + }, + { + "epoch": 0.42, + "learning_rate": 3.2659512468168342e-06, + "loss": 1.1177, + "step": 13904 + }, + { + "epoch": 0.42, + "learning_rate": 3.2657190534507565e-06, + "loss": 1.1741, + "step": 13905 + }, + { + "epoch": 0.42, + "learning_rate": 3.265486852795402e-06, + "loss": 1.2086, + "step": 13906 + }, + { + "epoch": 0.42, + "learning_rate": 3.265254644852982e-06, + "loss": 1.1106, + "step": 13907 + }, + { + "epoch": 0.42, + "learning_rate": 3.2650224296257062e-06, + "loss": 1.1655, + "step": 13908 + }, + { + "epoch": 0.42, + "learning_rate": 3.264790207115785e-06, + "loss": 1.122, + "step": 13909 + }, + { + "epoch": 0.42, + "learning_rate": 3.264557977325429e-06, + "loss": 1.1252, + "step": 13910 + }, + { + "epoch": 0.42, + "learning_rate": 3.2643257402568505e-06, + "loss": 1.1287, + "step": 13911 + }, + { + "epoch": 0.42, + "learning_rate": 3.264093495912258e-06, + "loss": 1.2737, + "step": 13912 + }, + { + "epoch": 0.42, + "learning_rate": 3.2638612442938635e-06, + "loss": 1.0862, + "step": 13913 + }, + { + "epoch": 0.42, + "learning_rate": 3.2636289854038776e-06, + "loss": 1.131, + "step": 13914 + }, + { + "epoch": 0.42, + "learning_rate": 3.263396719244512e-06, + "loss": 1.0198, + "step": 13915 + }, + { + "epoch": 0.42, + "learning_rate": 3.263164445817978e-06, + "loss": 1.0727, + "step": 13916 + }, + { + "epoch": 0.42, + "learning_rate": 3.2629321651264843e-06, + "loss": 1.1983, + "step": 13917 + }, + { + "epoch": 0.42, + "learning_rate": 3.262699877172246e-06, + "loss": 1.1134, + "step": 13918 + }, + { + "epoch": 0.42, + "learning_rate": 3.26246758195747e-06, + "loss": 1.1853, + "step": 13919 + }, + { + "epoch": 0.42, + "learning_rate": 3.2622352794843716e-06, + "loss": 1.1222, + "step": 13920 + }, + { + "epoch": 0.42, + "learning_rate": 3.262002969755159e-06, + "loss": 1.1766, + "step": 13921 + }, + { + "epoch": 0.42, + "learning_rate": 3.2617706527720465e-06, + "loss": 1.1608, + "step": 13922 + }, + { + "epoch": 0.42, + "learning_rate": 3.261538328537244e-06, + "loss": 1.1373, + "step": 13923 + }, + { + "epoch": 0.42, + "learning_rate": 3.2613059970529625e-06, + "loss": 1.0535, + "step": 13924 + }, + { + "epoch": 0.42, + "learning_rate": 3.2610736583214155e-06, + "loss": 1.0031, + "step": 13925 + }, + { + "epoch": 0.42, + "learning_rate": 3.260841312344813e-06, + "loss": 1.1212, + "step": 13926 + }, + { + "epoch": 0.42, + "learning_rate": 3.2606089591253674e-06, + "loss": 1.0627, + "step": 13927 + }, + { + "epoch": 0.42, + "learning_rate": 3.260376598665291e-06, + "loss": 1.1092, + "step": 13928 + }, + { + "epoch": 0.42, + "learning_rate": 3.2601442309667967e-06, + "loss": 1.2169, + "step": 13929 + }, + { + "epoch": 0.42, + "learning_rate": 3.2599118560320946e-06, + "loss": 1.1694, + "step": 13930 + }, + { + "epoch": 0.42, + "learning_rate": 3.259679473863398e-06, + "loss": 1.1624, + "step": 13931 + }, + { + "epoch": 0.42, + "learning_rate": 3.2594470844629185e-06, + "loss": 1.1234, + "step": 13932 + }, + { + "epoch": 0.42, + "learning_rate": 3.2592146878328685e-06, + "loss": 1.0806, + "step": 13933 + }, + { + "epoch": 0.42, + "learning_rate": 3.2589822839754603e-06, + "loss": 1.1169, + "step": 13934 + }, + { + "epoch": 0.42, + "learning_rate": 3.258749872892907e-06, + "loss": 1.0699, + "step": 13935 + }, + { + "epoch": 0.42, + "learning_rate": 3.258517454587419e-06, + "loss": 1.1573, + "step": 13936 + }, + { + "epoch": 0.42, + "learning_rate": 3.2582850290612113e-06, + "loss": 1.2712, + "step": 13937 + }, + { + "epoch": 0.42, + "learning_rate": 3.2580525963164945e-06, + "loss": 1.2386, + "step": 13938 + }, + { + "epoch": 0.42, + "learning_rate": 3.2578201563554818e-06, + "loss": 1.0767, + "step": 13939 + }, + { + "epoch": 0.42, + "learning_rate": 3.2575877091803864e-06, + "loss": 1.1285, + "step": 13940 + }, + { + "epoch": 0.42, + "learning_rate": 3.2573552547934217e-06, + "loss": 1.0687, + "step": 13941 + }, + { + "epoch": 0.42, + "learning_rate": 3.2571227931967993e-06, + "loss": 1.0438, + "step": 13942 + }, + { + "epoch": 0.42, + "learning_rate": 3.256890324392732e-06, + "loss": 1.2101, + "step": 13943 + }, + { + "epoch": 0.42, + "learning_rate": 3.2566578483834345e-06, + "loss": 1.157, + "step": 13944 + }, + { + "epoch": 0.42, + "learning_rate": 3.2564253651711175e-06, + "loss": 1.1058, + "step": 13945 + }, + { + "epoch": 0.42, + "learning_rate": 3.2561928747579963e-06, + "loss": 1.0874, + "step": 13946 + }, + { + "epoch": 0.42, + "learning_rate": 3.2559603771462826e-06, + "loss": 1.0768, + "step": 13947 + }, + { + "epoch": 0.42, + "learning_rate": 3.255727872338191e-06, + "loss": 1.0806, + "step": 13948 + }, + { + "epoch": 0.42, + "learning_rate": 3.255495360335933e-06, + "loss": 1.1392, + "step": 13949 + }, + { + "epoch": 0.42, + "learning_rate": 3.2552628411417236e-06, + "loss": 1.158, + "step": 13950 + }, + { + "epoch": 0.42, + "learning_rate": 3.255030314757775e-06, + "loss": 1.2177, + "step": 13951 + }, + { + "epoch": 0.42, + "learning_rate": 3.2547977811863024e-06, + "loss": 1.2103, + "step": 13952 + }, + { + "epoch": 0.42, + "learning_rate": 3.254565240429518e-06, + "loss": 1.182, + "step": 13953 + }, + { + "epoch": 0.42, + "learning_rate": 3.2543326924896358e-06, + "loss": 1.1174, + "step": 13954 + }, + { + "epoch": 0.42, + "learning_rate": 3.254100137368869e-06, + "loss": 1.2137, + "step": 13955 + }, + { + "epoch": 0.42, + "learning_rate": 3.2538675750694327e-06, + "loss": 1.2219, + "step": 13956 + }, + { + "epoch": 0.42, + "learning_rate": 3.2536350055935404e-06, + "loss": 1.1642, + "step": 13957 + }, + { + "epoch": 0.42, + "learning_rate": 3.2534024289434058e-06, + "loss": 1.1046, + "step": 13958 + }, + { + "epoch": 0.42, + "learning_rate": 3.253169845121243e-06, + "loss": 1.2551, + "step": 13959 + }, + { + "epoch": 0.42, + "learning_rate": 3.2529372541292658e-06, + "loss": 1.0981, + "step": 13960 + }, + { + "epoch": 0.42, + "learning_rate": 3.2527046559696882e-06, + "loss": 1.1583, + "step": 13961 + }, + { + "epoch": 0.42, + "learning_rate": 3.2524720506447253e-06, + "loss": 1.1055, + "step": 13962 + }, + { + "epoch": 0.42, + "learning_rate": 3.2522394381565915e-06, + "loss": 1.0175, + "step": 13963 + }, + { + "epoch": 0.42, + "learning_rate": 3.2520068185074993e-06, + "loss": 1.1382, + "step": 13964 + }, + { + "epoch": 0.42, + "learning_rate": 3.2517741916996653e-06, + "loss": 1.1293, + "step": 13965 + }, + { + "epoch": 0.42, + "learning_rate": 3.2515415577353025e-06, + "loss": 1.1483, + "step": 13966 + }, + { + "epoch": 0.42, + "learning_rate": 3.2513089166166254e-06, + "loss": 1.1649, + "step": 13967 + }, + { + "epoch": 0.42, + "learning_rate": 3.2510762683458503e-06, + "loss": 1.2555, + "step": 13968 + }, + { + "epoch": 0.42, + "learning_rate": 3.25084361292519e-06, + "loss": 1.1627, + "step": 13969 + }, + { + "epoch": 0.42, + "learning_rate": 3.2506109503568617e-06, + "loss": 1.0829, + "step": 13970 + }, + { + "epoch": 0.42, + "learning_rate": 3.2503782806430774e-06, + "loss": 1.0898, + "step": 13971 + }, + { + "epoch": 0.42, + "learning_rate": 3.2501456037860533e-06, + "loss": 1.2435, + "step": 13972 + }, + { + "epoch": 0.42, + "learning_rate": 3.249912919788005e-06, + "loss": 1.2594, + "step": 13973 + }, + { + "epoch": 0.42, + "learning_rate": 3.2496802286511463e-06, + "loss": 1.3842, + "step": 13974 + }, + { + "epoch": 0.42, + "learning_rate": 3.249447530377693e-06, + "loss": 1.0852, + "step": 13975 + }, + { + "epoch": 0.42, + "learning_rate": 3.24921482496986e-06, + "loss": 1.1573, + "step": 13976 + }, + { + "epoch": 0.42, + "learning_rate": 3.2489821124298633e-06, + "loss": 1.1047, + "step": 13977 + }, + { + "epoch": 0.42, + "learning_rate": 3.2487493927599172e-06, + "loss": 1.1625, + "step": 13978 + }, + { + "epoch": 0.42, + "learning_rate": 3.2485166659622376e-06, + "loss": 1.1904, + "step": 13979 + }, + { + "epoch": 0.42, + "learning_rate": 3.248283932039039e-06, + "loss": 1.1514, + "step": 13980 + }, + { + "epoch": 0.42, + "learning_rate": 3.2480511909925384e-06, + "loss": 1.1192, + "step": 13981 + }, + { + "epoch": 0.42, + "learning_rate": 3.247818442824951e-06, + "loss": 1.1276, + "step": 13982 + }, + { + "epoch": 0.42, + "learning_rate": 3.247585687538492e-06, + "loss": 1.2328, + "step": 13983 + }, + { + "epoch": 0.42, + "learning_rate": 3.247352925135377e-06, + "loss": 1.1169, + "step": 13984 + }, + { + "epoch": 0.42, + "learning_rate": 3.2471201556178226e-06, + "loss": 1.0502, + "step": 13985 + }, + { + "epoch": 0.42, + "learning_rate": 3.246887378988044e-06, + "loss": 1.1268, + "step": 13986 + }, + { + "epoch": 0.42, + "learning_rate": 3.2466545952482576e-06, + "loss": 1.2552, + "step": 13987 + }, + { + "epoch": 0.42, + "learning_rate": 3.2464218044006778e-06, + "loss": 1.0886, + "step": 13988 + }, + { + "epoch": 0.42, + "learning_rate": 3.246189006447523e-06, + "loss": 1.1395, + "step": 13989 + }, + { + "epoch": 0.42, + "learning_rate": 3.2459562013910084e-06, + "loss": 1.0376, + "step": 13990 + }, + { + "epoch": 0.42, + "learning_rate": 3.2457233892333497e-06, + "loss": 1.1329, + "step": 13991 + }, + { + "epoch": 0.42, + "learning_rate": 3.245490569976763e-06, + "loss": 1.086, + "step": 13992 + }, + { + "epoch": 0.42, + "learning_rate": 3.2452577436234656e-06, + "loss": 1.1937, + "step": 13993 + }, + { + "epoch": 0.42, + "learning_rate": 3.2450249101756736e-06, + "loss": 1.108, + "step": 13994 + }, + { + "epoch": 0.42, + "learning_rate": 3.2447920696356027e-06, + "loss": 1.1625, + "step": 13995 + }, + { + "epoch": 0.42, + "learning_rate": 3.24455922200547e-06, + "loss": 1.1168, + "step": 13996 + }, + { + "epoch": 0.42, + "learning_rate": 3.2443263672874923e-06, + "loss": 1.0825, + "step": 13997 + }, + { + "epoch": 0.42, + "learning_rate": 3.2440935054838862e-06, + "loss": 1.0559, + "step": 13998 + }, + { + "epoch": 0.42, + "learning_rate": 3.2438606365968685e-06, + "loss": 0.9066, + "step": 13999 + }, + { + "epoch": 0.42, + "learning_rate": 3.243627760628656e-06, + "loss": 1.1467, + "step": 14000 + }, + { + "epoch": 0.42, + "learning_rate": 3.2433948775814645e-06, + "loss": 1.2185, + "step": 14001 + }, + { + "epoch": 0.42, + "learning_rate": 3.2431619874575126e-06, + "loss": 1.0005, + "step": 14002 + }, + { + "epoch": 0.42, + "learning_rate": 3.242929090259016e-06, + "loss": 1.1573, + "step": 14003 + }, + { + "epoch": 0.42, + "learning_rate": 3.242696185988192e-06, + "loss": 1.027, + "step": 14004 + }, + { + "epoch": 0.42, + "learning_rate": 3.2424632746472584e-06, + "loss": 1.2009, + "step": 14005 + }, + { + "epoch": 0.42, + "learning_rate": 3.2422303562384322e-06, + "loss": 1.1554, + "step": 14006 + }, + { + "epoch": 0.42, + "learning_rate": 3.24199743076393e-06, + "loss": 1.1354, + "step": 14007 + }, + { + "epoch": 0.42, + "learning_rate": 3.24176449822597e-06, + "loss": 1.1581, + "step": 14008 + }, + { + "epoch": 0.42, + "learning_rate": 3.2415315586267694e-06, + "loss": 1.0803, + "step": 14009 + }, + { + "epoch": 0.42, + "learning_rate": 3.241298611968545e-06, + "loss": 1.1735, + "step": 14010 + }, + { + "epoch": 0.42, + "learning_rate": 3.2410656582535148e-06, + "loss": 1.2056, + "step": 14011 + }, + { + "epoch": 0.42, + "learning_rate": 3.2408326974838967e-06, + "loss": 1.2797, + "step": 14012 + }, + { + "epoch": 0.42, + "learning_rate": 3.2405997296619085e-06, + "loss": 1.1392, + "step": 14013 + }, + { + "epoch": 0.42, + "learning_rate": 3.2403667547897666e-06, + "loss": 1.0595, + "step": 14014 + }, + { + "epoch": 0.42, + "learning_rate": 3.240133772869691e-06, + "loss": 1.0581, + "step": 14015 + }, + { + "epoch": 0.42, + "learning_rate": 3.2399007839038977e-06, + "loss": 1.1697, + "step": 14016 + }, + { + "epoch": 0.42, + "learning_rate": 3.2396677878946055e-06, + "loss": 1.2198, + "step": 14017 + }, + { + "epoch": 0.42, + "learning_rate": 3.2394347848440317e-06, + "loss": 1.1759, + "step": 14018 + }, + { + "epoch": 0.42, + "learning_rate": 3.239201774754395e-06, + "loss": 1.1329, + "step": 14019 + }, + { + "epoch": 0.42, + "learning_rate": 3.2389687576279135e-06, + "loss": 1.1576, + "step": 14020 + }, + { + "epoch": 0.42, + "learning_rate": 3.2387357334668053e-06, + "loss": 1.1906, + "step": 14021 + }, + { + "epoch": 0.42, + "learning_rate": 3.2385027022732882e-06, + "loss": 1.2283, + "step": 14022 + }, + { + "epoch": 0.42, + "learning_rate": 3.238269664049582e-06, + "loss": 1.0904, + "step": 14023 + }, + { + "epoch": 0.42, + "learning_rate": 3.238036618797904e-06, + "loss": 1.1935, + "step": 14024 + }, + { + "epoch": 0.42, + "learning_rate": 3.2378035665204723e-06, + "loss": 1.0507, + "step": 14025 + }, + { + "epoch": 0.42, + "learning_rate": 3.2375705072195065e-06, + "loss": 1.1317, + "step": 14026 + }, + { + "epoch": 0.42, + "learning_rate": 3.237337440897224e-06, + "loss": 1.1392, + "step": 14027 + }, + { + "epoch": 0.42, + "learning_rate": 3.2371043675558456e-06, + "loss": 1.2231, + "step": 14028 + }, + { + "epoch": 0.42, + "learning_rate": 3.236871287197587e-06, + "loss": 1.1907, + "step": 14029 + }, + { + "epoch": 0.42, + "learning_rate": 3.23663819982467e-06, + "loss": 1.208, + "step": 14030 + }, + { + "epoch": 0.42, + "learning_rate": 3.236405105439311e-06, + "loss": 1.0516, + "step": 14031 + }, + { + "epoch": 0.42, + "learning_rate": 3.2361720040437307e-06, + "loss": 1.1077, + "step": 14032 + }, + { + "epoch": 0.42, + "learning_rate": 3.2359388956401472e-06, + "loss": 1.1606, + "step": 14033 + }, + { + "epoch": 0.42, + "learning_rate": 3.23570578023078e-06, + "loss": 1.0013, + "step": 14034 + }, + { + "epoch": 0.42, + "learning_rate": 3.235472657817848e-06, + "loss": 1.074, + "step": 14035 + }, + { + "epoch": 0.42, + "learning_rate": 3.2352395284035703e-06, + "loss": 1.2125, + "step": 14036 + }, + { + "epoch": 0.42, + "learning_rate": 3.235006391990166e-06, + "loss": 1.0896, + "step": 14037 + }, + { + "epoch": 0.42, + "learning_rate": 3.234773248579856e-06, + "loss": 1.1959, + "step": 14038 + }, + { + "epoch": 0.42, + "learning_rate": 3.234540098174858e-06, + "loss": 1.0712, + "step": 14039 + }, + { + "epoch": 0.42, + "learning_rate": 3.234306940777392e-06, + "loss": 1.1118, + "step": 14040 + }, + { + "epoch": 0.42, + "learning_rate": 3.2340737763896778e-06, + "loss": 1.0717, + "step": 14041 + }, + { + "epoch": 0.42, + "learning_rate": 3.2338406050139346e-06, + "loss": 1.2367, + "step": 14042 + }, + { + "epoch": 0.42, + "learning_rate": 3.2336074266523825e-06, + "loss": 1.1395, + "step": 14043 + }, + { + "epoch": 0.42, + "learning_rate": 3.233374241307241e-06, + "loss": 1.1004, + "step": 14044 + }, + { + "epoch": 0.42, + "learning_rate": 3.23314104898073e-06, + "loss": 1.075, + "step": 14045 + }, + { + "epoch": 0.42, + "learning_rate": 3.2329078496750687e-06, + "loss": 1.0479, + "step": 14046 + }, + { + "epoch": 0.42, + "learning_rate": 3.232674643392478e-06, + "loss": 1.0928, + "step": 14047 + }, + { + "epoch": 0.42, + "learning_rate": 3.232441430135178e-06, + "loss": 1.0748, + "step": 14048 + }, + { + "epoch": 0.42, + "learning_rate": 3.2322082099053873e-06, + "loss": 1.035, + "step": 14049 + }, + { + "epoch": 0.42, + "learning_rate": 3.2319749827053275e-06, + "loss": 1.2402, + "step": 14050 + }, + { + "epoch": 0.42, + "learning_rate": 3.231741748537219e-06, + "loss": 1.1993, + "step": 14051 + }, + { + "epoch": 0.42, + "learning_rate": 3.231508507403281e-06, + "loss": 1.1056, + "step": 14052 + }, + { + "epoch": 0.42, + "learning_rate": 3.231275259305734e-06, + "loss": 0.9988, + "step": 14053 + }, + { + "epoch": 0.42, + "learning_rate": 3.2310420042467995e-06, + "loss": 1.0735, + "step": 14054 + }, + { + "epoch": 0.42, + "learning_rate": 3.2308087422286966e-06, + "loss": 1.1591, + "step": 14055 + }, + { + "epoch": 0.42, + "learning_rate": 3.230575473253647e-06, + "loss": 1.0576, + "step": 14056 + }, + { + "epoch": 0.42, + "learning_rate": 3.23034219732387e-06, + "loss": 1.0836, + "step": 14057 + }, + { + "epoch": 0.42, + "learning_rate": 3.230108914441588e-06, + "loss": 1.1917, + "step": 14058 + }, + { + "epoch": 0.42, + "learning_rate": 3.2298756246090204e-06, + "loss": 1.0344, + "step": 14059 + }, + { + "epoch": 0.42, + "learning_rate": 3.229642327828387e-06, + "loss": 1.2397, + "step": 14060 + }, + { + "epoch": 0.42, + "learning_rate": 3.229409024101912e-06, + "loss": 1.1139, + "step": 14061 + }, + { + "epoch": 0.42, + "learning_rate": 3.2291757134318134e-06, + "loss": 1.3579, + "step": 14062 + }, + { + "epoch": 0.42, + "learning_rate": 3.228942395820313e-06, + "loss": 1.062, + "step": 14063 + }, + { + "epoch": 0.42, + "learning_rate": 3.2287090712696335e-06, + "loss": 1.1537, + "step": 14064 + }, + { + "epoch": 0.42, + "learning_rate": 3.2284757397819934e-06, + "loss": 1.0523, + "step": 14065 + }, + { + "epoch": 0.42, + "learning_rate": 3.228242401359615e-06, + "loss": 1.0563, + "step": 14066 + }, + { + "epoch": 0.42, + "learning_rate": 3.22800905600472e-06, + "loss": 1.2422, + "step": 14067 + }, + { + "epoch": 0.42, + "learning_rate": 3.227775703719529e-06, + "loss": 1.067, + "step": 14068 + }, + { + "epoch": 0.42, + "learning_rate": 3.2275423445062647e-06, + "loss": 1.2274, + "step": 14069 + }, + { + "epoch": 0.42, + "learning_rate": 3.227308978367147e-06, + "loss": 1.1667, + "step": 14070 + }, + { + "epoch": 0.42, + "learning_rate": 3.227075605304398e-06, + "loss": 1.153, + "step": 14071 + }, + { + "epoch": 0.42, + "learning_rate": 3.22684222532024e-06, + "loss": 1.1552, + "step": 14072 + }, + { + "epoch": 0.42, + "learning_rate": 3.226608838416893e-06, + "loss": 1.3093, + "step": 14073 + }, + { + "epoch": 0.42, + "learning_rate": 3.226375444596581e-06, + "loss": 1.2393, + "step": 14074 + }, + { + "epoch": 0.42, + "learning_rate": 3.2261420438615245e-06, + "loss": 1.1036, + "step": 14075 + }, + { + "epoch": 0.42, + "learning_rate": 3.2259086362139447e-06, + "loss": 1.1353, + "step": 14076 + }, + { + "epoch": 0.42, + "learning_rate": 3.225675221656065e-06, + "loss": 1.1122, + "step": 14077 + }, + { + "epoch": 0.42, + "learning_rate": 3.2254418001901056e-06, + "loss": 1.1007, + "step": 14078 + }, + { + "epoch": 0.42, + "learning_rate": 3.22520837181829e-06, + "loss": 1.1531, + "step": 14079 + }, + { + "epoch": 0.42, + "learning_rate": 3.224974936542841e-06, + "loss": 1.1776, + "step": 14080 + }, + { + "epoch": 0.42, + "learning_rate": 3.2247414943659794e-06, + "loss": 1.1692, + "step": 14081 + }, + { + "epoch": 0.42, + "learning_rate": 3.2245080452899276e-06, + "loss": 1.1262, + "step": 14082 + }, + { + "epoch": 0.42, + "learning_rate": 3.224274589316908e-06, + "loss": 1.1241, + "step": 14083 + }, + { + "epoch": 0.42, + "learning_rate": 3.2240411264491433e-06, + "loss": 1.2077, + "step": 14084 + }, + { + "epoch": 0.42, + "learning_rate": 3.2238076566888552e-06, + "loss": 1.1398, + "step": 14085 + }, + { + "epoch": 0.42, + "learning_rate": 3.223574180038268e-06, + "loss": 1.0545, + "step": 14086 + }, + { + "epoch": 0.42, + "learning_rate": 3.223340696499603e-06, + "loss": 1.175, + "step": 14087 + }, + { + "epoch": 0.42, + "learning_rate": 3.2231072060750816e-06, + "loss": 1.1699, + "step": 14088 + }, + { + "epoch": 0.42, + "learning_rate": 3.2228737087669295e-06, + "loss": 1.154, + "step": 14089 + }, + { + "epoch": 0.42, + "learning_rate": 3.2226402045773665e-06, + "loss": 1.1021, + "step": 14090 + }, + { + "epoch": 0.42, + "learning_rate": 3.222406693508617e-06, + "loss": 1.2538, + "step": 14091 + }, + { + "epoch": 0.42, + "learning_rate": 3.222173175562904e-06, + "loss": 1.0997, + "step": 14092 + }, + { + "epoch": 0.42, + "learning_rate": 3.22193965074245e-06, + "loss": 1.1769, + "step": 14093 + }, + { + "epoch": 0.42, + "learning_rate": 3.221706119049478e-06, + "loss": 1.1184, + "step": 14094 + }, + { + "epoch": 0.42, + "learning_rate": 3.221472580486212e-06, + "loss": 1.0641, + "step": 14095 + }, + { + "epoch": 0.42, + "learning_rate": 3.2212390350548746e-06, + "loss": 0.9837, + "step": 14096 + }, + { + "epoch": 0.42, + "learning_rate": 3.2210054827576887e-06, + "loss": 1.1411, + "step": 14097 + }, + { + "epoch": 0.42, + "learning_rate": 3.220771923596877e-06, + "loss": 1.1364, + "step": 14098 + }, + { + "epoch": 0.42, + "learning_rate": 3.2205383575746645e-06, + "loss": 1.115, + "step": 14099 + }, + { + "epoch": 0.42, + "learning_rate": 3.2203047846932743e-06, + "loss": 1.1016, + "step": 14100 + }, + { + "epoch": 0.42, + "learning_rate": 3.220071204954929e-06, + "loss": 1.0609, + "step": 14101 + }, + { + "epoch": 0.42, + "learning_rate": 3.2198376183618524e-06, + "loss": 1.0888, + "step": 14102 + }, + { + "epoch": 0.42, + "learning_rate": 3.2196040249162684e-06, + "loss": 1.1331, + "step": 14103 + }, + { + "epoch": 0.42, + "learning_rate": 3.2193704246204003e-06, + "loss": 1.0806, + "step": 14104 + }, + { + "epoch": 0.42, + "learning_rate": 3.2191368174764737e-06, + "loss": 1.1544, + "step": 14105 + }, + { + "epoch": 0.42, + "learning_rate": 3.2189032034867094e-06, + "loss": 1.2178, + "step": 14106 + }, + { + "epoch": 0.42, + "learning_rate": 3.2186695826533332e-06, + "loss": 1.1713, + "step": 14107 + }, + { + "epoch": 0.43, + "learning_rate": 3.2184359549785693e-06, + "loss": 1.1732, + "step": 14108 + }, + { + "epoch": 0.43, + "learning_rate": 3.2182023204646407e-06, + "loss": 1.0192, + "step": 14109 + }, + { + "epoch": 0.43, + "learning_rate": 3.217968679113772e-06, + "loss": 1.2174, + "step": 14110 + }, + { + "epoch": 0.43, + "learning_rate": 3.2177350309281867e-06, + "loss": 1.1639, + "step": 14111 + }, + { + "epoch": 0.43, + "learning_rate": 3.2175013759101103e-06, + "loss": 1.0807, + "step": 14112 + }, + { + "epoch": 0.43, + "learning_rate": 3.2172677140617666e-06, + "loss": 1.0448, + "step": 14113 + }, + { + "epoch": 0.43, + "learning_rate": 3.217034045385379e-06, + "loss": 1.1855, + "step": 14114 + }, + { + "epoch": 0.43, + "learning_rate": 3.216800369883173e-06, + "loss": 1.2028, + "step": 14115 + }, + { + "epoch": 0.43, + "learning_rate": 3.216566687557372e-06, + "loss": 1.1774, + "step": 14116 + }, + { + "epoch": 0.43, + "learning_rate": 3.216332998410202e-06, + "loss": 1.1822, + "step": 14117 + }, + { + "epoch": 0.43, + "learning_rate": 3.216099302443887e-06, + "loss": 1.1145, + "step": 14118 + }, + { + "epoch": 0.43, + "learning_rate": 3.215865599660651e-06, + "loss": 1.0624, + "step": 14119 + }, + { + "epoch": 0.43, + "learning_rate": 3.2156318900627194e-06, + "loss": 1.1592, + "step": 14120 + }, + { + "epoch": 0.43, + "learning_rate": 3.2153981736523164e-06, + "loss": 1.1619, + "step": 14121 + }, + { + "epoch": 0.43, + "learning_rate": 3.215164450431668e-06, + "loss": 1.0859, + "step": 14122 + }, + { + "epoch": 0.43, + "learning_rate": 3.2149307204029988e-06, + "loss": 1.0911, + "step": 14123 + }, + { + "epoch": 0.43, + "learning_rate": 3.214696983568533e-06, + "loss": 1.1553, + "step": 14124 + }, + { + "epoch": 0.43, + "learning_rate": 3.214463239930496e-06, + "loss": 1.2103, + "step": 14125 + }, + { + "epoch": 0.43, + "learning_rate": 3.214229489491113e-06, + "loss": 1.2347, + "step": 14126 + }, + { + "epoch": 0.43, + "learning_rate": 3.2139957322526096e-06, + "loss": 1.0574, + "step": 14127 + }, + { + "epoch": 0.43, + "learning_rate": 3.2137619682172107e-06, + "loss": 1.1689, + "step": 14128 + }, + { + "epoch": 0.43, + "learning_rate": 3.2135281973871414e-06, + "loss": 1.1288, + "step": 14129 + }, + { + "epoch": 0.43, + "learning_rate": 3.2132944197646272e-06, + "loss": 1.1266, + "step": 14130 + }, + { + "epoch": 0.43, + "learning_rate": 3.2130606353518933e-06, + "loss": 1.0892, + "step": 14131 + }, + { + "epoch": 0.43, + "learning_rate": 3.212826844151166e-06, + "loss": 1.1177, + "step": 14132 + }, + { + "epoch": 0.43, + "learning_rate": 3.2125930461646703e-06, + "loss": 1.1094, + "step": 14133 + }, + { + "epoch": 0.43, + "learning_rate": 3.2123592413946324e-06, + "loss": 1.1127, + "step": 14134 + }, + { + "epoch": 0.43, + "learning_rate": 3.2121254298432776e-06, + "loss": 1.062, + "step": 14135 + }, + { + "epoch": 0.43, + "learning_rate": 3.2118916115128317e-06, + "loss": 1.2609, + "step": 14136 + }, + { + "epoch": 0.43, + "learning_rate": 3.2116577864055196e-06, + "loss": 1.1127, + "step": 14137 + }, + { + "epoch": 0.43, + "learning_rate": 3.21142395452357e-06, + "loss": 1.2341, + "step": 14138 + }, + { + "epoch": 0.43, + "learning_rate": 3.2111901158692054e-06, + "loss": 1.141, + "step": 14139 + }, + { + "epoch": 0.43, + "learning_rate": 3.2109562704446536e-06, + "loss": 1.0448, + "step": 14140 + }, + { + "epoch": 0.43, + "learning_rate": 3.210722418252141e-06, + "loss": 1.1153, + "step": 14141 + }, + { + "epoch": 0.43, + "learning_rate": 3.2104885592938926e-06, + "loss": 1.1525, + "step": 14142 + }, + { + "epoch": 0.43, + "learning_rate": 3.2102546935721363e-06, + "loss": 1.156, + "step": 14143 + }, + { + "epoch": 0.43, + "learning_rate": 3.2100208210890967e-06, + "loss": 1.1439, + "step": 14144 + }, + { + "epoch": 0.43, + "learning_rate": 3.209786941847001e-06, + "loss": 1.1379, + "step": 14145 + }, + { + "epoch": 0.43, + "learning_rate": 3.2095530558480746e-06, + "loss": 1.0839, + "step": 14146 + }, + { + "epoch": 0.43, + "learning_rate": 3.2093191630945463e-06, + "loss": 1.0849, + "step": 14147 + }, + { + "epoch": 0.43, + "learning_rate": 3.2090852635886404e-06, + "loss": 1.153, + "step": 14148 + }, + { + "epoch": 0.43, + "learning_rate": 3.208851357332585e-06, + "loss": 1.2313, + "step": 14149 + }, + { + "epoch": 0.43, + "learning_rate": 3.208617444328605e-06, + "loss": 1.1984, + "step": 14150 + }, + { + "epoch": 0.43, + "learning_rate": 3.2083835245789292e-06, + "loss": 1.1978, + "step": 14151 + }, + { + "epoch": 0.43, + "learning_rate": 3.2081495980857824e-06, + "loss": 1.0131, + "step": 14152 + }, + { + "epoch": 0.43, + "learning_rate": 3.2079156648513934e-06, + "loss": 1.0875, + "step": 14153 + }, + { + "epoch": 0.43, + "learning_rate": 3.2076817248779878e-06, + "loss": 1.0875, + "step": 14154 + }, + { + "epoch": 0.43, + "learning_rate": 3.2074477781677924e-06, + "loss": 1.1246, + "step": 14155 + }, + { + "epoch": 0.43, + "learning_rate": 3.207213824723036e-06, + "loss": 1.0508, + "step": 14156 + }, + { + "epoch": 0.43, + "learning_rate": 3.206979864545944e-06, + "loss": 1.0758, + "step": 14157 + }, + { + "epoch": 0.43, + "learning_rate": 3.2067458976387442e-06, + "loss": 1.2281, + "step": 14158 + }, + { + "epoch": 0.43, + "learning_rate": 3.206511924003664e-06, + "loss": 1.095, + "step": 14159 + }, + { + "epoch": 0.43, + "learning_rate": 3.2062779436429304e-06, + "loss": 1.1505, + "step": 14160 + }, + { + "epoch": 0.43, + "learning_rate": 3.2060439565587708e-06, + "loss": 1.2157, + "step": 14161 + }, + { + "epoch": 0.43, + "learning_rate": 3.2058099627534136e-06, + "loss": 1.233, + "step": 14162 + }, + { + "epoch": 0.43, + "learning_rate": 3.2055759622290844e-06, + "loss": 1.2139, + "step": 14163 + }, + { + "epoch": 0.43, + "learning_rate": 3.2053419549880127e-06, + "loss": 1.1658, + "step": 14164 + }, + { + "epoch": 0.43, + "learning_rate": 3.2051079410324248e-06, + "loss": 1.0625, + "step": 14165 + }, + { + "epoch": 0.43, + "learning_rate": 3.2048739203645484e-06, + "loss": 1.0929, + "step": 14166 + }, + { + "epoch": 0.43, + "learning_rate": 3.204639892986613e-06, + "loss": 1.1766, + "step": 14167 + }, + { + "epoch": 0.43, + "learning_rate": 3.204405858900844e-06, + "loss": 1.1773, + "step": 14168 + }, + { + "epoch": 0.43, + "learning_rate": 3.2041718181094716e-06, + "loss": 1.0535, + "step": 14169 + }, + { + "epoch": 0.43, + "learning_rate": 3.203937770614722e-06, + "loss": 1.163, + "step": 14170 + }, + { + "epoch": 0.43, + "learning_rate": 3.2037037164188246e-06, + "loss": 1.1348, + "step": 14171 + }, + { + "epoch": 0.43, + "learning_rate": 3.203469655524005e-06, + "loss": 1.2054, + "step": 14172 + }, + { + "epoch": 0.43, + "learning_rate": 3.2032355879324945e-06, + "loss": 1.1327, + "step": 14173 + }, + { + "epoch": 0.43, + "learning_rate": 3.203001513646519e-06, + "loss": 1.1185, + "step": 14174 + }, + { + "epoch": 0.43, + "learning_rate": 3.202767432668309e-06, + "loss": 1.1311, + "step": 14175 + }, + { + "epoch": 0.43, + "learning_rate": 3.20253334500009e-06, + "loss": 1.076, + "step": 14176 + }, + { + "epoch": 0.43, + "learning_rate": 3.202299250644093e-06, + "loss": 1.0887, + "step": 14177 + }, + { + "epoch": 0.43, + "learning_rate": 3.2020651496025444e-06, + "loss": 1.0871, + "step": 14178 + }, + { + "epoch": 0.43, + "learning_rate": 3.201831041877674e-06, + "loss": 1.1032, + "step": 14179 + }, + { + "epoch": 0.43, + "learning_rate": 3.2015969274717113e-06, + "loss": 1.2263, + "step": 14180 + }, + { + "epoch": 0.43, + "learning_rate": 3.201362806386883e-06, + "loss": 1.0435, + "step": 14181 + }, + { + "epoch": 0.43, + "learning_rate": 3.201128678625418e-06, + "loss": 1.0607, + "step": 14182 + }, + { + "epoch": 0.43, + "learning_rate": 3.2008945441895463e-06, + "loss": 1.1316, + "step": 14183 + }, + { + "epoch": 0.43, + "learning_rate": 3.2006604030814957e-06, + "loss": 1.0912, + "step": 14184 + }, + { + "epoch": 0.43, + "learning_rate": 3.200426255303496e-06, + "loss": 1.0804, + "step": 14185 + }, + { + "epoch": 0.43, + "learning_rate": 3.200192100857775e-06, + "loss": 1.1288, + "step": 14186 + }, + { + "epoch": 0.43, + "learning_rate": 3.1999579397465624e-06, + "loss": 1.2278, + "step": 14187 + }, + { + "epoch": 0.43, + "learning_rate": 3.199723771972088e-06, + "loss": 1.2405, + "step": 14188 + }, + { + "epoch": 0.43, + "learning_rate": 3.1994895975365796e-06, + "loss": 1.1688, + "step": 14189 + }, + { + "epoch": 0.43, + "learning_rate": 3.1992554164422686e-06, + "loss": 1.1512, + "step": 14190 + }, + { + "epoch": 0.43, + "learning_rate": 3.1990212286913815e-06, + "loss": 1.0823, + "step": 14191 + }, + { + "epoch": 0.43, + "learning_rate": 3.1987870342861484e-06, + "loss": 1.1111, + "step": 14192 + }, + { + "epoch": 0.43, + "learning_rate": 3.1985528332288006e-06, + "loss": 1.2104, + "step": 14193 + }, + { + "epoch": 0.43, + "learning_rate": 3.1983186255215653e-06, + "loss": 1.213, + "step": 14194 + }, + { + "epoch": 0.43, + "learning_rate": 3.198084411166674e-06, + "loss": 1.038, + "step": 14195 + }, + { + "epoch": 0.43, + "learning_rate": 3.1978501901663546e-06, + "loss": 1.0996, + "step": 14196 + }, + { + "epoch": 0.43, + "learning_rate": 3.1976159625228376e-06, + "loss": 0.9658, + "step": 14197 + }, + { + "epoch": 0.43, + "learning_rate": 3.1973817282383524e-06, + "loss": 1.1104, + "step": 14198 + }, + { + "epoch": 0.43, + "learning_rate": 3.19714748731513e-06, + "loss": 1.1414, + "step": 14199 + }, + { + "epoch": 0.43, + "learning_rate": 3.196913239755398e-06, + "loss": 1.0386, + "step": 14200 + }, + { + "epoch": 0.43, + "learning_rate": 3.1966789855613877e-06, + "loss": 1.1166, + "step": 14201 + }, + { + "epoch": 0.43, + "learning_rate": 3.1964447247353297e-06, + "loss": 1.0743, + "step": 14202 + }, + { + "epoch": 0.43, + "learning_rate": 3.1962104572794532e-06, + "loss": 1.0854, + "step": 14203 + }, + { + "epoch": 0.43, + "learning_rate": 3.195976183195988e-06, + "loss": 1.1428, + "step": 14204 + }, + { + "epoch": 0.43, + "learning_rate": 3.1957419024871654e-06, + "loss": 1.124, + "step": 14205 + }, + { + "epoch": 0.43, + "learning_rate": 3.1955076151552145e-06, + "loss": 1.1285, + "step": 14206 + }, + { + "epoch": 0.43, + "learning_rate": 3.195273321202366e-06, + "loss": 1.233, + "step": 14207 + }, + { + "epoch": 0.43, + "learning_rate": 3.195039020630851e-06, + "loss": 1.1855, + "step": 14208 + }, + { + "epoch": 0.43, + "learning_rate": 3.1948047134428982e-06, + "loss": 1.1044, + "step": 14209 + }, + { + "epoch": 0.43, + "learning_rate": 3.194570399640741e-06, + "loss": 1.2596, + "step": 14210 + }, + { + "epoch": 0.43, + "learning_rate": 3.194336079226606e-06, + "loss": 1.2147, + "step": 14211 + }, + { + "epoch": 0.43, + "learning_rate": 3.1941017522027272e-06, + "loss": 1.0565, + "step": 14212 + }, + { + "epoch": 0.43, + "learning_rate": 3.1938674185713337e-06, + "loss": 1.2635, + "step": 14213 + }, + { + "epoch": 0.43, + "learning_rate": 3.1936330783346557e-06, + "loss": 1.1415, + "step": 14214 + }, + { + "epoch": 0.43, + "learning_rate": 3.1933987314949255e-06, + "loss": 1.1327, + "step": 14215 + }, + { + "epoch": 0.43, + "learning_rate": 3.1931643780543744e-06, + "loss": 1.1044, + "step": 14216 + }, + { + "epoch": 0.43, + "learning_rate": 3.1929300180152307e-06, + "loss": 1.0764, + "step": 14217 + }, + { + "epoch": 0.43, + "learning_rate": 3.192695651379728e-06, + "loss": 1.1461, + "step": 14218 + }, + { + "epoch": 0.43, + "learning_rate": 3.192461278150096e-06, + "loss": 1.2135, + "step": 14219 + }, + { + "epoch": 0.43, + "learning_rate": 3.1922268983285654e-06, + "loss": 1.0907, + "step": 14220 + }, + { + "epoch": 0.43, + "learning_rate": 3.191992511917369e-06, + "loss": 1.1049, + "step": 14221 + }, + { + "epoch": 0.43, + "learning_rate": 3.191758118918737e-06, + "loss": 1.1227, + "step": 14222 + }, + { + "epoch": 0.43, + "learning_rate": 3.1915237193349008e-06, + "loss": 1.1851, + "step": 14223 + }, + { + "epoch": 0.43, + "learning_rate": 3.1912893131680915e-06, + "loss": 1.0811, + "step": 14224 + }, + { + "epoch": 0.43, + "learning_rate": 3.1910549004205414e-06, + "loss": 1.0394, + "step": 14225 + }, + { + "epoch": 0.43, + "learning_rate": 3.190820481094481e-06, + "loss": 1.0657, + "step": 14226 + }, + { + "epoch": 0.43, + "learning_rate": 3.1905860551921426e-06, + "loss": 1.1124, + "step": 14227 + }, + { + "epoch": 0.43, + "learning_rate": 3.1903516227157573e-06, + "loss": 1.1346, + "step": 14228 + }, + { + "epoch": 0.43, + "learning_rate": 3.1901171836675576e-06, + "loss": 1.2043, + "step": 14229 + }, + { + "epoch": 0.43, + "learning_rate": 3.189882738049774e-06, + "loss": 1.1508, + "step": 14230 + }, + { + "epoch": 0.43, + "learning_rate": 3.18964828586464e-06, + "loss": 1.1013, + "step": 14231 + }, + { + "epoch": 0.43, + "learning_rate": 3.1894138271143852e-06, + "loss": 1.0662, + "step": 14232 + }, + { + "epoch": 0.43, + "learning_rate": 3.1891793618012435e-06, + "loss": 1.1658, + "step": 14233 + }, + { + "epoch": 0.43, + "learning_rate": 3.1889448899274466e-06, + "loss": 1.1615, + "step": 14234 + }, + { + "epoch": 0.43, + "learning_rate": 3.188710411495225e-06, + "loss": 1.1505, + "step": 14235 + }, + { + "epoch": 0.43, + "learning_rate": 3.1884759265068134e-06, + "loss": 1.1528, + "step": 14236 + }, + { + "epoch": 0.43, + "learning_rate": 3.1882414349644414e-06, + "loss": 1.144, + "step": 14237 + }, + { + "epoch": 0.43, + "learning_rate": 3.1880069368703433e-06, + "loss": 1.2612, + "step": 14238 + }, + { + "epoch": 0.43, + "learning_rate": 3.1877724322267496e-06, + "loss": 1.175, + "step": 14239 + }, + { + "epoch": 0.43, + "learning_rate": 3.187537921035894e-06, + "loss": 1.0212, + "step": 14240 + }, + { + "epoch": 0.43, + "learning_rate": 3.187303403300009e-06, + "loss": 1.0782, + "step": 14241 + }, + { + "epoch": 0.43, + "learning_rate": 3.1870688790213256e-06, + "loss": 1.1885, + "step": 14242 + }, + { + "epoch": 0.43, + "learning_rate": 3.186834348202078e-06, + "loss": 1.0489, + "step": 14243 + }, + { + "epoch": 0.43, + "learning_rate": 3.1865998108444983e-06, + "loss": 1.0397, + "step": 14244 + }, + { + "epoch": 0.43, + "learning_rate": 3.1863652669508183e-06, + "loss": 1.202, + "step": 14245 + }, + { + "epoch": 0.43, + "learning_rate": 3.1861307165232723e-06, + "loss": 1.1162, + "step": 14246 + }, + { + "epoch": 0.43, + "learning_rate": 3.1858961595640926e-06, + "loss": 1.1177, + "step": 14247 + }, + { + "epoch": 0.43, + "learning_rate": 3.185661596075511e-06, + "loss": 1.2059, + "step": 14248 + }, + { + "epoch": 0.43, + "learning_rate": 3.185427026059762e-06, + "loss": 1.2133, + "step": 14249 + }, + { + "epoch": 0.43, + "learning_rate": 3.185192449519077e-06, + "loss": 1.0421, + "step": 14250 + }, + { + "epoch": 0.43, + "learning_rate": 3.184957866455691e-06, + "loss": 1.2275, + "step": 14251 + }, + { + "epoch": 0.43, + "learning_rate": 3.184723276871835e-06, + "loss": 1.192, + "step": 14252 + }, + { + "epoch": 0.43, + "learning_rate": 3.1844886807697435e-06, + "loss": 1.1912, + "step": 14253 + }, + { + "epoch": 0.43, + "learning_rate": 3.1842540781516496e-06, + "loss": 1.2529, + "step": 14254 + }, + { + "epoch": 0.43, + "learning_rate": 3.1840194690197856e-06, + "loss": 1.079, + "step": 14255 + }, + { + "epoch": 0.43, + "learning_rate": 3.1837848533763858e-06, + "loss": 1.182, + "step": 14256 + }, + { + "epoch": 0.43, + "learning_rate": 3.1835502312236843e-06, + "loss": 1.1383, + "step": 14257 + }, + { + "epoch": 0.43, + "learning_rate": 3.183315602563913e-06, + "loss": 1.1676, + "step": 14258 + }, + { + "epoch": 0.43, + "learning_rate": 3.1830809673993076e-06, + "loss": 1.1171, + "step": 14259 + }, + { + "epoch": 0.43, + "learning_rate": 3.1828463257320995e-06, + "loss": 1.0577, + "step": 14260 + }, + { + "epoch": 0.43, + "learning_rate": 3.1826116775645235e-06, + "loss": 1.0831, + "step": 14261 + }, + { + "epoch": 0.43, + "learning_rate": 3.1823770228988126e-06, + "loss": 1.1395, + "step": 14262 + }, + { + "epoch": 0.43, + "learning_rate": 3.1821423617372014e-06, + "loss": 1.1611, + "step": 14263 + }, + { + "epoch": 0.43, + "learning_rate": 3.181907694081924e-06, + "loss": 1.1998, + "step": 14264 + }, + { + "epoch": 0.43, + "learning_rate": 3.181673019935213e-06, + "loss": 1.0291, + "step": 14265 + }, + { + "epoch": 0.43, + "learning_rate": 3.1814383392993033e-06, + "loss": 1.1189, + "step": 14266 + }, + { + "epoch": 0.43, + "learning_rate": 3.1812036521764287e-06, + "loss": 1.1568, + "step": 14267 + }, + { + "epoch": 0.43, + "learning_rate": 3.1809689585688237e-06, + "loss": 1.1324, + "step": 14268 + }, + { + "epoch": 0.43, + "learning_rate": 3.1807342584787217e-06, + "loss": 1.1587, + "step": 14269 + }, + { + "epoch": 0.43, + "learning_rate": 3.180499551908358e-06, + "loss": 1.1293, + "step": 14270 + }, + { + "epoch": 0.43, + "learning_rate": 3.1802648388599654e-06, + "loss": 1.0603, + "step": 14271 + }, + { + "epoch": 0.43, + "learning_rate": 3.18003011933578e-06, + "loss": 1.0816, + "step": 14272 + }, + { + "epoch": 0.43, + "learning_rate": 3.1797953933380353e-06, + "loss": 1.2656, + "step": 14273 + }, + { + "epoch": 0.43, + "learning_rate": 3.1795606608689656e-06, + "loss": 1.1287, + "step": 14274 + }, + { + "epoch": 0.43, + "learning_rate": 3.1793259219308063e-06, + "loss": 1.1922, + "step": 14275 + }, + { + "epoch": 0.43, + "learning_rate": 3.179091176525791e-06, + "loss": 1.224, + "step": 14276 + }, + { + "epoch": 0.43, + "learning_rate": 3.178856424656155e-06, + "loss": 1.037, + "step": 14277 + }, + { + "epoch": 0.43, + "learning_rate": 3.178621666324132e-06, + "loss": 1.0845, + "step": 14278 + }, + { + "epoch": 0.43, + "learning_rate": 3.1783869015319585e-06, + "loss": 1.0598, + "step": 14279 + }, + { + "epoch": 0.43, + "learning_rate": 3.178152130281868e-06, + "loss": 1.1467, + "step": 14280 + }, + { + "epoch": 0.43, + "learning_rate": 3.177917352576096e-06, + "loss": 1.3311, + "step": 14281 + }, + { + "epoch": 0.43, + "learning_rate": 3.1776825684168765e-06, + "loss": 1.0363, + "step": 14282 + }, + { + "epoch": 0.43, + "learning_rate": 3.177447777806446e-06, + "loss": 1.183, + "step": 14283 + }, + { + "epoch": 0.43, + "learning_rate": 3.1772129807470385e-06, + "loss": 1.0611, + "step": 14284 + }, + { + "epoch": 0.43, + "learning_rate": 3.1769781772408904e-06, + "loss": 1.064, + "step": 14285 + }, + { + "epoch": 0.43, + "learning_rate": 3.1767433672902357e-06, + "loss": 1.2284, + "step": 14286 + }, + { + "epoch": 0.43, + "learning_rate": 3.1765085508973097e-06, + "loss": 1.2101, + "step": 14287 + }, + { + "epoch": 0.43, + "learning_rate": 3.1762737280643486e-06, + "loss": 1.1503, + "step": 14288 + }, + { + "epoch": 0.43, + "learning_rate": 3.1760388987935873e-06, + "loss": 1.1031, + "step": 14289 + }, + { + "epoch": 0.43, + "learning_rate": 3.175804063087261e-06, + "loss": 1.1768, + "step": 14290 + }, + { + "epoch": 0.43, + "learning_rate": 3.1755692209476057e-06, + "loss": 1.1407, + "step": 14291 + }, + { + "epoch": 0.43, + "learning_rate": 3.175334372376857e-06, + "loss": 1.2388, + "step": 14292 + }, + { + "epoch": 0.43, + "learning_rate": 3.1750995173772496e-06, + "loss": 1.1313, + "step": 14293 + }, + { + "epoch": 0.43, + "learning_rate": 3.174864655951021e-06, + "loss": 0.96, + "step": 14294 + }, + { + "epoch": 0.43, + "learning_rate": 3.1746297881004053e-06, + "loss": 1.0863, + "step": 14295 + }, + { + "epoch": 0.43, + "learning_rate": 3.1743949138276386e-06, + "loss": 1.1971, + "step": 14296 + }, + { + "epoch": 0.43, + "learning_rate": 3.174160033134957e-06, + "loss": 1.0446, + "step": 14297 + }, + { + "epoch": 0.43, + "learning_rate": 3.173925146024597e-06, + "loss": 1.2078, + "step": 14298 + }, + { + "epoch": 0.43, + "learning_rate": 3.1736902524987944e-06, + "loss": 1.0853, + "step": 14299 + }, + { + "epoch": 0.43, + "learning_rate": 3.1734553525597846e-06, + "loss": 1.1902, + "step": 14300 + }, + { + "epoch": 0.43, + "learning_rate": 3.1732204462098048e-06, + "loss": 1.1483, + "step": 14301 + }, + { + "epoch": 0.43, + "learning_rate": 3.1729855334510902e-06, + "loss": 1.0953, + "step": 14302 + }, + { + "epoch": 0.43, + "learning_rate": 3.1727506142858776e-06, + "loss": 1.0953, + "step": 14303 + }, + { + "epoch": 0.43, + "learning_rate": 3.1725156887164025e-06, + "loss": 1.2421, + "step": 14304 + }, + { + "epoch": 0.43, + "learning_rate": 3.1722807567449034e-06, + "loss": 1.0815, + "step": 14305 + }, + { + "epoch": 0.43, + "learning_rate": 3.172045818373614e-06, + "loss": 1.123, + "step": 14306 + }, + { + "epoch": 0.43, + "learning_rate": 3.1718108736047724e-06, + "loss": 1.0878, + "step": 14307 + }, + { + "epoch": 0.43, + "learning_rate": 3.1715759224406146e-06, + "loss": 1.1474, + "step": 14308 + }, + { + "epoch": 0.43, + "learning_rate": 3.1713409648833774e-06, + "loss": 1.0892, + "step": 14309 + }, + { + "epoch": 0.43, + "learning_rate": 3.1711060009352978e-06, + "loss": 1.0889, + "step": 14310 + }, + { + "epoch": 0.43, + "learning_rate": 3.1708710305986123e-06, + "loss": 1.1325, + "step": 14311 + }, + { + "epoch": 0.43, + "learning_rate": 3.1706360538755576e-06, + "loss": 1.3138, + "step": 14312 + }, + { + "epoch": 0.43, + "learning_rate": 3.1704010707683707e-06, + "loss": 1.1084, + "step": 14313 + }, + { + "epoch": 0.43, + "learning_rate": 3.170166081279289e-06, + "loss": 1.147, + "step": 14314 + }, + { + "epoch": 0.43, + "learning_rate": 3.169931085410548e-06, + "loss": 1.1439, + "step": 14315 + }, + { + "epoch": 0.43, + "learning_rate": 3.169696083164387e-06, + "loss": 1.0834, + "step": 14316 + }, + { + "epoch": 0.43, + "learning_rate": 3.169461074543041e-06, + "loss": 1.1978, + "step": 14317 + }, + { + "epoch": 0.43, + "learning_rate": 3.1692260595487485e-06, + "loss": 1.0435, + "step": 14318 + }, + { + "epoch": 0.43, + "learning_rate": 3.168991038183745e-06, + "loss": 1.1926, + "step": 14319 + }, + { + "epoch": 0.43, + "learning_rate": 3.16875601045027e-06, + "loss": 1.1105, + "step": 14320 + }, + { + "epoch": 0.43, + "learning_rate": 3.16852097635056e-06, + "loss": 1.1488, + "step": 14321 + }, + { + "epoch": 0.43, + "learning_rate": 3.168285935886852e-06, + "loss": 1.1268, + "step": 14322 + }, + { + "epoch": 0.43, + "learning_rate": 3.168050889061384e-06, + "loss": 1.1301, + "step": 14323 + }, + { + "epoch": 0.43, + "learning_rate": 3.1678158358763923e-06, + "loss": 1.1893, + "step": 14324 + }, + { + "epoch": 0.43, + "learning_rate": 3.167580776334116e-06, + "loss": 1.0839, + "step": 14325 + }, + { + "epoch": 0.43, + "learning_rate": 3.167345710436792e-06, + "loss": 1.1366, + "step": 14326 + }, + { + "epoch": 0.43, + "learning_rate": 3.167110638186659e-06, + "loss": 1.0533, + "step": 14327 + }, + { + "epoch": 0.43, + "learning_rate": 3.1668755595859533e-06, + "loss": 1.128, + "step": 14328 + }, + { + "epoch": 0.43, + "learning_rate": 3.1666404746369145e-06, + "loss": 1.1093, + "step": 14329 + }, + { + "epoch": 0.43, + "learning_rate": 3.1664053833417787e-06, + "loss": 1.0778, + "step": 14330 + }, + { + "epoch": 0.43, + "learning_rate": 3.166170285702785e-06, + "loss": 1.1433, + "step": 14331 + }, + { + "epoch": 0.43, + "learning_rate": 3.16593518172217e-06, + "loss": 1.1106, + "step": 14332 + }, + { + "epoch": 0.43, + "learning_rate": 3.165700071402174e-06, + "loss": 1.2061, + "step": 14333 + }, + { + "epoch": 0.43, + "learning_rate": 3.1654649547450334e-06, + "loss": 1.0534, + "step": 14334 + }, + { + "epoch": 0.43, + "learning_rate": 3.1652298317529866e-06, + "loss": 1.1005, + "step": 14335 + }, + { + "epoch": 0.43, + "learning_rate": 3.1649947024282724e-06, + "loss": 1.1218, + "step": 14336 + }, + { + "epoch": 0.43, + "learning_rate": 3.164759566773129e-06, + "loss": 1.1956, + "step": 14337 + }, + { + "epoch": 0.43, + "learning_rate": 3.1645244247897943e-06, + "loss": 1.2141, + "step": 14338 + }, + { + "epoch": 0.43, + "learning_rate": 3.164289276480508e-06, + "loss": 1.1264, + "step": 14339 + }, + { + "epoch": 0.43, + "learning_rate": 3.1640541218475067e-06, + "loss": 1.1403, + "step": 14340 + }, + { + "epoch": 0.43, + "learning_rate": 3.1638189608930305e-06, + "loss": 1.1472, + "step": 14341 + }, + { + "epoch": 0.43, + "learning_rate": 3.163583793619318e-06, + "loss": 1.1417, + "step": 14342 + }, + { + "epoch": 0.43, + "learning_rate": 3.163348620028607e-06, + "loss": 1.0895, + "step": 14343 + }, + { + "epoch": 0.43, + "learning_rate": 3.163113440123137e-06, + "loss": 1.1734, + "step": 14344 + }, + { + "epoch": 0.43, + "learning_rate": 3.162878253905145e-06, + "loss": 1.1373, + "step": 14345 + }, + { + "epoch": 0.43, + "learning_rate": 3.1626430613768727e-06, + "loss": 1.142, + "step": 14346 + }, + { + "epoch": 0.43, + "learning_rate": 3.162407862540557e-06, + "loss": 1.1398, + "step": 14347 + }, + { + "epoch": 0.43, + "learning_rate": 3.1621726573984377e-06, + "loss": 1.0858, + "step": 14348 + }, + { + "epoch": 0.43, + "learning_rate": 3.161937445952753e-06, + "loss": 1.2024, + "step": 14349 + }, + { + "epoch": 0.43, + "learning_rate": 3.1617022282057432e-06, + "loss": 1.141, + "step": 14350 + }, + { + "epoch": 0.43, + "learning_rate": 3.161467004159646e-06, + "loss": 1.1712, + "step": 14351 + }, + { + "epoch": 0.43, + "learning_rate": 3.161231773816703e-06, + "loss": 1.1074, + "step": 14352 + }, + { + "epoch": 0.43, + "learning_rate": 3.160996537179151e-06, + "loss": 1.1931, + "step": 14353 + }, + { + "epoch": 0.43, + "learning_rate": 3.1607612942492304e-06, + "loss": 1.0492, + "step": 14354 + }, + { + "epoch": 0.43, + "learning_rate": 3.1605260450291807e-06, + "loss": 1.1151, + "step": 14355 + }, + { + "epoch": 0.43, + "learning_rate": 3.1602907895212416e-06, + "loss": 1.1874, + "step": 14356 + }, + { + "epoch": 0.43, + "learning_rate": 3.160055527727652e-06, + "loss": 1.1711, + "step": 14357 + }, + { + "epoch": 0.43, + "learning_rate": 3.159820259650651e-06, + "loss": 1.0461, + "step": 14358 + }, + { + "epoch": 0.43, + "learning_rate": 3.15958498529248e-06, + "loss": 1.1038, + "step": 14359 + }, + { + "epoch": 0.43, + "learning_rate": 3.1593497046553764e-06, + "loss": 1.1924, + "step": 14360 + }, + { + "epoch": 0.43, + "learning_rate": 3.1591144177415816e-06, + "loss": 1.09, + "step": 14361 + }, + { + "epoch": 0.43, + "learning_rate": 3.1588791245533353e-06, + "loss": 1.0879, + "step": 14362 + }, + { + "epoch": 0.43, + "learning_rate": 3.158643825092877e-06, + "loss": 1.1073, + "step": 14363 + }, + { + "epoch": 0.43, + "learning_rate": 3.1584085193624465e-06, + "loss": 1.1832, + "step": 14364 + }, + { + "epoch": 0.43, + "learning_rate": 3.1581732073642835e-06, + "loss": 1.0629, + "step": 14365 + }, + { + "epoch": 0.43, + "learning_rate": 3.157937889100629e-06, + "loss": 1.0844, + "step": 14366 + }, + { + "epoch": 0.43, + "learning_rate": 3.1577025645737224e-06, + "loss": 1.0399, + "step": 14367 + }, + { + "epoch": 0.43, + "learning_rate": 3.1574672337858046e-06, + "loss": 0.9993, + "step": 14368 + }, + { + "epoch": 0.43, + "learning_rate": 3.157231896739115e-06, + "loss": 1.1487, + "step": 14369 + }, + { + "epoch": 0.43, + "learning_rate": 3.1569965534358947e-06, + "loss": 1.0917, + "step": 14370 + }, + { + "epoch": 0.43, + "learning_rate": 3.1567612038783833e-06, + "loss": 1.1279, + "step": 14371 + }, + { + "epoch": 0.43, + "learning_rate": 3.1565258480688226e-06, + "loss": 1.1832, + "step": 14372 + }, + { + "epoch": 0.43, + "learning_rate": 3.1562904860094505e-06, + "loss": 1.2256, + "step": 14373 + }, + { + "epoch": 0.43, + "learning_rate": 3.15605511770251e-06, + "loss": 1.1868, + "step": 14374 + }, + { + "epoch": 0.43, + "learning_rate": 3.15581974315024e-06, + "loss": 1.173, + "step": 14375 + }, + { + "epoch": 0.43, + "learning_rate": 3.1555843623548832e-06, + "loss": 1.1124, + "step": 14376 + }, + { + "epoch": 0.43, + "learning_rate": 3.155348975318678e-06, + "loss": 1.1252, + "step": 14377 + }, + { + "epoch": 0.43, + "learning_rate": 3.155113582043866e-06, + "loss": 1.0481, + "step": 14378 + }, + { + "epoch": 0.43, + "learning_rate": 3.1548781825326883e-06, + "loss": 1.0143, + "step": 14379 + }, + { + "epoch": 0.43, + "learning_rate": 3.1546427767873853e-06, + "loss": 1.0847, + "step": 14380 + }, + { + "epoch": 0.43, + "learning_rate": 3.1544073648101996e-06, + "loss": 1.1938, + "step": 14381 + }, + { + "epoch": 0.43, + "learning_rate": 3.1541719466033703e-06, + "loss": 1.0781, + "step": 14382 + }, + { + "epoch": 0.43, + "learning_rate": 3.15393652216914e-06, + "loss": 1.1156, + "step": 14383 + }, + { + "epoch": 0.43, + "learning_rate": 3.1537010915097476e-06, + "loss": 1.1113, + "step": 14384 + }, + { + "epoch": 0.43, + "learning_rate": 3.153465654627437e-06, + "loss": 1.1991, + "step": 14385 + }, + { + "epoch": 0.43, + "learning_rate": 3.153230211524446e-06, + "loss": 1.1505, + "step": 14386 + }, + { + "epoch": 0.43, + "learning_rate": 3.15299476220302e-06, + "loss": 1.1301, + "step": 14387 + }, + { + "epoch": 0.43, + "learning_rate": 3.152759306665397e-06, + "loss": 1.1145, + "step": 14388 + }, + { + "epoch": 0.43, + "learning_rate": 3.152523844913821e-06, + "loss": 1.0922, + "step": 14389 + }, + { + "epoch": 0.43, + "learning_rate": 3.152288376950532e-06, + "loss": 1.1157, + "step": 14390 + }, + { + "epoch": 0.43, + "learning_rate": 3.152052902777771e-06, + "loss": 1.1964, + "step": 14391 + }, + { + "epoch": 0.43, + "learning_rate": 3.1518174223977806e-06, + "loss": 1.1171, + "step": 14392 + }, + { + "epoch": 0.43, + "learning_rate": 3.1515819358128025e-06, + "loss": 1.2173, + "step": 14393 + }, + { + "epoch": 0.43, + "learning_rate": 3.1513464430250783e-06, + "loss": 1.1213, + "step": 14394 + }, + { + "epoch": 0.43, + "learning_rate": 3.1511109440368494e-06, + "loss": 1.1759, + "step": 14395 + }, + { + "epoch": 0.43, + "learning_rate": 3.1508754388503582e-06, + "loss": 1.1537, + "step": 14396 + }, + { + "epoch": 0.43, + "learning_rate": 3.150639927467846e-06, + "loss": 1.0739, + "step": 14397 + }, + { + "epoch": 0.43, + "learning_rate": 3.150404409891556e-06, + "loss": 1.1823, + "step": 14398 + }, + { + "epoch": 0.43, + "learning_rate": 3.1501688861237277e-06, + "loss": 1.1112, + "step": 14399 + }, + { + "epoch": 0.43, + "learning_rate": 3.1499333561666063e-06, + "loss": 1.0705, + "step": 14400 + }, + { + "epoch": 0.43, + "learning_rate": 3.1496978200224314e-06, + "loss": 1.2056, + "step": 14401 + }, + { + "epoch": 0.43, + "learning_rate": 3.1494622776934463e-06, + "loss": 1.1326, + "step": 14402 + }, + { + "epoch": 0.43, + "learning_rate": 3.1492267291818933e-06, + "loss": 1.0812, + "step": 14403 + }, + { + "epoch": 0.43, + "learning_rate": 3.1489911744900143e-06, + "loss": 1.2069, + "step": 14404 + }, + { + "epoch": 0.43, + "learning_rate": 3.148755613620052e-06, + "loss": 1.01, + "step": 14405 + }, + { + "epoch": 0.43, + "learning_rate": 3.148520046574248e-06, + "loss": 1.221, + "step": 14406 + }, + { + "epoch": 0.43, + "learning_rate": 3.148284473354847e-06, + "loss": 1.0806, + "step": 14407 + }, + { + "epoch": 0.43, + "learning_rate": 3.1480488939640886e-06, + "loss": 1.1223, + "step": 14408 + }, + { + "epoch": 0.43, + "learning_rate": 3.1478133084042174e-06, + "loss": 1.0939, + "step": 14409 + }, + { + "epoch": 0.43, + "learning_rate": 3.147577716677476e-06, + "loss": 1.102, + "step": 14410 + }, + { + "epoch": 0.43, + "learning_rate": 3.147342118786106e-06, + "loss": 1.1076, + "step": 14411 + }, + { + "epoch": 0.43, + "learning_rate": 3.147106514732351e-06, + "loss": 1.2448, + "step": 14412 + }, + { + "epoch": 0.43, + "learning_rate": 3.146870904518454e-06, + "loss": 1.1972, + "step": 14413 + }, + { + "epoch": 0.43, + "learning_rate": 3.1466352881466567e-06, + "loss": 1.0884, + "step": 14414 + }, + { + "epoch": 0.43, + "learning_rate": 3.1463996656192035e-06, + "loss": 1.0731, + "step": 14415 + }, + { + "epoch": 0.43, + "learning_rate": 3.1461640369383364e-06, + "loss": 1.0809, + "step": 14416 + }, + { + "epoch": 0.43, + "learning_rate": 3.1459284021063e-06, + "loss": 1.1712, + "step": 14417 + }, + { + "epoch": 0.43, + "learning_rate": 3.1456927611253347e-06, + "loss": 1.0017, + "step": 14418 + }, + { + "epoch": 0.43, + "learning_rate": 3.1454571139976858e-06, + "loss": 0.9836, + "step": 14419 + }, + { + "epoch": 0.43, + "learning_rate": 3.145221460725596e-06, + "loss": 1.1105, + "step": 14420 + }, + { + "epoch": 0.43, + "learning_rate": 3.1449858013113088e-06, + "loss": 1.136, + "step": 14421 + }, + { + "epoch": 0.43, + "learning_rate": 3.1447501357570675e-06, + "loss": 1.0542, + "step": 14422 + }, + { + "epoch": 0.43, + "learning_rate": 3.1445144640651153e-06, + "loss": 1.1989, + "step": 14423 + }, + { + "epoch": 0.43, + "learning_rate": 3.144278786237696e-06, + "loss": 1.0706, + "step": 14424 + }, + { + "epoch": 0.43, + "learning_rate": 3.1440431022770528e-06, + "loss": 1.0541, + "step": 14425 + }, + { + "epoch": 0.43, + "learning_rate": 3.14380741218543e-06, + "loss": 1.0825, + "step": 14426 + }, + { + "epoch": 0.43, + "learning_rate": 3.1435717159650702e-06, + "loss": 1.1797, + "step": 14427 + }, + { + "epoch": 0.43, + "learning_rate": 3.1433360136182177e-06, + "loss": 1.0937, + "step": 14428 + }, + { + "epoch": 0.43, + "learning_rate": 3.143100305147116e-06, + "loss": 1.2047, + "step": 14429 + }, + { + "epoch": 0.43, + "learning_rate": 3.1428645905540096e-06, + "loss": 1.2203, + "step": 14430 + }, + { + "epoch": 0.43, + "learning_rate": 3.142628869841141e-06, + "loss": 1.0893, + "step": 14431 + }, + { + "epoch": 0.43, + "learning_rate": 3.1423931430107556e-06, + "loss": 1.1216, + "step": 14432 + }, + { + "epoch": 0.43, + "learning_rate": 3.1421574100650966e-06, + "loss": 1.187, + "step": 14433 + }, + { + "epoch": 0.43, + "learning_rate": 3.141921671006408e-06, + "loss": 1.1332, + "step": 14434 + }, + { + "epoch": 0.43, + "learning_rate": 3.141685925836936e-06, + "loss": 1.0444, + "step": 14435 + }, + { + "epoch": 0.43, + "learning_rate": 3.1414501745589217e-06, + "loss": 1.1168, + "step": 14436 + }, + { + "epoch": 0.43, + "learning_rate": 3.1412144171746105e-06, + "loss": 1.1851, + "step": 14437 + }, + { + "epoch": 0.43, + "learning_rate": 3.1409786536862475e-06, + "loss": 1.2495, + "step": 14438 + }, + { + "epoch": 0.43, + "learning_rate": 3.1407428840960764e-06, + "loss": 1.1439, + "step": 14439 + }, + { + "epoch": 0.44, + "learning_rate": 3.140507108406341e-06, + "loss": 1.0628, + "step": 14440 + }, + { + "epoch": 0.44, + "learning_rate": 3.1402713266192876e-06, + "loss": 1.0966, + "step": 14441 + }, + { + "epoch": 0.44, + "learning_rate": 3.1400355387371583e-06, + "loss": 1.137, + "step": 14442 + }, + { + "epoch": 0.44, + "learning_rate": 3.1397997447621995e-06, + "loss": 1.2222, + "step": 14443 + }, + { + "epoch": 0.44, + "learning_rate": 3.1395639446966554e-06, + "loss": 1.1062, + "step": 14444 + }, + { + "epoch": 0.44, + "learning_rate": 3.1393281385427698e-06, + "loss": 1.223, + "step": 14445 + }, + { + "epoch": 0.44, + "learning_rate": 3.139092326302789e-06, + "loss": 0.9894, + "step": 14446 + }, + { + "epoch": 0.44, + "learning_rate": 3.1388565079789567e-06, + "loss": 1.1459, + "step": 14447 + }, + { + "epoch": 0.44, + "learning_rate": 3.1386206835735176e-06, + "loss": 1.0623, + "step": 14448 + }, + { + "epoch": 0.44, + "learning_rate": 3.1383848530887177e-06, + "loss": 1.1663, + "step": 14449 + }, + { + "epoch": 0.44, + "learning_rate": 3.138149016526802e-06, + "loss": 1.2413, + "step": 14450 + }, + { + "epoch": 0.44, + "learning_rate": 3.1379131738900142e-06, + "loss": 1.0649, + "step": 14451 + }, + { + "epoch": 0.44, + "learning_rate": 3.1376773251806012e-06, + "loss": 1.0795, + "step": 14452 + }, + { + "epoch": 0.44, + "learning_rate": 3.137441470400806e-06, + "loss": 1.1153, + "step": 14453 + }, + { + "epoch": 0.44, + "learning_rate": 3.137205609552876e-06, + "loss": 1.1333, + "step": 14454 + }, + { + "epoch": 0.44, + "learning_rate": 3.136969742639055e-06, + "loss": 1.1064, + "step": 14455 + }, + { + "epoch": 0.44, + "learning_rate": 3.136733869661589e-06, + "loss": 1.0643, + "step": 14456 + }, + { + "epoch": 0.44, + "learning_rate": 3.1364979906227226e-06, + "loss": 1.0916, + "step": 14457 + }, + { + "epoch": 0.44, + "learning_rate": 3.136262105524702e-06, + "loss": 1.1248, + "step": 14458 + }, + { + "epoch": 0.44, + "learning_rate": 3.136026214369774e-06, + "loss": 1.0629, + "step": 14459 + }, + { + "epoch": 0.44, + "learning_rate": 3.135790317160181e-06, + "loss": 1.1334, + "step": 14460 + }, + { + "epoch": 0.44, + "learning_rate": 3.1355544138981707e-06, + "loss": 1.1006, + "step": 14461 + }, + { + "epoch": 0.44, + "learning_rate": 3.135318504585989e-06, + "loss": 1.1219, + "step": 14462 + }, + { + "epoch": 0.44, + "learning_rate": 3.1350825892258814e-06, + "loss": 1.2203, + "step": 14463 + }, + { + "epoch": 0.44, + "learning_rate": 3.1348466678200927e-06, + "loss": 1.1047, + "step": 14464 + }, + { + "epoch": 0.44, + "learning_rate": 3.1346107403708704e-06, + "loss": 1.131, + "step": 14465 + }, + { + "epoch": 0.44, + "learning_rate": 3.134374806880458e-06, + "loss": 1.1085, + "step": 14466 + }, + { + "epoch": 0.44, + "learning_rate": 3.1341388673511043e-06, + "loss": 0.975, + "step": 14467 + }, + { + "epoch": 0.44, + "learning_rate": 3.1339029217850535e-06, + "loss": 1.1403, + "step": 14468 + }, + { + "epoch": 0.44, + "learning_rate": 3.1336669701845524e-06, + "loss": 1.0977, + "step": 14469 + }, + { + "epoch": 0.44, + "learning_rate": 3.1334310125518464e-06, + "loss": 1.0947, + "step": 14470 + }, + { + "epoch": 0.44, + "learning_rate": 3.1331950488891827e-06, + "loss": 1.1147, + "step": 14471 + }, + { + "epoch": 0.44, + "learning_rate": 3.1329590791988073e-06, + "loss": 1.1459, + "step": 14472 + }, + { + "epoch": 0.44, + "learning_rate": 3.1327231034829656e-06, + "loss": 1.0631, + "step": 14473 + }, + { + "epoch": 0.44, + "learning_rate": 3.1324871217439044e-06, + "loss": 1.0477, + "step": 14474 + }, + { + "epoch": 0.44, + "learning_rate": 3.1322511339838713e-06, + "loss": 1.2692, + "step": 14475 + }, + { + "epoch": 0.44, + "learning_rate": 3.1320151402051117e-06, + "loss": 1.1641, + "step": 14476 + }, + { + "epoch": 0.44, + "learning_rate": 3.1317791404098724e-06, + "loss": 1.1495, + "step": 14477 + }, + { + "epoch": 0.44, + "learning_rate": 3.1315431346004e-06, + "loss": 1.1418, + "step": 14478 + }, + { + "epoch": 0.44, + "learning_rate": 3.131307122778941e-06, + "loss": 1.1943, + "step": 14479 + }, + { + "epoch": 0.44, + "learning_rate": 3.131071104947743e-06, + "loss": 1.1147, + "step": 14480 + }, + { + "epoch": 0.44, + "learning_rate": 3.1308350811090502e-06, + "loss": 1.1876, + "step": 14481 + }, + { + "epoch": 0.44, + "learning_rate": 3.130599051265113e-06, + "loss": 1.1552, + "step": 14482 + }, + { + "epoch": 0.44, + "learning_rate": 3.130363015418176e-06, + "loss": 0.9672, + "step": 14483 + }, + { + "epoch": 0.44, + "learning_rate": 3.1301269735704867e-06, + "loss": 1.1918, + "step": 14484 + }, + { + "epoch": 0.44, + "learning_rate": 3.1298909257242914e-06, + "loss": 1.1671, + "step": 14485 + }, + { + "epoch": 0.44, + "learning_rate": 3.129654871881838e-06, + "loss": 1.1631, + "step": 14486 + }, + { + "epoch": 0.44, + "learning_rate": 3.1294188120453744e-06, + "loss": 1.0991, + "step": 14487 + }, + { + "epoch": 0.44, + "learning_rate": 3.1291827462171466e-06, + "loss": 1.0798, + "step": 14488 + }, + { + "epoch": 0.44, + "learning_rate": 3.1289466743994014e-06, + "loss": 1.1703, + "step": 14489 + }, + { + "epoch": 0.44, + "learning_rate": 3.1287105965943864e-06, + "loss": 1.0104, + "step": 14490 + }, + { + "epoch": 0.44, + "learning_rate": 3.12847451280435e-06, + "loss": 1.1605, + "step": 14491 + }, + { + "epoch": 0.44, + "learning_rate": 3.1282384230315394e-06, + "loss": 1.1428, + "step": 14492 + }, + { + "epoch": 0.44, + "learning_rate": 3.1280023272782012e-06, + "loss": 1.125, + "step": 14493 + }, + { + "epoch": 0.44, + "learning_rate": 3.1277662255465833e-06, + "loss": 1.1482, + "step": 14494 + }, + { + "epoch": 0.44, + "learning_rate": 3.127530117838934e-06, + "loss": 1.1522, + "step": 14495 + }, + { + "epoch": 0.44, + "learning_rate": 3.127294004157499e-06, + "loss": 1.1309, + "step": 14496 + }, + { + "epoch": 0.44, + "learning_rate": 3.1270578845045278e-06, + "loss": 1.0038, + "step": 14497 + }, + { + "epoch": 0.44, + "learning_rate": 3.1268217588822668e-06, + "loss": 0.9516, + "step": 14498 + }, + { + "epoch": 0.44, + "learning_rate": 3.1265856272929653e-06, + "loss": 1.1858, + "step": 14499 + }, + { + "epoch": 0.44, + "learning_rate": 3.126349489738871e-06, + "loss": 1.1679, + "step": 14500 + }, + { + "epoch": 0.44, + "learning_rate": 3.12611334622223e-06, + "loss": 1.0595, + "step": 14501 + }, + { + "epoch": 0.44, + "learning_rate": 3.1258771967452915e-06, + "loss": 1.1105, + "step": 14502 + }, + { + "epoch": 0.44, + "learning_rate": 3.125641041310304e-06, + "loss": 1.07, + "step": 14503 + }, + { + "epoch": 0.44, + "learning_rate": 3.1254048799195154e-06, + "loss": 1.2601, + "step": 14504 + }, + { + "epoch": 0.44, + "learning_rate": 3.125168712575173e-06, + "loss": 1.1685, + "step": 14505 + }, + { + "epoch": 0.44, + "learning_rate": 3.124932539279526e-06, + "loss": 1.0782, + "step": 14506 + }, + { + "epoch": 0.44, + "learning_rate": 3.124696360034822e-06, + "loss": 1.1272, + "step": 14507 + }, + { + "epoch": 0.44, + "learning_rate": 3.1244601748433095e-06, + "loss": 1.1246, + "step": 14508 + }, + { + "epoch": 0.44, + "learning_rate": 3.1242239837072365e-06, + "loss": 1.052, + "step": 14509 + }, + { + "epoch": 0.44, + "learning_rate": 3.1239877866288525e-06, + "loss": 1.0645, + "step": 14510 + }, + { + "epoch": 0.44, + "learning_rate": 3.123751583610405e-06, + "loss": 1.1913, + "step": 14511 + }, + { + "epoch": 0.44, + "learning_rate": 3.1235153746541423e-06, + "loss": 1.0843, + "step": 14512 + }, + { + "epoch": 0.44, + "learning_rate": 3.1232791597623145e-06, + "loss": 1.1273, + "step": 14513 + }, + { + "epoch": 0.44, + "learning_rate": 3.1230429389371684e-06, + "loss": 1.1821, + "step": 14514 + }, + { + "epoch": 0.44, + "learning_rate": 3.122806712180954e-06, + "loss": 1.1693, + "step": 14515 + }, + { + "epoch": 0.44, + "learning_rate": 3.1225704794959193e-06, + "loss": 1.0835, + "step": 14516 + }, + { + "epoch": 0.44, + "learning_rate": 3.1223342408843145e-06, + "loss": 1.0511, + "step": 14517 + }, + { + "epoch": 0.44, + "learning_rate": 3.1220979963483864e-06, + "loss": 1.1731, + "step": 14518 + }, + { + "epoch": 0.44, + "learning_rate": 3.1218617458903855e-06, + "loss": 1.215, + "step": 14519 + }, + { + "epoch": 0.44, + "learning_rate": 3.1216254895125603e-06, + "loss": 1.1563, + "step": 14520 + }, + { + "epoch": 0.44, + "learning_rate": 3.1213892272171596e-06, + "loss": 1.0853, + "step": 14521 + }, + { + "epoch": 0.44, + "learning_rate": 3.121152959006433e-06, + "loss": 1.0331, + "step": 14522 + }, + { + "epoch": 0.44, + "learning_rate": 3.1209166848826295e-06, + "loss": 1.2539, + "step": 14523 + }, + { + "epoch": 0.44, + "learning_rate": 3.120680404847998e-06, + "loss": 0.9869, + "step": 14524 + }, + { + "epoch": 0.44, + "learning_rate": 3.1204441189047874e-06, + "loss": 1.2009, + "step": 14525 + }, + { + "epoch": 0.44, + "learning_rate": 3.1202078270552485e-06, + "loss": 1.1547, + "step": 14526 + }, + { + "epoch": 0.44, + "learning_rate": 3.119971529301629e-06, + "loss": 1.2014, + "step": 14527 + }, + { + "epoch": 0.44, + "learning_rate": 3.11973522564618e-06, + "loss": 1.1063, + "step": 14528 + }, + { + "epoch": 0.44, + "learning_rate": 3.1194989160911495e-06, + "loss": 1.057, + "step": 14529 + }, + { + "epoch": 0.44, + "learning_rate": 3.119262600638787e-06, + "loss": 1.1677, + "step": 14530 + }, + { + "epoch": 0.44, + "learning_rate": 3.119026279291344e-06, + "loss": 1.1782, + "step": 14531 + }, + { + "epoch": 0.44, + "learning_rate": 3.1187899520510685e-06, + "loss": 1.1346, + "step": 14532 + }, + { + "epoch": 0.44, + "learning_rate": 3.1185536189202104e-06, + "loss": 1.0784, + "step": 14533 + }, + { + "epoch": 0.44, + "learning_rate": 3.1183172799010207e-06, + "loss": 1.0934, + "step": 14534 + }, + { + "epoch": 0.44, + "learning_rate": 3.1180809349957473e-06, + "loss": 1.1409, + "step": 14535 + }, + { + "epoch": 0.44, + "learning_rate": 3.1178445842066417e-06, + "loss": 1.2029, + "step": 14536 + }, + { + "epoch": 0.44, + "learning_rate": 3.117608227535953e-06, + "loss": 1.2406, + "step": 14537 + }, + { + "epoch": 0.44, + "learning_rate": 3.1173718649859307e-06, + "loss": 1.0963, + "step": 14538 + }, + { + "epoch": 0.44, + "learning_rate": 3.117135496558827e-06, + "loss": 1.0762, + "step": 14539 + }, + { + "epoch": 0.44, + "learning_rate": 3.1168991222568896e-06, + "loss": 1.1332, + "step": 14540 + }, + { + "epoch": 0.44, + "learning_rate": 3.1166627420823705e-06, + "loss": 0.9948, + "step": 14541 + }, + { + "epoch": 0.44, + "learning_rate": 3.116426356037518e-06, + "loss": 1.1776, + "step": 14542 + }, + { + "epoch": 0.44, + "learning_rate": 3.116189964124584e-06, + "loss": 1.2463, + "step": 14543 + }, + { + "epoch": 0.44, + "learning_rate": 3.115953566345818e-06, + "loss": 1.1367, + "step": 14544 + }, + { + "epoch": 0.44, + "learning_rate": 3.115717162703471e-06, + "loss": 1.1373, + "step": 14545 + }, + { + "epoch": 0.44, + "learning_rate": 3.115480753199793e-06, + "loss": 1.1202, + "step": 14546 + }, + { + "epoch": 0.44, + "learning_rate": 3.115244337837035e-06, + "loss": 1.1669, + "step": 14547 + }, + { + "epoch": 0.44, + "learning_rate": 3.1150079166174474e-06, + "loss": 1.1147, + "step": 14548 + }, + { + "epoch": 0.44, + "learning_rate": 3.11477148954328e-06, + "loss": 1.2626, + "step": 14549 + }, + { + "epoch": 0.44, + "learning_rate": 3.114535056616784e-06, + "loss": 1.1511, + "step": 14550 + }, + { + "epoch": 0.44, + "learning_rate": 3.114298617840211e-06, + "loss": 1.1161, + "step": 14551 + }, + { + "epoch": 0.44, + "learning_rate": 3.1140621732158103e-06, + "loss": 1.1277, + "step": 14552 + }, + { + "epoch": 0.44, + "learning_rate": 3.113825722745834e-06, + "loss": 1.0533, + "step": 14553 + }, + { + "epoch": 0.44, + "learning_rate": 3.1135892664325322e-06, + "loss": 1.0243, + "step": 14554 + }, + { + "epoch": 0.44, + "learning_rate": 3.1133528042781563e-06, + "loss": 1.0983, + "step": 14555 + }, + { + "epoch": 0.44, + "learning_rate": 3.1131163362849566e-06, + "loss": 1.2218, + "step": 14556 + }, + { + "epoch": 0.44, + "learning_rate": 3.112879862455185e-06, + "loss": 1.0516, + "step": 14557 + }, + { + "epoch": 0.44, + "learning_rate": 3.1126433827910924e-06, + "loss": 1.217, + "step": 14558 + }, + { + "epoch": 0.44, + "learning_rate": 3.1124068972949296e-06, + "loss": 1.0938, + "step": 14559 + }, + { + "epoch": 0.44, + "learning_rate": 3.1121704059689482e-06, + "loss": 1.1837, + "step": 14560 + }, + { + "epoch": 0.44, + "learning_rate": 3.1119339088153992e-06, + "loss": 1.1603, + "step": 14561 + }, + { + "epoch": 0.44, + "learning_rate": 3.1116974058365344e-06, + "loss": 1.2167, + "step": 14562 + }, + { + "epoch": 0.44, + "learning_rate": 3.111460897034605e-06, + "loss": 1.0822, + "step": 14563 + }, + { + "epoch": 0.44, + "learning_rate": 3.1112243824118614e-06, + "loss": 1.1799, + "step": 14564 + }, + { + "epoch": 0.44, + "learning_rate": 3.1109878619705573e-06, + "loss": 1.0494, + "step": 14565 + }, + { + "epoch": 0.44, + "learning_rate": 3.1107513357129427e-06, + "loss": 1.1968, + "step": 14566 + }, + { + "epoch": 0.44, + "learning_rate": 3.1105148036412693e-06, + "loss": 1.1229, + "step": 14567 + }, + { + "epoch": 0.44, + "learning_rate": 3.110278265757789e-06, + "loss": 1.2633, + "step": 14568 + }, + { + "epoch": 0.44, + "learning_rate": 3.1100417220647538e-06, + "loss": 1.1929, + "step": 14569 + }, + { + "epoch": 0.44, + "learning_rate": 3.1098051725644145e-06, + "loss": 1.1324, + "step": 14570 + }, + { + "epoch": 0.44, + "learning_rate": 3.1095686172590238e-06, + "loss": 1.0799, + "step": 14571 + }, + { + "epoch": 0.44, + "learning_rate": 3.109332056150834e-06, + "loss": 1.2193, + "step": 14572 + }, + { + "epoch": 0.44, + "learning_rate": 3.1090954892420965e-06, + "loss": 1.1339, + "step": 14573 + }, + { + "epoch": 0.44, + "learning_rate": 3.108858916535063e-06, + "loss": 1.0118, + "step": 14574 + }, + { + "epoch": 0.44, + "learning_rate": 3.1086223380319858e-06, + "loss": 1.1125, + "step": 14575 + }, + { + "epoch": 0.44, + "learning_rate": 3.108385753735117e-06, + "loss": 1.0933, + "step": 14576 + }, + { + "epoch": 0.44, + "learning_rate": 3.1081491636467093e-06, + "loss": 1.1613, + "step": 14577 + }, + { + "epoch": 0.44, + "learning_rate": 3.1079125677690143e-06, + "loss": 1.0859, + "step": 14578 + }, + { + "epoch": 0.44, + "learning_rate": 3.107675966104284e-06, + "loss": 1.1061, + "step": 14579 + }, + { + "epoch": 0.44, + "learning_rate": 3.107439358654772e-06, + "loss": 1.1367, + "step": 14580 + }, + { + "epoch": 0.44, + "learning_rate": 3.107202745422729e-06, + "loss": 1.153, + "step": 14581 + }, + { + "epoch": 0.44, + "learning_rate": 3.106966126410409e-06, + "loss": 0.9921, + "step": 14582 + }, + { + "epoch": 0.44, + "learning_rate": 3.106729501620063e-06, + "loss": 1.2466, + "step": 14583 + }, + { + "epoch": 0.44, + "learning_rate": 3.1064928710539445e-06, + "loss": 1.1276, + "step": 14584 + }, + { + "epoch": 0.44, + "learning_rate": 3.106256234714306e-06, + "loss": 1.1469, + "step": 14585 + }, + { + "epoch": 0.44, + "learning_rate": 3.1060195926034008e-06, + "loss": 1.2028, + "step": 14586 + }, + { + "epoch": 0.44, + "learning_rate": 3.10578294472348e-06, + "loss": 1.0746, + "step": 14587 + }, + { + "epoch": 0.44, + "learning_rate": 3.1055462910767984e-06, + "loss": 1.1592, + "step": 14588 + }, + { + "epoch": 0.44, + "learning_rate": 3.1053096316656066e-06, + "loss": 1.1341, + "step": 14589 + }, + { + "epoch": 0.44, + "learning_rate": 3.1050729664921597e-06, + "loss": 1.1014, + "step": 14590 + }, + { + "epoch": 0.44, + "learning_rate": 3.1048362955587092e-06, + "loss": 1.0673, + "step": 14591 + }, + { + "epoch": 0.44, + "learning_rate": 3.1045996188675083e-06, + "loss": 1.1321, + "step": 14592 + }, + { + "epoch": 0.44, + "learning_rate": 3.1043629364208107e-06, + "loss": 1.2352, + "step": 14593 + }, + { + "epoch": 0.44, + "learning_rate": 3.1041262482208676e-06, + "loss": 1.1136, + "step": 14594 + }, + { + "epoch": 0.44, + "learning_rate": 3.1038895542699355e-06, + "loss": 1.1023, + "step": 14595 + }, + { + "epoch": 0.44, + "learning_rate": 3.1036528545702644e-06, + "loss": 1.0204, + "step": 14596 + }, + { + "epoch": 0.44, + "learning_rate": 3.103416149124109e-06, + "loss": 1.1186, + "step": 14597 + }, + { + "epoch": 0.44, + "learning_rate": 3.103179437933722e-06, + "loss": 1.1667, + "step": 14598 + }, + { + "epoch": 0.44, + "learning_rate": 3.1029427210013585e-06, + "loss": 1.1467, + "step": 14599 + }, + { + "epoch": 0.44, + "learning_rate": 3.10270599832927e-06, + "loss": 1.1736, + "step": 14600 + }, + { + "epoch": 0.44, + "learning_rate": 3.102469269919711e-06, + "loss": 1.121, + "step": 14601 + }, + { + "epoch": 0.44, + "learning_rate": 3.1022325357749344e-06, + "loss": 1.0945, + "step": 14602 + }, + { + "epoch": 0.44, + "learning_rate": 3.101995795897195e-06, + "loss": 1.0612, + "step": 14603 + }, + { + "epoch": 0.44, + "learning_rate": 3.1017590502887442e-06, + "loss": 1.1653, + "step": 14604 + }, + { + "epoch": 0.44, + "learning_rate": 3.1015222989518373e-06, + "loss": 1.2545, + "step": 14605 + }, + { + "epoch": 0.44, + "learning_rate": 3.1012855418887284e-06, + "loss": 1.1232, + "step": 14606 + }, + { + "epoch": 0.44, + "learning_rate": 3.1010487791016703e-06, + "loss": 1.1832, + "step": 14607 + }, + { + "epoch": 0.44, + "learning_rate": 3.1008120105929173e-06, + "loss": 1.0968, + "step": 14608 + }, + { + "epoch": 0.44, + "learning_rate": 3.1005752363647235e-06, + "loss": 1.1289, + "step": 14609 + }, + { + "epoch": 0.44, + "learning_rate": 3.1003384564193427e-06, + "loss": 1.1951, + "step": 14610 + }, + { + "epoch": 0.44, + "learning_rate": 3.1001016707590293e-06, + "loss": 1.2086, + "step": 14611 + }, + { + "epoch": 0.44, + "learning_rate": 3.099864879386036e-06, + "loss": 1.0373, + "step": 14612 + }, + { + "epoch": 0.44, + "learning_rate": 3.099628082302618e-06, + "loss": 1.1238, + "step": 14613 + }, + { + "epoch": 0.44, + "learning_rate": 3.099391279511031e-06, + "loss": 1.0614, + "step": 14614 + }, + { + "epoch": 0.44, + "learning_rate": 3.0991544710135263e-06, + "loss": 1.1411, + "step": 14615 + }, + { + "epoch": 0.44, + "learning_rate": 3.0989176568123603e-06, + "loss": 1.007, + "step": 14616 + }, + { + "epoch": 0.44, + "learning_rate": 3.098680836909786e-06, + "loss": 1.1929, + "step": 14617 + }, + { + "epoch": 0.44, + "learning_rate": 3.0984440113080586e-06, + "loss": 1.1612, + "step": 14618 + }, + { + "epoch": 0.44, + "learning_rate": 3.098207180009433e-06, + "loss": 1.1599, + "step": 14619 + }, + { + "epoch": 0.44, + "learning_rate": 3.097970343016163e-06, + "loss": 1.0674, + "step": 14620 + }, + { + "epoch": 0.44, + "learning_rate": 3.0977335003305033e-06, + "loss": 1.0992, + "step": 14621 + }, + { + "epoch": 0.44, + "learning_rate": 3.097496651954708e-06, + "loss": 1.1409, + "step": 14622 + }, + { + "epoch": 0.44, + "learning_rate": 3.097259797891033e-06, + "loss": 1.1318, + "step": 14623 + }, + { + "epoch": 0.44, + "learning_rate": 3.097022938141732e-06, + "loss": 1.2057, + "step": 14624 + }, + { + "epoch": 0.44, + "learning_rate": 3.0967860727090598e-06, + "loss": 1.2011, + "step": 14625 + }, + { + "epoch": 0.44, + "learning_rate": 3.096549201595272e-06, + "loss": 1.0654, + "step": 14626 + }, + { + "epoch": 0.44, + "learning_rate": 3.096312324802624e-06, + "loss": 1.0894, + "step": 14627 + }, + { + "epoch": 0.44, + "learning_rate": 3.0960754423333684e-06, + "loss": 1.0469, + "step": 14628 + }, + { + "epoch": 0.44, + "learning_rate": 3.095838554189763e-06, + "loss": 1.1129, + "step": 14629 + }, + { + "epoch": 0.44, + "learning_rate": 3.09560166037406e-06, + "loss": 1.2709, + "step": 14630 + }, + { + "epoch": 0.44, + "learning_rate": 3.0953647608885173e-06, + "loss": 1.1896, + "step": 14631 + }, + { + "epoch": 0.44, + "learning_rate": 3.0951278557353887e-06, + "loss": 1.0833, + "step": 14632 + }, + { + "epoch": 0.44, + "learning_rate": 3.094890944916929e-06, + "loss": 1.1313, + "step": 14633 + }, + { + "epoch": 0.44, + "learning_rate": 3.0946540284353943e-06, + "loss": 0.9858, + "step": 14634 + }, + { + "epoch": 0.44, + "learning_rate": 3.0944171062930395e-06, + "loss": 1.2241, + "step": 14635 + }, + { + "epoch": 0.44, + "learning_rate": 3.0941801784921205e-06, + "loss": 1.265, + "step": 14636 + }, + { + "epoch": 0.44, + "learning_rate": 3.0939432450348916e-06, + "loss": 1.1143, + "step": 14637 + }, + { + "epoch": 0.44, + "learning_rate": 3.0937063059236094e-06, + "loss": 1.1542, + "step": 14638 + }, + { + "epoch": 0.44, + "learning_rate": 3.0934693611605295e-06, + "loss": 1.1279, + "step": 14639 + }, + { + "epoch": 0.44, + "learning_rate": 3.093232410747907e-06, + "loss": 0.989, + "step": 14640 + }, + { + "epoch": 0.44, + "learning_rate": 3.0929954546879975e-06, + "loss": 1.0112, + "step": 14641 + }, + { + "epoch": 0.44, + "learning_rate": 3.092758492983057e-06, + "loss": 1.1883, + "step": 14642 + }, + { + "epoch": 0.44, + "learning_rate": 3.092521525635341e-06, + "loss": 1.1767, + "step": 14643 + }, + { + "epoch": 0.44, + "learning_rate": 3.092284552647105e-06, + "loss": 1.098, + "step": 14644 + }, + { + "epoch": 0.44, + "learning_rate": 3.0920475740206064e-06, + "loss": 1.1931, + "step": 14645 + }, + { + "epoch": 0.44, + "learning_rate": 3.091810589758099e-06, + "loss": 1.0893, + "step": 14646 + }, + { + "epoch": 0.44, + "learning_rate": 3.0915735998618406e-06, + "loss": 1.1791, + "step": 14647 + }, + { + "epoch": 0.44, + "learning_rate": 3.091336604334086e-06, + "loss": 1.0649, + "step": 14648 + }, + { + "epoch": 0.44, + "learning_rate": 3.0910996031770916e-06, + "loss": 1.1564, + "step": 14649 + }, + { + "epoch": 0.44, + "learning_rate": 3.0908625963931137e-06, + "loss": 1.1019, + "step": 14650 + }, + { + "epoch": 0.44, + "learning_rate": 3.0906255839844093e-06, + "loss": 1.1213, + "step": 14651 + }, + { + "epoch": 0.44, + "learning_rate": 3.0903885659532327e-06, + "loss": 1.064, + "step": 14652 + }, + { + "epoch": 0.44, + "learning_rate": 3.0901515423018417e-06, + "loss": 1.0818, + "step": 14653 + }, + { + "epoch": 0.44, + "learning_rate": 3.089914513032492e-06, + "loss": 1.2269, + "step": 14654 + }, + { + "epoch": 0.44, + "learning_rate": 3.089677478147441e-06, + "loss": 1.1635, + "step": 14655 + }, + { + "epoch": 0.44, + "learning_rate": 3.0894404376489433e-06, + "loss": 1.135, + "step": 14656 + }, + { + "epoch": 0.44, + "learning_rate": 3.0892033915392573e-06, + "loss": 1.1979, + "step": 14657 + }, + { + "epoch": 0.44, + "learning_rate": 3.088966339820639e-06, + "loss": 1.0381, + "step": 14658 + }, + { + "epoch": 0.44, + "learning_rate": 3.088729282495344e-06, + "loss": 1.182, + "step": 14659 + }, + { + "epoch": 0.44, + "learning_rate": 3.0884922195656304e-06, + "loss": 1.1091, + "step": 14660 + }, + { + "epoch": 0.44, + "learning_rate": 3.088255151033754e-06, + "loss": 1.0689, + "step": 14661 + }, + { + "epoch": 0.44, + "learning_rate": 3.0880180769019718e-06, + "loss": 1.1868, + "step": 14662 + }, + { + "epoch": 0.44, + "learning_rate": 3.087780997172541e-06, + "loss": 1.106, + "step": 14663 + }, + { + "epoch": 0.44, + "learning_rate": 3.0875439118477184e-06, + "loss": 1.1465, + "step": 14664 + }, + { + "epoch": 0.44, + "learning_rate": 3.0873068209297604e-06, + "loss": 1.1614, + "step": 14665 + }, + { + "epoch": 0.44, + "learning_rate": 3.0870697244209236e-06, + "loss": 1.1969, + "step": 14666 + }, + { + "epoch": 0.44, + "learning_rate": 3.0868326223234664e-06, + "loss": 1.127, + "step": 14667 + }, + { + "epoch": 0.44, + "learning_rate": 3.086595514639646e-06, + "loss": 1.2479, + "step": 14668 + }, + { + "epoch": 0.44, + "learning_rate": 3.0863584013717174e-06, + "loss": 1.1121, + "step": 14669 + }, + { + "epoch": 0.44, + "learning_rate": 3.0861212825219407e-06, + "loss": 1.2092, + "step": 14670 + }, + { + "epoch": 0.44, + "learning_rate": 3.0858841580925704e-06, + "loss": 1.1615, + "step": 14671 + }, + { + "epoch": 0.44, + "learning_rate": 3.085647028085865e-06, + "loss": 1.1111, + "step": 14672 + }, + { + "epoch": 0.44, + "learning_rate": 3.0854098925040833e-06, + "loss": 1.1444, + "step": 14673 + }, + { + "epoch": 0.44, + "learning_rate": 3.0851727513494808e-06, + "loss": 1.2431, + "step": 14674 + }, + { + "epoch": 0.44, + "learning_rate": 3.0849356046243157e-06, + "loss": 1.1693, + "step": 14675 + }, + { + "epoch": 0.44, + "learning_rate": 3.0846984523308445e-06, + "loss": 1.1588, + "step": 14676 + }, + { + "epoch": 0.44, + "learning_rate": 3.0844612944713267e-06, + "loss": 1.1873, + "step": 14677 + }, + { + "epoch": 0.44, + "learning_rate": 3.084224131048018e-06, + "loss": 1.113, + "step": 14678 + }, + { + "epoch": 0.44, + "learning_rate": 3.0839869620631768e-06, + "loss": 1.1453, + "step": 14679 + }, + { + "epoch": 0.44, + "learning_rate": 3.0837497875190615e-06, + "loss": 1.1719, + "step": 14680 + }, + { + "epoch": 0.44, + "learning_rate": 3.0835126074179293e-06, + "loss": 1.1417, + "step": 14681 + }, + { + "epoch": 0.44, + "learning_rate": 3.083275421762038e-06, + "loss": 1.0988, + "step": 14682 + }, + { + "epoch": 0.44, + "learning_rate": 3.083038230553646e-06, + "loss": 1.1409, + "step": 14683 + }, + { + "epoch": 0.44, + "learning_rate": 3.0828010337950105e-06, + "loss": 1.115, + "step": 14684 + }, + { + "epoch": 0.44, + "learning_rate": 3.08256383148839e-06, + "loss": 1.1482, + "step": 14685 + }, + { + "epoch": 0.44, + "learning_rate": 3.0823266236360428e-06, + "loss": 1.1849, + "step": 14686 + }, + { + "epoch": 0.44, + "learning_rate": 3.0820894102402253e-06, + "loss": 1.2848, + "step": 14687 + }, + { + "epoch": 0.44, + "learning_rate": 3.0818521913031984e-06, + "loss": 1.0839, + "step": 14688 + }, + { + "epoch": 0.44, + "learning_rate": 3.0816149668272176e-06, + "loss": 1.0945, + "step": 14689 + }, + { + "epoch": 0.44, + "learning_rate": 3.0813777368145437e-06, + "loss": 1.1216, + "step": 14690 + }, + { + "epoch": 0.44, + "learning_rate": 3.0811405012674327e-06, + "loss": 1.1013, + "step": 14691 + }, + { + "epoch": 0.44, + "learning_rate": 3.0809032601881446e-06, + "loss": 1.1941, + "step": 14692 + }, + { + "epoch": 0.44, + "learning_rate": 3.0806660135789375e-06, + "loss": 1.0532, + "step": 14693 + }, + { + "epoch": 0.44, + "learning_rate": 3.0804287614420684e-06, + "loss": 1.1483, + "step": 14694 + }, + { + "epoch": 0.44, + "learning_rate": 3.080191503779798e-06, + "loss": 1.1666, + "step": 14695 + }, + { + "epoch": 0.44, + "learning_rate": 3.079954240594384e-06, + "loss": 1.1475, + "step": 14696 + }, + { + "epoch": 0.44, + "learning_rate": 3.079716971888084e-06, + "loss": 1.1516, + "step": 14697 + }, + { + "epoch": 0.44, + "learning_rate": 3.0794796976631585e-06, + "loss": 1.1373, + "step": 14698 + }, + { + "epoch": 0.44, + "learning_rate": 3.0792424179218655e-06, + "loss": 1.178, + "step": 14699 + }, + { + "epoch": 0.44, + "learning_rate": 3.0790051326664634e-06, + "loss": 1.2847, + "step": 14700 + }, + { + "epoch": 0.44, + "learning_rate": 3.0787678418992112e-06, + "loss": 1.0834, + "step": 14701 + }, + { + "epoch": 0.44, + "learning_rate": 3.078530545622368e-06, + "loss": 1.1385, + "step": 14702 + }, + { + "epoch": 0.44, + "learning_rate": 3.078293243838193e-06, + "loss": 1.176, + "step": 14703 + }, + { + "epoch": 0.44, + "learning_rate": 3.078055936548944e-06, + "loss": 1.0701, + "step": 14704 + }, + { + "epoch": 0.44, + "learning_rate": 3.0778186237568814e-06, + "loss": 1.0605, + "step": 14705 + }, + { + "epoch": 0.44, + "learning_rate": 3.0775813054642632e-06, + "loss": 1.2028, + "step": 14706 + }, + { + "epoch": 0.44, + "learning_rate": 3.0773439816733496e-06, + "loss": 1.1182, + "step": 14707 + }, + { + "epoch": 0.44, + "learning_rate": 3.077106652386399e-06, + "loss": 1.0781, + "step": 14708 + }, + { + "epoch": 0.44, + "learning_rate": 3.076869317605672e-06, + "loss": 1.1337, + "step": 14709 + }, + { + "epoch": 0.44, + "learning_rate": 3.076631977333426e-06, + "loss": 1.1226, + "step": 14710 + }, + { + "epoch": 0.44, + "learning_rate": 3.0763946315719213e-06, + "loss": 1.0858, + "step": 14711 + }, + { + "epoch": 0.44, + "learning_rate": 3.076157280323418e-06, + "loss": 1.1463, + "step": 14712 + }, + { + "epoch": 0.44, + "learning_rate": 3.0759199235901745e-06, + "loss": 1.1273, + "step": 14713 + }, + { + "epoch": 0.44, + "learning_rate": 3.0756825613744506e-06, + "loss": 1.0483, + "step": 14714 + }, + { + "epoch": 0.44, + "learning_rate": 3.0754451936785057e-06, + "loss": 1.1028, + "step": 14715 + }, + { + "epoch": 0.44, + "learning_rate": 3.0752078205046006e-06, + "loss": 1.1893, + "step": 14716 + }, + { + "epoch": 0.44, + "learning_rate": 3.074970441854993e-06, + "loss": 1.2094, + "step": 14717 + }, + { + "epoch": 0.44, + "learning_rate": 3.0747330577319444e-06, + "loss": 1.1157, + "step": 14718 + }, + { + "epoch": 0.44, + "learning_rate": 3.0744956681377135e-06, + "loss": 1.2896, + "step": 14719 + }, + { + "epoch": 0.44, + "learning_rate": 3.0742582730745606e-06, + "loss": 1.1337, + "step": 14720 + }, + { + "epoch": 0.44, + "learning_rate": 3.0740208725447456e-06, + "loss": 1.1336, + "step": 14721 + }, + { + "epoch": 0.44, + "learning_rate": 3.073783466550529e-06, + "loss": 1.115, + "step": 14722 + }, + { + "epoch": 0.44, + "learning_rate": 3.073546055094169e-06, + "loss": 1.1548, + "step": 14723 + }, + { + "epoch": 0.44, + "learning_rate": 3.0733086381779274e-06, + "loss": 1.2521, + "step": 14724 + }, + { + "epoch": 0.44, + "learning_rate": 3.073071215804064e-06, + "loss": 1.111, + "step": 14725 + }, + { + "epoch": 0.44, + "learning_rate": 3.072833787974838e-06, + "loss": 1.15, + "step": 14726 + }, + { + "epoch": 0.44, + "learning_rate": 3.072596354692511e-06, + "loss": 1.0164, + "step": 14727 + }, + { + "epoch": 0.44, + "learning_rate": 3.0723589159593416e-06, + "loss": 1.0891, + "step": 14728 + }, + { + "epoch": 0.44, + "learning_rate": 3.0721214717775918e-06, + "loss": 1.0938, + "step": 14729 + }, + { + "epoch": 0.44, + "learning_rate": 3.07188402214952e-06, + "loss": 1.1459, + "step": 14730 + }, + { + "epoch": 0.44, + "learning_rate": 3.0716465670773887e-06, + "loss": 1.1202, + "step": 14731 + }, + { + "epoch": 0.44, + "learning_rate": 3.071409106563457e-06, + "loss": 1.0472, + "step": 14732 + }, + { + "epoch": 0.44, + "learning_rate": 3.0711716406099857e-06, + "loss": 1.1375, + "step": 14733 + }, + { + "epoch": 0.44, + "learning_rate": 3.0709341692192357e-06, + "loss": 1.0275, + "step": 14734 + }, + { + "epoch": 0.44, + "learning_rate": 3.070696692393467e-06, + "loss": 1.2274, + "step": 14735 + }, + { + "epoch": 0.44, + "learning_rate": 3.0704592101349414e-06, + "loss": 1.0761, + "step": 14736 + }, + { + "epoch": 0.44, + "learning_rate": 3.070221722445918e-06, + "loss": 1.2225, + "step": 14737 + }, + { + "epoch": 0.44, + "learning_rate": 3.069984229328659e-06, + "loss": 1.1825, + "step": 14738 + }, + { + "epoch": 0.44, + "learning_rate": 3.0697467307854243e-06, + "loss": 1.0791, + "step": 14739 + }, + { + "epoch": 0.44, + "learning_rate": 3.0695092268184755e-06, + "loss": 1.1956, + "step": 14740 + }, + { + "epoch": 0.44, + "learning_rate": 3.0692717174300727e-06, + "loss": 1.1542, + "step": 14741 + }, + { + "epoch": 0.44, + "learning_rate": 3.0690342026224785e-06, + "loss": 1.0583, + "step": 14742 + }, + { + "epoch": 0.44, + "learning_rate": 3.0687966823979515e-06, + "loss": 1.2639, + "step": 14743 + }, + { + "epoch": 0.44, + "learning_rate": 3.0685591567587545e-06, + "loss": 1.1705, + "step": 14744 + }, + { + "epoch": 0.44, + "learning_rate": 3.068321625707148e-06, + "loss": 1.0775, + "step": 14745 + }, + { + "epoch": 0.44, + "learning_rate": 3.068084089245394e-06, + "loss": 1.0995, + "step": 14746 + }, + { + "epoch": 0.44, + "learning_rate": 3.067846547375752e-06, + "loss": 1.0996, + "step": 14747 + }, + { + "epoch": 0.44, + "learning_rate": 3.0676090001004845e-06, + "loss": 1.1075, + "step": 14748 + }, + { + "epoch": 0.44, + "learning_rate": 3.067371447421853e-06, + "loss": 1.2621, + "step": 14749 + }, + { + "epoch": 0.44, + "learning_rate": 3.0671338893421186e-06, + "loss": 1.1689, + "step": 14750 + }, + { + "epoch": 0.44, + "learning_rate": 3.0668963258635424e-06, + "loss": 1.127, + "step": 14751 + }, + { + "epoch": 0.44, + "learning_rate": 3.0666587569883868e-06, + "loss": 1.1248, + "step": 14752 + }, + { + "epoch": 0.44, + "learning_rate": 3.0664211827189124e-06, + "loss": 1.0974, + "step": 14753 + }, + { + "epoch": 0.44, + "learning_rate": 3.066183603057381e-06, + "loss": 1.2842, + "step": 14754 + }, + { + "epoch": 0.44, + "learning_rate": 3.0659460180060546e-06, + "loss": 1.1293, + "step": 14755 + }, + { + "epoch": 0.44, + "learning_rate": 3.0657084275671943e-06, + "loss": 1.1981, + "step": 14756 + }, + { + "epoch": 0.44, + "learning_rate": 3.0654708317430633e-06, + "loss": 1.1049, + "step": 14757 + }, + { + "epoch": 0.44, + "learning_rate": 3.065233230535921e-06, + "loss": 1.1393, + "step": 14758 + }, + { + "epoch": 0.44, + "learning_rate": 3.0649956239480317e-06, + "loss": 1.1057, + "step": 14759 + }, + { + "epoch": 0.44, + "learning_rate": 3.0647580119816554e-06, + "loss": 1.2109, + "step": 14760 + }, + { + "epoch": 0.44, + "learning_rate": 3.064520394639055e-06, + "loss": 1.0641, + "step": 14761 + }, + { + "epoch": 0.44, + "learning_rate": 3.064282771922492e-06, + "loss": 1.2008, + "step": 14762 + }, + { + "epoch": 0.44, + "learning_rate": 3.0640451438342294e-06, + "loss": 1.1712, + "step": 14763 + }, + { + "epoch": 0.44, + "learning_rate": 3.0638075103765287e-06, + "loss": 1.1107, + "step": 14764 + }, + { + "epoch": 0.44, + "learning_rate": 3.063569871551651e-06, + "loss": 1.1293, + "step": 14765 + }, + { + "epoch": 0.44, + "learning_rate": 3.063332227361861e-06, + "loss": 1.0225, + "step": 14766 + }, + { + "epoch": 0.44, + "learning_rate": 3.0630945778094184e-06, + "loss": 1.2394, + "step": 14767 + }, + { + "epoch": 0.44, + "learning_rate": 3.062856922896587e-06, + "loss": 1.189, + "step": 14768 + }, + { + "epoch": 0.44, + "learning_rate": 3.062619262625629e-06, + "loss": 1.1292, + "step": 14769 + }, + { + "epoch": 0.44, + "learning_rate": 3.0623815969988067e-06, + "loss": 1.0402, + "step": 14770 + }, + { + "epoch": 0.44, + "learning_rate": 3.0621439260183816e-06, + "loss": 1.069, + "step": 14771 + }, + { + "epoch": 0.45, + "learning_rate": 3.061906249686618e-06, + "loss": 1.1075, + "step": 14772 + }, + { + "epoch": 0.45, + "learning_rate": 3.0616685680057774e-06, + "loss": 1.165, + "step": 14773 + }, + { + "epoch": 0.45, + "learning_rate": 3.0614308809781217e-06, + "loss": 1.2053, + "step": 14774 + }, + { + "epoch": 0.45, + "learning_rate": 3.0611931886059156e-06, + "loss": 1.1024, + "step": 14775 + }, + { + "epoch": 0.45, + "learning_rate": 3.0609554908914197e-06, + "loss": 1.1535, + "step": 14776 + }, + { + "epoch": 0.45, + "learning_rate": 3.060717787836898e-06, + "loss": 1.0752, + "step": 14777 + }, + { + "epoch": 0.45, + "learning_rate": 3.0604800794446127e-06, + "loss": 1.1179, + "step": 14778 + }, + { + "epoch": 0.45, + "learning_rate": 3.0602423657168272e-06, + "loss": 1.1052, + "step": 14779 + }, + { + "epoch": 0.45, + "learning_rate": 3.0600046466558043e-06, + "loss": 1.1312, + "step": 14780 + }, + { + "epoch": 0.45, + "learning_rate": 3.059766922263807e-06, + "loss": 1.0672, + "step": 14781 + }, + { + "epoch": 0.45, + "learning_rate": 3.059529192543098e-06, + "loss": 1.1547, + "step": 14782 + }, + { + "epoch": 0.45, + "learning_rate": 3.059291457495941e-06, + "loss": 1.1434, + "step": 14783 + }, + { + "epoch": 0.45, + "learning_rate": 3.0590537171245983e-06, + "loss": 1.1545, + "step": 14784 + }, + { + "epoch": 0.45, + "learning_rate": 3.0588159714313336e-06, + "loss": 1.1465, + "step": 14785 + }, + { + "epoch": 0.45, + "learning_rate": 3.0585782204184093e-06, + "loss": 1.2677, + "step": 14786 + }, + { + "epoch": 0.45, + "learning_rate": 3.0583404640880904e-06, + "loss": 1.1063, + "step": 14787 + }, + { + "epoch": 0.45, + "learning_rate": 3.0581027024426385e-06, + "loss": 1.044, + "step": 14788 + }, + { + "epoch": 0.45, + "learning_rate": 3.0578649354843177e-06, + "loss": 1.1429, + "step": 14789 + }, + { + "epoch": 0.45, + "learning_rate": 3.0576271632153913e-06, + "loss": 1.1365, + "step": 14790 + }, + { + "epoch": 0.45, + "learning_rate": 3.0573893856381234e-06, + "loss": 1.0804, + "step": 14791 + }, + { + "epoch": 0.45, + "learning_rate": 3.0571516027547764e-06, + "loss": 1.1697, + "step": 14792 + }, + { + "epoch": 0.45, + "learning_rate": 3.056913814567615e-06, + "loss": 1.2116, + "step": 14793 + }, + { + "epoch": 0.45, + "learning_rate": 3.0566760210789024e-06, + "loss": 1.1603, + "step": 14794 + }, + { + "epoch": 0.45, + "learning_rate": 3.0564382222909016e-06, + "loss": 1.1406, + "step": 14795 + }, + { + "epoch": 0.45, + "learning_rate": 3.0562004182058774e-06, + "loss": 1.0244, + "step": 14796 + }, + { + "epoch": 0.45, + "learning_rate": 3.055962608826093e-06, + "loss": 1.0757, + "step": 14797 + }, + { + "epoch": 0.45, + "learning_rate": 3.0557247941538125e-06, + "loss": 1.1399, + "step": 14798 + }, + { + "epoch": 0.45, + "learning_rate": 3.055486974191299e-06, + "loss": 1.0634, + "step": 14799 + }, + { + "epoch": 0.45, + "learning_rate": 3.0552491489408177e-06, + "loss": 0.9146, + "step": 14800 + }, + { + "epoch": 0.45, + "learning_rate": 3.0550113184046316e-06, + "loss": 1.1141, + "step": 14801 + }, + { + "epoch": 0.45, + "learning_rate": 3.0547734825850047e-06, + "loss": 1.0416, + "step": 14802 + }, + { + "epoch": 0.45, + "learning_rate": 3.0545356414842015e-06, + "loss": 1.1083, + "step": 14803 + }, + { + "epoch": 0.45, + "learning_rate": 3.054297795104486e-06, + "loss": 1.2559, + "step": 14804 + }, + { + "epoch": 0.45, + "learning_rate": 3.0540599434481234e-06, + "loss": 1.1813, + "step": 14805 + }, + { + "epoch": 0.45, + "learning_rate": 3.0538220865173764e-06, + "loss": 1.1415, + "step": 14806 + }, + { + "epoch": 0.45, + "learning_rate": 3.05358422431451e-06, + "loss": 1.0627, + "step": 14807 + }, + { + "epoch": 0.45, + "learning_rate": 3.0533463568417878e-06, + "loss": 1.1559, + "step": 14808 + }, + { + "epoch": 0.45, + "learning_rate": 3.0531084841014757e-06, + "loss": 1.0953, + "step": 14809 + }, + { + "epoch": 0.45, + "learning_rate": 3.052870606095836e-06, + "loss": 1.1125, + "step": 14810 + }, + { + "epoch": 0.45, + "learning_rate": 3.052632722827136e-06, + "loss": 1.0751, + "step": 14811 + }, + { + "epoch": 0.45, + "learning_rate": 3.052394834297637e-06, + "loss": 1.1754, + "step": 14812 + }, + { + "epoch": 0.45, + "learning_rate": 3.052156940509607e-06, + "loss": 1.0242, + "step": 14813 + }, + { + "epoch": 0.45, + "learning_rate": 3.0519190414653073e-06, + "loss": 1.1301, + "step": 14814 + }, + { + "epoch": 0.45, + "learning_rate": 3.051681137167005e-06, + "loss": 0.9966, + "step": 14815 + }, + { + "epoch": 0.45, + "learning_rate": 3.0514432276169635e-06, + "loss": 1.1392, + "step": 14816 + }, + { + "epoch": 0.45, + "learning_rate": 3.051205312817448e-06, + "loss": 1.1576, + "step": 14817 + }, + { + "epoch": 0.45, + "learning_rate": 3.0509673927707233e-06, + "loss": 1.0967, + "step": 14818 + }, + { + "epoch": 0.45, + "learning_rate": 3.0507294674790544e-06, + "loss": 1.1479, + "step": 14819 + }, + { + "epoch": 0.45, + "learning_rate": 3.050491536944707e-06, + "loss": 1.0662, + "step": 14820 + }, + { + "epoch": 0.45, + "learning_rate": 3.0502536011699444e-06, + "loss": 1.1151, + "step": 14821 + }, + { + "epoch": 0.45, + "learning_rate": 3.0500156601570336e-06, + "loss": 1.1435, + "step": 14822 + }, + { + "epoch": 0.45, + "learning_rate": 3.0497777139082374e-06, + "loss": 1.1257, + "step": 14823 + }, + { + "epoch": 0.45, + "learning_rate": 3.049539762425823e-06, + "loss": 1.0964, + "step": 14824 + }, + { + "epoch": 0.45, + "learning_rate": 3.0493018057120543e-06, + "loss": 1.2317, + "step": 14825 + }, + { + "epoch": 0.45, + "learning_rate": 3.0490638437691974e-06, + "loss": 1.2184, + "step": 14826 + }, + { + "epoch": 0.45, + "learning_rate": 3.0488258765995166e-06, + "loss": 1.0772, + "step": 14827 + }, + { + "epoch": 0.45, + "learning_rate": 3.0485879042052785e-06, + "loss": 1.0153, + "step": 14828 + }, + { + "epoch": 0.45, + "learning_rate": 3.048349926588747e-06, + "loss": 1.2186, + "step": 14829 + }, + { + "epoch": 0.45, + "learning_rate": 3.0481119437521884e-06, + "loss": 1.2355, + "step": 14830 + }, + { + "epoch": 0.45, + "learning_rate": 3.0478739556978676e-06, + "loss": 0.9916, + "step": 14831 + }, + { + "epoch": 0.45, + "learning_rate": 3.047635962428051e-06, + "loss": 1.067, + "step": 14832 + }, + { + "epoch": 0.45, + "learning_rate": 3.0473979639450048e-06, + "loss": 1.0667, + "step": 14833 + }, + { + "epoch": 0.45, + "learning_rate": 3.047159960250992e-06, + "loss": 1.0767, + "step": 14834 + }, + { + "epoch": 0.45, + "learning_rate": 3.046921951348281e-06, + "loss": 1.0927, + "step": 14835 + }, + { + "epoch": 0.45, + "learning_rate": 3.0466839372391365e-06, + "loss": 1.106, + "step": 14836 + }, + { + "epoch": 0.45, + "learning_rate": 3.046445917925824e-06, + "loss": 1.1881, + "step": 14837 + }, + { + "epoch": 0.45, + "learning_rate": 3.0462078934106093e-06, + "loss": 1.1042, + "step": 14838 + }, + { + "epoch": 0.45, + "learning_rate": 3.045969863695759e-06, + "loss": 1.1733, + "step": 14839 + }, + { + "epoch": 0.45, + "learning_rate": 3.045731828783538e-06, + "loss": 1.2003, + "step": 14840 + }, + { + "epoch": 0.45, + "learning_rate": 3.0454937886762133e-06, + "loss": 1.1149, + "step": 14841 + }, + { + "epoch": 0.45, + "learning_rate": 3.04525574337605e-06, + "loss": 1.1506, + "step": 14842 + }, + { + "epoch": 0.45, + "learning_rate": 3.045017692885314e-06, + "loss": 1.0517, + "step": 14843 + }, + { + "epoch": 0.45, + "learning_rate": 3.044779637206273e-06, + "loss": 1.0084, + "step": 14844 + }, + { + "epoch": 0.45, + "learning_rate": 3.044541576341192e-06, + "loss": 1.1625, + "step": 14845 + }, + { + "epoch": 0.45, + "learning_rate": 3.044303510292338e-06, + "loss": 1.0669, + "step": 14846 + }, + { + "epoch": 0.45, + "learning_rate": 3.0440654390619756e-06, + "loss": 1.1125, + "step": 14847 + }, + { + "epoch": 0.45, + "learning_rate": 3.0438273626523733e-06, + "loss": 1.1068, + "step": 14848 + }, + { + "epoch": 0.45, + "learning_rate": 3.0435892810657958e-06, + "loss": 1.0877, + "step": 14849 + }, + { + "epoch": 0.45, + "learning_rate": 3.0433511943045106e-06, + "loss": 1.27, + "step": 14850 + }, + { + "epoch": 0.45, + "learning_rate": 3.043113102370783e-06, + "loss": 1.0872, + "step": 14851 + }, + { + "epoch": 0.45, + "learning_rate": 3.0428750052668814e-06, + "loss": 1.0952, + "step": 14852 + }, + { + "epoch": 0.45, + "learning_rate": 3.0426369029950703e-06, + "loss": 1.1595, + "step": 14853 + }, + { + "epoch": 0.45, + "learning_rate": 3.0423987955576177e-06, + "loss": 1.1741, + "step": 14854 + }, + { + "epoch": 0.45, + "learning_rate": 3.0421606829567895e-06, + "loss": 1.1337, + "step": 14855 + }, + { + "epoch": 0.45, + "learning_rate": 3.0419225651948524e-06, + "loss": 1.176, + "step": 14856 + }, + { + "epoch": 0.45, + "learning_rate": 3.041684442274074e-06, + "loss": 1.1602, + "step": 14857 + }, + { + "epoch": 0.45, + "learning_rate": 3.0414463141967203e-06, + "loss": 1.1531, + "step": 14858 + }, + { + "epoch": 0.45, + "learning_rate": 3.0412081809650583e-06, + "loss": 1.1306, + "step": 14859 + }, + { + "epoch": 0.45, + "learning_rate": 3.0409700425813553e-06, + "loss": 1.2427, + "step": 14860 + }, + { + "epoch": 0.45, + "learning_rate": 3.0407318990478783e-06, + "loss": 1.2053, + "step": 14861 + }, + { + "epoch": 0.45, + "learning_rate": 3.040493750366894e-06, + "loss": 1.3325, + "step": 14862 + }, + { + "epoch": 0.45, + "learning_rate": 3.0402555965406694e-06, + "loss": 1.1187, + "step": 14863 + }, + { + "epoch": 0.45, + "learning_rate": 3.0400174375714713e-06, + "loss": 1.0901, + "step": 14864 + }, + { + "epoch": 0.45, + "learning_rate": 3.0397792734615684e-06, + "loss": 1.1011, + "step": 14865 + }, + { + "epoch": 0.45, + "learning_rate": 3.0395411042132256e-06, + "loss": 1.1588, + "step": 14866 + }, + { + "epoch": 0.45, + "learning_rate": 3.039302929828712e-06, + "loss": 1.2394, + "step": 14867 + }, + { + "epoch": 0.45, + "learning_rate": 3.0390647503102937e-06, + "loss": 1.2151, + "step": 14868 + }, + { + "epoch": 0.45, + "learning_rate": 3.0388265656602395e-06, + "loss": 1.0953, + "step": 14869 + }, + { + "epoch": 0.45, + "learning_rate": 3.038588375880815e-06, + "loss": 1.1587, + "step": 14870 + }, + { + "epoch": 0.45, + "learning_rate": 3.0383501809742888e-06, + "loss": 1.1756, + "step": 14871 + }, + { + "epoch": 0.45, + "learning_rate": 3.0381119809429277e-06, + "loss": 1.0594, + "step": 14872 + }, + { + "epoch": 0.45, + "learning_rate": 3.037873775789e-06, + "loss": 1.041, + "step": 14873 + }, + { + "epoch": 0.45, + "learning_rate": 3.0376355655147738e-06, + "loss": 1.1254, + "step": 14874 + }, + { + "epoch": 0.45, + "learning_rate": 3.037397350122515e-06, + "loss": 1.0798, + "step": 14875 + }, + { + "epoch": 0.45, + "learning_rate": 3.037159129614493e-06, + "loss": 1.1326, + "step": 14876 + }, + { + "epoch": 0.45, + "learning_rate": 3.0369209039929744e-06, + "loss": 1.2007, + "step": 14877 + }, + { + "epoch": 0.45, + "learning_rate": 3.036682673260228e-06, + "loss": 1.1541, + "step": 14878 + }, + { + "epoch": 0.45, + "learning_rate": 3.03644443741852e-06, + "loss": 1.1207, + "step": 14879 + }, + { + "epoch": 0.45, + "learning_rate": 3.03620619647012e-06, + "loss": 1.1224, + "step": 14880 + }, + { + "epoch": 0.45, + "learning_rate": 3.0359679504172944e-06, + "loss": 1.2437, + "step": 14881 + }, + { + "epoch": 0.45, + "learning_rate": 3.0357296992623132e-06, + "loss": 1.199, + "step": 14882 + }, + { + "epoch": 0.45, + "learning_rate": 3.0354914430074424e-06, + "loss": 1.0492, + "step": 14883 + }, + { + "epoch": 0.45, + "learning_rate": 3.035253181654951e-06, + "loss": 1.0746, + "step": 14884 + }, + { + "epoch": 0.45, + "learning_rate": 3.0350149152071073e-06, + "loss": 1.0243, + "step": 14885 + }, + { + "epoch": 0.45, + "learning_rate": 3.034776643666179e-06, + "loss": 1.1371, + "step": 14886 + }, + { + "epoch": 0.45, + "learning_rate": 3.034538367034435e-06, + "loss": 1.2206, + "step": 14887 + }, + { + "epoch": 0.45, + "learning_rate": 3.0343000853141434e-06, + "loss": 1.1569, + "step": 14888 + }, + { + "epoch": 0.45, + "learning_rate": 3.0340617985075726e-06, + "loss": 1.1542, + "step": 14889 + }, + { + "epoch": 0.45, + "learning_rate": 3.03382350661699e-06, + "loss": 1.0891, + "step": 14890 + }, + { + "epoch": 0.45, + "learning_rate": 3.033585209644665e-06, + "loss": 1.1248, + "step": 14891 + }, + { + "epoch": 0.45, + "learning_rate": 3.0333469075928657e-06, + "loss": 1.0459, + "step": 14892 + }, + { + "epoch": 0.45, + "learning_rate": 3.033108600463861e-06, + "loss": 1.0521, + "step": 14893 + }, + { + "epoch": 0.45, + "learning_rate": 3.032870288259918e-06, + "loss": 1.0944, + "step": 14894 + }, + { + "epoch": 0.45, + "learning_rate": 3.032631970983308e-06, + "loss": 1.0605, + "step": 14895 + }, + { + "epoch": 0.45, + "learning_rate": 3.0323936486362977e-06, + "loss": 1.1127, + "step": 14896 + }, + { + "epoch": 0.45, + "learning_rate": 3.0321553212211556e-06, + "loss": 1.0903, + "step": 14897 + }, + { + "epoch": 0.45, + "learning_rate": 3.0319169887401517e-06, + "loss": 1.1921, + "step": 14898 + }, + { + "epoch": 0.45, + "learning_rate": 3.0316786511955544e-06, + "loss": 1.015, + "step": 14899 + }, + { + "epoch": 0.45, + "learning_rate": 3.0314403085896315e-06, + "loss": 1.1487, + "step": 14900 + }, + { + "epoch": 0.45, + "learning_rate": 3.0312019609246536e-06, + "loss": 1.0677, + "step": 14901 + }, + { + "epoch": 0.45, + "learning_rate": 3.0309636082028885e-06, + "loss": 1.0962, + "step": 14902 + }, + { + "epoch": 0.45, + "learning_rate": 3.030725250426606e-06, + "loss": 1.048, + "step": 14903 + }, + { + "epoch": 0.45, + "learning_rate": 3.0304868875980747e-06, + "loss": 1.1287, + "step": 14904 + }, + { + "epoch": 0.45, + "learning_rate": 3.0302485197195635e-06, + "loss": 1.2548, + "step": 14905 + }, + { + "epoch": 0.45, + "learning_rate": 3.0300101467933425e-06, + "loss": 1.1954, + "step": 14906 + }, + { + "epoch": 0.45, + "learning_rate": 3.029771768821679e-06, + "loss": 1.0962, + "step": 14907 + }, + { + "epoch": 0.45, + "learning_rate": 3.0295333858068445e-06, + "loss": 1.0999, + "step": 14908 + }, + { + "epoch": 0.45, + "learning_rate": 3.029294997751106e-06, + "loss": 1.0826, + "step": 14909 + }, + { + "epoch": 0.45, + "learning_rate": 3.0290566046567344e-06, + "loss": 1.1889, + "step": 14910 + }, + { + "epoch": 0.45, + "learning_rate": 3.0288182065259997e-06, + "loss": 1.2178, + "step": 14911 + }, + { + "epoch": 0.45, + "learning_rate": 3.028579803361169e-06, + "loss": 0.9716, + "step": 14912 + }, + { + "epoch": 0.45, + "learning_rate": 3.0283413951645135e-06, + "loss": 1.0901, + "step": 14913 + }, + { + "epoch": 0.45, + "learning_rate": 3.028102981938303e-06, + "loss": 1.0308, + "step": 14914 + }, + { + "epoch": 0.45, + "learning_rate": 3.027864563684806e-06, + "loss": 1.0925, + "step": 14915 + }, + { + "epoch": 0.45, + "learning_rate": 3.0276261404062925e-06, + "loss": 1.0338, + "step": 14916 + }, + { + "epoch": 0.45, + "learning_rate": 3.027387712105033e-06, + "loss": 1.1744, + "step": 14917 + }, + { + "epoch": 0.45, + "learning_rate": 3.027149278783296e-06, + "loss": 1.3307, + "step": 14918 + }, + { + "epoch": 0.45, + "learning_rate": 3.0269108404433516e-06, + "loss": 1.1037, + "step": 14919 + }, + { + "epoch": 0.45, + "learning_rate": 3.0266723970874696e-06, + "loss": 1.1788, + "step": 14920 + }, + { + "epoch": 0.45, + "learning_rate": 3.026433948717921e-06, + "loss": 1.0553, + "step": 14921 + }, + { + "epoch": 0.45, + "learning_rate": 3.026195495336973e-06, + "loss": 1.1447, + "step": 14922 + }, + { + "epoch": 0.45, + "learning_rate": 3.025957036946899e-06, + "loss": 1.1297, + "step": 14923 + }, + { + "epoch": 0.45, + "learning_rate": 3.0257185735499667e-06, + "loss": 1.0829, + "step": 14924 + }, + { + "epoch": 0.45, + "learning_rate": 3.025480105148446e-06, + "loss": 1.1163, + "step": 14925 + }, + { + "epoch": 0.45, + "learning_rate": 3.0252416317446087e-06, + "loss": 1.1706, + "step": 14926 + }, + { + "epoch": 0.45, + "learning_rate": 3.025003153340724e-06, + "loss": 1.121, + "step": 14927 + }, + { + "epoch": 0.45, + "learning_rate": 3.024764669939062e-06, + "loss": 1.1783, + "step": 14928 + }, + { + "epoch": 0.45, + "learning_rate": 3.0245261815418923e-06, + "loss": 1.0968, + "step": 14929 + }, + { + "epoch": 0.45, + "learning_rate": 3.024287688151488e-06, + "loss": 1.0508, + "step": 14930 + }, + { + "epoch": 0.45, + "learning_rate": 3.0240491897701154e-06, + "loss": 1.1603, + "step": 14931 + }, + { + "epoch": 0.45, + "learning_rate": 3.023810686400048e-06, + "loss": 1.1132, + "step": 14932 + }, + { + "epoch": 0.45, + "learning_rate": 3.0235721780435547e-06, + "loss": 1.0547, + "step": 14933 + }, + { + "epoch": 0.45, + "learning_rate": 3.0233336647029065e-06, + "loss": 1.09, + "step": 14934 + }, + { + "epoch": 0.45, + "learning_rate": 3.0230951463803736e-06, + "loss": 1.0119, + "step": 14935 + }, + { + "epoch": 0.45, + "learning_rate": 3.0228566230782275e-06, + "loss": 1.2341, + "step": 14936 + }, + { + "epoch": 0.45, + "learning_rate": 3.0226180947987375e-06, + "loss": 1.2206, + "step": 14937 + }, + { + "epoch": 0.45, + "learning_rate": 3.0223795615441754e-06, + "loss": 1.1182, + "step": 14938 + }, + { + "epoch": 0.45, + "learning_rate": 3.0221410233168107e-06, + "loss": 1.1302, + "step": 14939 + }, + { + "epoch": 0.45, + "learning_rate": 3.0219024801189157e-06, + "loss": 1.1982, + "step": 14940 + }, + { + "epoch": 0.45, + "learning_rate": 3.0216639319527604e-06, + "loss": 1.1483, + "step": 14941 + }, + { + "epoch": 0.45, + "learning_rate": 3.0214253788206148e-06, + "loss": 1.1927, + "step": 14942 + }, + { + "epoch": 0.45, + "learning_rate": 3.021186820724752e-06, + "loss": 1.1354, + "step": 14943 + }, + { + "epoch": 0.45, + "learning_rate": 3.020948257667441e-06, + "loss": 1.0372, + "step": 14944 + }, + { + "epoch": 0.45, + "learning_rate": 3.020709689650954e-06, + "loss": 1.1368, + "step": 14945 + }, + { + "epoch": 0.45, + "learning_rate": 3.0204711166775615e-06, + "loss": 1.145, + "step": 14946 + }, + { + "epoch": 0.45, + "learning_rate": 3.020232538749534e-06, + "loss": 1.0741, + "step": 14947 + }, + { + "epoch": 0.45, + "learning_rate": 3.019993955869144e-06, + "loss": 1.1126, + "step": 14948 + }, + { + "epoch": 0.45, + "learning_rate": 3.0197553680386617e-06, + "loss": 1.0806, + "step": 14949 + }, + { + "epoch": 0.45, + "learning_rate": 3.019516775260358e-06, + "loss": 1.1036, + "step": 14950 + }, + { + "epoch": 0.45, + "learning_rate": 3.0192781775365047e-06, + "loss": 1.1358, + "step": 14951 + }, + { + "epoch": 0.45, + "learning_rate": 3.0190395748693747e-06, + "loss": 1.1465, + "step": 14952 + }, + { + "epoch": 0.45, + "learning_rate": 3.018800967261237e-06, + "loss": 0.9894, + "step": 14953 + }, + { + "epoch": 0.45, + "learning_rate": 3.0185623547143633e-06, + "loss": 1.1562, + "step": 14954 + }, + { + "epoch": 0.45, + "learning_rate": 3.0183237372310265e-06, + "loss": 1.1361, + "step": 14955 + }, + { + "epoch": 0.45, + "learning_rate": 3.0180851148134976e-06, + "loss": 1.1638, + "step": 14956 + }, + { + "epoch": 0.45, + "learning_rate": 3.0178464874640473e-06, + "loss": 1.1564, + "step": 14957 + }, + { + "epoch": 0.45, + "learning_rate": 3.0176078551849487e-06, + "loss": 1.224, + "step": 14958 + }, + { + "epoch": 0.45, + "learning_rate": 3.017369217978472e-06, + "loss": 1.1669, + "step": 14959 + }, + { + "epoch": 0.45, + "learning_rate": 3.0171305758468893e-06, + "loss": 1.047, + "step": 14960 + }, + { + "epoch": 0.45, + "learning_rate": 3.0168919287924732e-06, + "loss": 1.2891, + "step": 14961 + }, + { + "epoch": 0.45, + "learning_rate": 3.016653276817495e-06, + "loss": 1.0485, + "step": 14962 + }, + { + "epoch": 0.45, + "learning_rate": 3.0164146199242254e-06, + "loss": 1.0698, + "step": 14963 + }, + { + "epoch": 0.45, + "learning_rate": 3.016175958114938e-06, + "loss": 1.2037, + "step": 14964 + }, + { + "epoch": 0.45, + "learning_rate": 3.015937291391904e-06, + "loss": 1.0697, + "step": 14965 + }, + { + "epoch": 0.45, + "learning_rate": 3.0156986197573956e-06, + "loss": 1.0734, + "step": 14966 + }, + { + "epoch": 0.45, + "learning_rate": 3.0154599432136842e-06, + "loss": 1.1746, + "step": 14967 + }, + { + "epoch": 0.45, + "learning_rate": 3.0152212617630427e-06, + "loss": 1.1586, + "step": 14968 + }, + { + "epoch": 0.45, + "learning_rate": 3.0149825754077434e-06, + "loss": 1.1862, + "step": 14969 + }, + { + "epoch": 0.45, + "learning_rate": 3.014743884150057e-06, + "loss": 1.1271, + "step": 14970 + }, + { + "epoch": 0.45, + "learning_rate": 3.0145051879922576e-06, + "loss": 1.1592, + "step": 14971 + }, + { + "epoch": 0.45, + "learning_rate": 3.0142664869366163e-06, + "loss": 1.1242, + "step": 14972 + }, + { + "epoch": 0.45, + "learning_rate": 3.014027780985406e-06, + "loss": 1.1035, + "step": 14973 + }, + { + "epoch": 0.45, + "learning_rate": 3.0137890701408982e-06, + "loss": 1.2027, + "step": 14974 + }, + { + "epoch": 0.45, + "learning_rate": 3.0135503544053666e-06, + "loss": 1.1534, + "step": 14975 + }, + { + "epoch": 0.45, + "learning_rate": 3.0133116337810823e-06, + "loss": 1.0423, + "step": 14976 + }, + { + "epoch": 0.45, + "learning_rate": 3.013072908270319e-06, + "loss": 1.0829, + "step": 14977 + }, + { + "epoch": 0.45, + "learning_rate": 3.012834177875349e-06, + "loss": 1.2991, + "step": 14978 + }, + { + "epoch": 0.45, + "learning_rate": 3.012595442598444e-06, + "loss": 1.1431, + "step": 14979 + }, + { + "epoch": 0.45, + "learning_rate": 3.0123567024418763e-06, + "loss": 1.0403, + "step": 14980 + }, + { + "epoch": 0.45, + "learning_rate": 3.012117957407921e-06, + "loss": 1.1014, + "step": 14981 + }, + { + "epoch": 0.45, + "learning_rate": 3.011879207498849e-06, + "loss": 1.0923, + "step": 14982 + }, + { + "epoch": 0.45, + "learning_rate": 3.0116404527169336e-06, + "loss": 1.05, + "step": 14983 + }, + { + "epoch": 0.45, + "learning_rate": 3.0114016930644475e-06, + "loss": 1.0977, + "step": 14984 + }, + { + "epoch": 0.45, + "learning_rate": 3.0111629285436633e-06, + "loss": 1.0594, + "step": 14985 + }, + { + "epoch": 0.45, + "learning_rate": 3.010924159156855e-06, + "loss": 1.1941, + "step": 14986 + }, + { + "epoch": 0.45, + "learning_rate": 3.010685384906294e-06, + "loss": 1.1496, + "step": 14987 + }, + { + "epoch": 0.45, + "learning_rate": 3.0104466057942543e-06, + "loss": 1.1786, + "step": 14988 + }, + { + "epoch": 0.45, + "learning_rate": 3.0102078218230084e-06, + "loss": 1.1038, + "step": 14989 + }, + { + "epoch": 0.45, + "learning_rate": 3.00996903299483e-06, + "loss": 1.107, + "step": 14990 + }, + { + "epoch": 0.45, + "learning_rate": 3.0097302393119926e-06, + "loss": 1.2237, + "step": 14991 + }, + { + "epoch": 0.45, + "learning_rate": 3.0094914407767678e-06, + "loss": 1.2612, + "step": 14992 + }, + { + "epoch": 0.45, + "learning_rate": 3.009252637391431e-06, + "loss": 1.1642, + "step": 14993 + }, + { + "epoch": 0.45, + "learning_rate": 3.0090138291582533e-06, + "loss": 1.2562, + "step": 14994 + }, + { + "epoch": 0.45, + "learning_rate": 3.008775016079509e-06, + "loss": 1.1235, + "step": 14995 + }, + { + "epoch": 0.45, + "learning_rate": 3.008536198157472e-06, + "loss": 1.114, + "step": 14996 + }, + { + "epoch": 0.45, + "learning_rate": 3.0082973753944158e-06, + "loss": 1.053, + "step": 14997 + }, + { + "epoch": 0.45, + "learning_rate": 3.008058547792613e-06, + "loss": 1.1693, + "step": 14998 + }, + { + "epoch": 0.45, + "learning_rate": 3.0078197153543375e-06, + "loss": 1.0311, + "step": 14999 + }, + { + "epoch": 0.45, + "learning_rate": 3.007580878081863e-06, + "loss": 1.1408, + "step": 15000 + }, + { + "epoch": 0.45, + "learning_rate": 3.007342035977463e-06, + "loss": 1.0805, + "step": 15001 + }, + { + "epoch": 0.45, + "learning_rate": 3.007103189043411e-06, + "loss": 1.0815, + "step": 15002 + }, + { + "epoch": 0.45, + "learning_rate": 3.0068643372819807e-06, + "loss": 1.132, + "step": 15003 + }, + { + "epoch": 0.45, + "learning_rate": 3.0066254806954465e-06, + "loss": 1.2695, + "step": 15004 + }, + { + "epoch": 0.45, + "learning_rate": 3.006386619286081e-06, + "loss": 1.1483, + "step": 15005 + }, + { + "epoch": 0.45, + "learning_rate": 3.00614775305616e-06, + "loss": 1.1975, + "step": 15006 + }, + { + "epoch": 0.45, + "learning_rate": 3.005908882007955e-06, + "loss": 1.1371, + "step": 15007 + }, + { + "epoch": 0.45, + "learning_rate": 3.0056700061437416e-06, + "loss": 1.1133, + "step": 15008 + }, + { + "epoch": 0.45, + "learning_rate": 3.0054311254657925e-06, + "loss": 1.1273, + "step": 15009 + }, + { + "epoch": 0.45, + "learning_rate": 3.0051922399763837e-06, + "loss": 1.0631, + "step": 15010 + }, + { + "epoch": 0.45, + "learning_rate": 3.004953349677787e-06, + "loss": 1.1359, + "step": 15011 + }, + { + "epoch": 0.45, + "learning_rate": 3.004714454572279e-06, + "loss": 1.1047, + "step": 15012 + }, + { + "epoch": 0.45, + "learning_rate": 3.0044755546621314e-06, + "loss": 1.106, + "step": 15013 + }, + { + "epoch": 0.45, + "learning_rate": 3.00423664994962e-06, + "loss": 1.152, + "step": 15014 + }, + { + "epoch": 0.45, + "learning_rate": 3.003997740437018e-06, + "loss": 1.0988, + "step": 15015 + }, + { + "epoch": 0.45, + "learning_rate": 3.0037588261266004e-06, + "loss": 1.0496, + "step": 15016 + }, + { + "epoch": 0.45, + "learning_rate": 3.003519907020642e-06, + "loss": 1.162, + "step": 15017 + }, + { + "epoch": 0.45, + "learning_rate": 3.0032809831214157e-06, + "loss": 1.1252, + "step": 15018 + }, + { + "epoch": 0.45, + "learning_rate": 3.003042054431198e-06, + "loss": 1.0586, + "step": 15019 + }, + { + "epoch": 0.45, + "learning_rate": 3.002803120952261e-06, + "loss": 1.1463, + "step": 15020 + }, + { + "epoch": 0.45, + "learning_rate": 3.00256418268688e-06, + "loss": 1.1293, + "step": 15021 + }, + { + "epoch": 0.45, + "learning_rate": 3.0023252396373315e-06, + "loss": 1.0838, + "step": 15022 + }, + { + "epoch": 0.45, + "learning_rate": 3.002086291805888e-06, + "loss": 1.2036, + "step": 15023 + }, + { + "epoch": 0.45, + "learning_rate": 3.0018473391948244e-06, + "loss": 1.0673, + "step": 15024 + }, + { + "epoch": 0.45, + "learning_rate": 3.001608381806417e-06, + "loss": 1.1108, + "step": 15025 + }, + { + "epoch": 0.45, + "learning_rate": 3.001369419642938e-06, + "loss": 1.1023, + "step": 15026 + }, + { + "epoch": 0.45, + "learning_rate": 3.0011304527066646e-06, + "loss": 1.067, + "step": 15027 + }, + { + "epoch": 0.45, + "learning_rate": 3.0008914809998707e-06, + "loss": 1.0644, + "step": 15028 + }, + { + "epoch": 0.45, + "learning_rate": 3.000652504524831e-06, + "loss": 1.0986, + "step": 15029 + }, + { + "epoch": 0.45, + "learning_rate": 3.00041352328382e-06, + "loss": 1.1628, + "step": 15030 + }, + { + "epoch": 0.45, + "learning_rate": 3.0001745372791134e-06, + "loss": 1.2697, + "step": 15031 + }, + { + "epoch": 0.45, + "learning_rate": 2.9999355465129863e-06, + "loss": 1.1801, + "step": 15032 + }, + { + "epoch": 0.45, + "learning_rate": 2.9996965509877135e-06, + "loss": 1.1409, + "step": 15033 + }, + { + "epoch": 0.45, + "learning_rate": 2.9994575507055706e-06, + "loss": 1.1143, + "step": 15034 + }, + { + "epoch": 0.45, + "learning_rate": 2.9992185456688323e-06, + "loss": 1.0839, + "step": 15035 + }, + { + "epoch": 0.45, + "learning_rate": 2.998979535879773e-06, + "loss": 1.1321, + "step": 15036 + }, + { + "epoch": 0.45, + "learning_rate": 2.9987405213406696e-06, + "loss": 1.066, + "step": 15037 + }, + { + "epoch": 0.45, + "learning_rate": 2.9985015020537967e-06, + "loss": 1.1416, + "step": 15038 + }, + { + "epoch": 0.45, + "learning_rate": 2.9982624780214293e-06, + "loss": 1.152, + "step": 15039 + }, + { + "epoch": 0.45, + "learning_rate": 2.998023449245843e-06, + "loss": 1.1181, + "step": 15040 + }, + { + "epoch": 0.45, + "learning_rate": 2.9977844157293134e-06, + "loss": 1.1052, + "step": 15041 + }, + { + "epoch": 0.45, + "learning_rate": 2.9975453774741164e-06, + "loss": 1.1062, + "step": 15042 + }, + { + "epoch": 0.45, + "learning_rate": 2.9973063344825267e-06, + "loss": 1.1058, + "step": 15043 + }, + { + "epoch": 0.45, + "learning_rate": 2.9970672867568195e-06, + "loss": 1.0695, + "step": 15044 + }, + { + "epoch": 0.45, + "learning_rate": 2.996828234299272e-06, + "loss": 1.1589, + "step": 15045 + }, + { + "epoch": 0.45, + "learning_rate": 2.9965891771121584e-06, + "loss": 1.0209, + "step": 15046 + }, + { + "epoch": 0.45, + "learning_rate": 2.9963501151977557e-06, + "loss": 1.0857, + "step": 15047 + }, + { + "epoch": 0.45, + "learning_rate": 2.996111048558339e-06, + "loss": 1.0541, + "step": 15048 + }, + { + "epoch": 0.45, + "learning_rate": 2.995871977196183e-06, + "loss": 1.1155, + "step": 15049 + }, + { + "epoch": 0.45, + "learning_rate": 2.9956329011135655e-06, + "loss": 0.9796, + "step": 15050 + }, + { + "epoch": 0.45, + "learning_rate": 2.995393820312761e-06, + "loss": 1.1225, + "step": 15051 + }, + { + "epoch": 0.45, + "learning_rate": 2.9951547347960463e-06, + "loss": 1.1925, + "step": 15052 + }, + { + "epoch": 0.45, + "learning_rate": 2.9949156445656968e-06, + "loss": 1.043, + "step": 15053 + }, + { + "epoch": 0.45, + "learning_rate": 2.9946765496239887e-06, + "loss": 1.1902, + "step": 15054 + }, + { + "epoch": 0.45, + "learning_rate": 2.994437449973199e-06, + "loss": 1.089, + "step": 15055 + }, + { + "epoch": 0.45, + "learning_rate": 2.9941983456156014e-06, + "loss": 1.1725, + "step": 15056 + }, + { + "epoch": 0.45, + "learning_rate": 2.993959236553474e-06, + "loss": 1.0436, + "step": 15057 + }, + { + "epoch": 0.45, + "learning_rate": 2.993720122789093e-06, + "loss": 1.159, + "step": 15058 + }, + { + "epoch": 0.45, + "learning_rate": 2.993481004324734e-06, + "loss": 1.193, + "step": 15059 + }, + { + "epoch": 0.45, + "learning_rate": 2.993241881162674e-06, + "loss": 1.125, + "step": 15060 + }, + { + "epoch": 0.45, + "learning_rate": 2.993002753305188e-06, + "loss": 1.0774, + "step": 15061 + }, + { + "epoch": 0.45, + "learning_rate": 2.9927636207545536e-06, + "loss": 1.2726, + "step": 15062 + }, + { + "epoch": 0.45, + "learning_rate": 2.9925244835130467e-06, + "loss": 1.124, + "step": 15063 + }, + { + "epoch": 0.45, + "learning_rate": 2.9922853415829444e-06, + "loss": 1.1584, + "step": 15064 + }, + { + "epoch": 0.45, + "learning_rate": 2.9920461949665217e-06, + "loss": 1.1003, + "step": 15065 + }, + { + "epoch": 0.45, + "learning_rate": 2.9918070436660573e-06, + "loss": 1.1501, + "step": 15066 + }, + { + "epoch": 0.45, + "learning_rate": 2.991567887683826e-06, + "loss": 1.0919, + "step": 15067 + }, + { + "epoch": 0.45, + "learning_rate": 2.9913287270221065e-06, + "loss": 1.2153, + "step": 15068 + }, + { + "epoch": 0.45, + "learning_rate": 2.9910895616831725e-06, + "loss": 1.1077, + "step": 15069 + }, + { + "epoch": 0.45, + "learning_rate": 2.9908503916693027e-06, + "loss": 1.1951, + "step": 15070 + }, + { + "epoch": 0.45, + "learning_rate": 2.9906112169827745e-06, + "loss": 1.1134, + "step": 15071 + }, + { + "epoch": 0.45, + "learning_rate": 2.9903720376258628e-06, + "loss": 1.0903, + "step": 15072 + }, + { + "epoch": 0.45, + "learning_rate": 2.9901328536008462e-06, + "loss": 1.2823, + "step": 15073 + }, + { + "epoch": 0.45, + "learning_rate": 2.9898936649100004e-06, + "loss": 0.9698, + "step": 15074 + }, + { + "epoch": 0.45, + "learning_rate": 2.9896544715556037e-06, + "loss": 1.1346, + "step": 15075 + }, + { + "epoch": 0.45, + "learning_rate": 2.9894152735399314e-06, + "loss": 1.1124, + "step": 15076 + }, + { + "epoch": 0.45, + "learning_rate": 2.989176070865261e-06, + "loss": 1.1754, + "step": 15077 + }, + { + "epoch": 0.45, + "learning_rate": 2.9889368635338708e-06, + "loss": 1.1156, + "step": 15078 + }, + { + "epoch": 0.45, + "learning_rate": 2.988697651548037e-06, + "loss": 1.1059, + "step": 15079 + }, + { + "epoch": 0.45, + "learning_rate": 2.9884584349100366e-06, + "loss": 1.0761, + "step": 15080 + }, + { + "epoch": 0.45, + "learning_rate": 2.9882192136221476e-06, + "loss": 1.0821, + "step": 15081 + }, + { + "epoch": 0.45, + "learning_rate": 2.987979987686646e-06, + "loss": 1.1146, + "step": 15082 + }, + { + "epoch": 0.45, + "learning_rate": 2.9877407571058102e-06, + "loss": 1.0707, + "step": 15083 + }, + { + "epoch": 0.45, + "learning_rate": 2.987501521881918e-06, + "loss": 1.1908, + "step": 15084 + }, + { + "epoch": 0.45, + "learning_rate": 2.987262282017246e-06, + "loss": 1.1755, + "step": 15085 + }, + { + "epoch": 0.45, + "learning_rate": 2.987023037514072e-06, + "loss": 1.2018, + "step": 15086 + }, + { + "epoch": 0.45, + "learning_rate": 2.986783788374672e-06, + "loss": 1.1385, + "step": 15087 + }, + { + "epoch": 0.45, + "learning_rate": 2.986544534601326e-06, + "loss": 1.0776, + "step": 15088 + }, + { + "epoch": 0.45, + "learning_rate": 2.98630527619631e-06, + "loss": 1.1719, + "step": 15089 + }, + { + "epoch": 0.45, + "learning_rate": 2.9860660131619014e-06, + "loss": 1.2012, + "step": 15090 + }, + { + "epoch": 0.45, + "learning_rate": 2.9858267455003786e-06, + "loss": 1.1574, + "step": 15091 + }, + { + "epoch": 0.45, + "learning_rate": 2.98558747321402e-06, + "loss": 1.2179, + "step": 15092 + }, + { + "epoch": 0.45, + "learning_rate": 2.9853481963051016e-06, + "loss": 1.0339, + "step": 15093 + }, + { + "epoch": 0.45, + "learning_rate": 2.985108914775903e-06, + "loss": 1.2458, + "step": 15094 + }, + { + "epoch": 0.45, + "learning_rate": 2.9848696286287004e-06, + "loss": 1.0337, + "step": 15095 + }, + { + "epoch": 0.45, + "learning_rate": 2.9846303378657727e-06, + "loss": 1.1053, + "step": 15096 + }, + { + "epoch": 0.45, + "learning_rate": 2.984391042489398e-06, + "loss": 1.15, + "step": 15097 + }, + { + "epoch": 0.45, + "learning_rate": 2.984151742501853e-06, + "loss": 1.2087, + "step": 15098 + }, + { + "epoch": 0.45, + "learning_rate": 2.9839124379054173e-06, + "loss": 1.0482, + "step": 15099 + }, + { + "epoch": 0.45, + "learning_rate": 2.983673128702368e-06, + "loss": 1.1539, + "step": 15100 + }, + { + "epoch": 0.45, + "learning_rate": 2.9834338148949836e-06, + "loss": 1.095, + "step": 15101 + }, + { + "epoch": 0.45, + "learning_rate": 2.9831944964855418e-06, + "loss": 1.1113, + "step": 15102 + }, + { + "epoch": 0.45, + "learning_rate": 2.9829551734763213e-06, + "loss": 1.1276, + "step": 15103 + }, + { + "epoch": 0.46, + "learning_rate": 2.9827158458696005e-06, + "loss": 1.1945, + "step": 15104 + }, + { + "epoch": 0.46, + "learning_rate": 2.9824765136676564e-06, + "loss": 1.2107, + "step": 15105 + }, + { + "epoch": 0.46, + "learning_rate": 2.9822371768727685e-06, + "loss": 1.076, + "step": 15106 + }, + { + "epoch": 0.46, + "learning_rate": 2.9819978354872158e-06, + "loss": 1.1466, + "step": 15107 + }, + { + "epoch": 0.46, + "learning_rate": 2.981758489513275e-06, + "loss": 1.1135, + "step": 15108 + }, + { + "epoch": 0.46, + "learning_rate": 2.9815191389532254e-06, + "loss": 1.1085, + "step": 15109 + }, + { + "epoch": 0.46, + "learning_rate": 2.9812797838093465e-06, + "loss": 1.1205, + "step": 15110 + }, + { + "epoch": 0.46, + "learning_rate": 2.981040424083915e-06, + "loss": 1.1611, + "step": 15111 + }, + { + "epoch": 0.46, + "learning_rate": 2.980801059779211e-06, + "loss": 1.1002, + "step": 15112 + }, + { + "epoch": 0.46, + "learning_rate": 2.9805616908975115e-06, + "loss": 1.1718, + "step": 15113 + }, + { + "epoch": 0.46, + "learning_rate": 2.980322317441097e-06, + "loss": 1.1441, + "step": 15114 + }, + { + "epoch": 0.46, + "learning_rate": 2.980082939412245e-06, + "loss": 1.1285, + "step": 15115 + }, + { + "epoch": 0.46, + "learning_rate": 2.979843556813235e-06, + "loss": 1.1803, + "step": 15116 + }, + { + "epoch": 0.46, + "learning_rate": 2.9796041696463446e-06, + "loss": 1.1855, + "step": 15117 + }, + { + "epoch": 0.46, + "learning_rate": 2.979364777913854e-06, + "loss": 1.1343, + "step": 15118 + }, + { + "epoch": 0.46, + "learning_rate": 2.979125381618041e-06, + "loss": 1.1429, + "step": 15119 + }, + { + "epoch": 0.46, + "learning_rate": 2.9788859807611865e-06, + "loss": 1.184, + "step": 15120 + }, + { + "epoch": 0.46, + "learning_rate": 2.978646575345567e-06, + "loss": 1.1431, + "step": 15121 + }, + { + "epoch": 0.46, + "learning_rate": 2.978407165373463e-06, + "loss": 1.1469, + "step": 15122 + }, + { + "epoch": 0.46, + "learning_rate": 2.978167750847153e-06, + "loss": 1.1286, + "step": 15123 + }, + { + "epoch": 0.46, + "learning_rate": 2.977928331768916e-06, + "loss": 1.0958, + "step": 15124 + }, + { + "epoch": 0.46, + "learning_rate": 2.977688908141032e-06, + "loss": 1.2067, + "step": 15125 + }, + { + "epoch": 0.46, + "learning_rate": 2.9774494799657794e-06, + "loss": 1.1445, + "step": 15126 + }, + { + "epoch": 0.46, + "learning_rate": 2.9772100472454386e-06, + "loss": 1.1758, + "step": 15127 + }, + { + "epoch": 0.46, + "learning_rate": 2.9769706099822864e-06, + "loss": 1.1334, + "step": 15128 + }, + { + "epoch": 0.46, + "learning_rate": 2.9767311681786047e-06, + "loss": 1.0557, + "step": 15129 + }, + { + "epoch": 0.46, + "learning_rate": 2.9764917218366718e-06, + "loss": 1.0811, + "step": 15130 + }, + { + "epoch": 0.46, + "learning_rate": 2.9762522709587672e-06, + "loss": 1.1133, + "step": 15131 + }, + { + "epoch": 0.46, + "learning_rate": 2.9760128155471697e-06, + "loss": 1.1093, + "step": 15132 + }, + { + "epoch": 0.46, + "learning_rate": 2.97577335560416e-06, + "loss": 1.1517, + "step": 15133 + }, + { + "epoch": 0.46, + "learning_rate": 2.9755338911320177e-06, + "loss": 1.1297, + "step": 15134 + }, + { + "epoch": 0.46, + "learning_rate": 2.975294422133021e-06, + "loss": 1.176, + "step": 15135 + }, + { + "epoch": 0.46, + "learning_rate": 2.9750549486094505e-06, + "loss": 1.1808, + "step": 15136 + }, + { + "epoch": 0.46, + "learning_rate": 2.974815470563585e-06, + "loss": 1.1867, + "step": 15137 + }, + { + "epoch": 0.46, + "learning_rate": 2.974575987997706e-06, + "loss": 1.0501, + "step": 15138 + }, + { + "epoch": 0.46, + "learning_rate": 2.9743365009140916e-06, + "loss": 1.0901, + "step": 15139 + }, + { + "epoch": 0.46, + "learning_rate": 2.974097009315023e-06, + "loss": 1.2015, + "step": 15140 + }, + { + "epoch": 0.46, + "learning_rate": 2.973857513202778e-06, + "loss": 1.1932, + "step": 15141 + }, + { + "epoch": 0.46, + "learning_rate": 2.973618012579639e-06, + "loss": 1.101, + "step": 15142 + }, + { + "epoch": 0.46, + "learning_rate": 2.9733785074478833e-06, + "loss": 1.1694, + "step": 15143 + }, + { + "epoch": 0.46, + "learning_rate": 2.9731389978097926e-06, + "loss": 1.1808, + "step": 15144 + }, + { + "epoch": 0.46, + "learning_rate": 2.9728994836676465e-06, + "loss": 1.0845, + "step": 15145 + }, + { + "epoch": 0.46, + "learning_rate": 2.9726599650237253e-06, + "loss": 1.1412, + "step": 15146 + }, + { + "epoch": 0.46, + "learning_rate": 2.9724204418803083e-06, + "loss": 1.1999, + "step": 15147 + }, + { + "epoch": 0.46, + "learning_rate": 2.972180914239677e-06, + "loss": 1.0638, + "step": 15148 + }, + { + "epoch": 0.46, + "learning_rate": 2.9719413821041104e-06, + "loss": 1.0128, + "step": 15149 + }, + { + "epoch": 0.46, + "learning_rate": 2.971701845475889e-06, + "loss": 1.1255, + "step": 15150 + }, + { + "epoch": 0.46, + "learning_rate": 2.9714623043572936e-06, + "loss": 1.1763, + "step": 15151 + }, + { + "epoch": 0.46, + "learning_rate": 2.9712227587506035e-06, + "loss": 1.0789, + "step": 15152 + }, + { + "epoch": 0.46, + "learning_rate": 2.970983208658101e-06, + "loss": 1.1083, + "step": 15153 + }, + { + "epoch": 0.46, + "learning_rate": 2.970743654082064e-06, + "loss": 1.1255, + "step": 15154 + }, + { + "epoch": 0.46, + "learning_rate": 2.9705040950247743e-06, + "loss": 1.0857, + "step": 15155 + }, + { + "epoch": 0.46, + "learning_rate": 2.9702645314885126e-06, + "loss": 1.0412, + "step": 15156 + }, + { + "epoch": 0.46, + "learning_rate": 2.970024963475559e-06, + "loss": 1.2633, + "step": 15157 + }, + { + "epoch": 0.46, + "learning_rate": 2.9697853909881936e-06, + "loss": 1.1854, + "step": 15158 + }, + { + "epoch": 0.46, + "learning_rate": 2.9695458140286975e-06, + "loss": 1.2025, + "step": 15159 + }, + { + "epoch": 0.46, + "learning_rate": 2.9693062325993515e-06, + "loss": 1.0794, + "step": 15160 + }, + { + "epoch": 0.46, + "learning_rate": 2.9690666467024372e-06, + "loss": 1.1824, + "step": 15161 + }, + { + "epoch": 0.46, + "learning_rate": 2.9688270563402334e-06, + "loss": 1.1319, + "step": 15162 + }, + { + "epoch": 0.46, + "learning_rate": 2.968587461515022e-06, + "loss": 1.1635, + "step": 15163 + }, + { + "epoch": 0.46, + "learning_rate": 2.9683478622290832e-06, + "loss": 1.1707, + "step": 15164 + }, + { + "epoch": 0.46, + "learning_rate": 2.9681082584846986e-06, + "loss": 1.0994, + "step": 15165 + }, + { + "epoch": 0.46, + "learning_rate": 2.96786865028415e-06, + "loss": 1.0969, + "step": 15166 + }, + { + "epoch": 0.46, + "learning_rate": 2.9676290376297156e-06, + "loss": 1.1609, + "step": 15167 + }, + { + "epoch": 0.46, + "learning_rate": 2.9673894205236793e-06, + "loss": 1.1219, + "step": 15168 + }, + { + "epoch": 0.46, + "learning_rate": 2.9671497989683195e-06, + "loss": 1.0663, + "step": 15169 + }, + { + "epoch": 0.46, + "learning_rate": 2.9669101729659195e-06, + "loss": 1.1117, + "step": 15170 + }, + { + "epoch": 0.46, + "learning_rate": 2.9666705425187594e-06, + "loss": 0.9832, + "step": 15171 + }, + { + "epoch": 0.46, + "learning_rate": 2.96643090762912e-06, + "loss": 1.1426, + "step": 15172 + }, + { + "epoch": 0.46, + "learning_rate": 2.9661912682992827e-06, + "loss": 1.1407, + "step": 15173 + }, + { + "epoch": 0.46, + "learning_rate": 2.96595162453153e-06, + "loss": 1.3425, + "step": 15174 + }, + { + "epoch": 0.46, + "learning_rate": 2.9657119763281415e-06, + "loss": 1.2319, + "step": 15175 + }, + { + "epoch": 0.46, + "learning_rate": 2.9654723236913994e-06, + "loss": 1.1123, + "step": 15176 + }, + { + "epoch": 0.46, + "learning_rate": 2.9652326666235858e-06, + "loss": 1.0679, + "step": 15177 + }, + { + "epoch": 0.46, + "learning_rate": 2.9649930051269803e-06, + "loss": 1.081, + "step": 15178 + }, + { + "epoch": 0.46, + "learning_rate": 2.9647533392038662e-06, + "loss": 1.1108, + "step": 15179 + }, + { + "epoch": 0.46, + "learning_rate": 2.9645136688565233e-06, + "loss": 1.0342, + "step": 15180 + }, + { + "epoch": 0.46, + "learning_rate": 2.964273994087235e-06, + "loss": 1.1391, + "step": 15181 + }, + { + "epoch": 0.46, + "learning_rate": 2.964034314898281e-06, + "loss": 1.213, + "step": 15182 + }, + { + "epoch": 0.46, + "learning_rate": 2.9637946312919447e-06, + "loss": 1.1373, + "step": 15183 + }, + { + "epoch": 0.46, + "learning_rate": 2.963554943270506e-06, + "loss": 1.1082, + "step": 15184 + }, + { + "epoch": 0.46, + "learning_rate": 2.9633152508362474e-06, + "loss": 0.9963, + "step": 15185 + }, + { + "epoch": 0.46, + "learning_rate": 2.9630755539914514e-06, + "loss": 1.2848, + "step": 15186 + }, + { + "epoch": 0.46, + "learning_rate": 2.9628358527383983e-06, + "loss": 1.2893, + "step": 15187 + }, + { + "epoch": 0.46, + "learning_rate": 2.962596147079371e-06, + "loss": 1.063, + "step": 15188 + }, + { + "epoch": 0.46, + "learning_rate": 2.962356437016652e-06, + "loss": 1.1129, + "step": 15189 + }, + { + "epoch": 0.46, + "learning_rate": 2.962116722552522e-06, + "loss": 1.2816, + "step": 15190 + }, + { + "epoch": 0.46, + "learning_rate": 2.961877003689263e-06, + "loss": 1.0707, + "step": 15191 + }, + { + "epoch": 0.46, + "learning_rate": 2.9616372804291584e-06, + "loss": 1.1216, + "step": 15192 + }, + { + "epoch": 0.46, + "learning_rate": 2.9613975527744877e-06, + "loss": 1.2029, + "step": 15193 + }, + { + "epoch": 0.46, + "learning_rate": 2.961157820727536e-06, + "loss": 1.2109, + "step": 15194 + }, + { + "epoch": 0.46, + "learning_rate": 2.9609180842905825e-06, + "loss": 1.1562, + "step": 15195 + }, + { + "epoch": 0.46, + "learning_rate": 2.960678343465912e-06, + "loss": 1.1432, + "step": 15196 + }, + { + "epoch": 0.46, + "learning_rate": 2.960438598255805e-06, + "loss": 1.1078, + "step": 15197 + }, + { + "epoch": 0.46, + "learning_rate": 2.960198848662545e-06, + "loss": 1.0883, + "step": 15198 + }, + { + "epoch": 0.46, + "learning_rate": 2.9599590946884126e-06, + "loss": 1.1275, + "step": 15199 + }, + { + "epoch": 0.46, + "learning_rate": 2.9597193363356915e-06, + "loss": 1.0878, + "step": 15200 + }, + { + "epoch": 0.46, + "learning_rate": 2.9594795736066633e-06, + "loss": 1.1597, + "step": 15201 + }, + { + "epoch": 0.46, + "learning_rate": 2.959239806503611e-06, + "loss": 1.0562, + "step": 15202 + }, + { + "epoch": 0.46, + "learning_rate": 2.959000035028818e-06, + "loss": 1.0573, + "step": 15203 + }, + { + "epoch": 0.46, + "learning_rate": 2.958760259184564e-06, + "loss": 1.1648, + "step": 15204 + }, + { + "epoch": 0.46, + "learning_rate": 2.9585204789731346e-06, + "loss": 1.1426, + "step": 15205 + }, + { + "epoch": 0.46, + "learning_rate": 2.9582806943968106e-06, + "loss": 1.192, + "step": 15206 + }, + { + "epoch": 0.46, + "learning_rate": 2.958040905457876e-06, + "loss": 1.099, + "step": 15207 + }, + { + "epoch": 0.46, + "learning_rate": 2.9578011121586112e-06, + "loss": 1.1116, + "step": 15208 + }, + { + "epoch": 0.46, + "learning_rate": 2.9575613145013015e-06, + "loss": 1.1235, + "step": 15209 + }, + { + "epoch": 0.46, + "learning_rate": 2.957321512488228e-06, + "loss": 1.0884, + "step": 15210 + }, + { + "epoch": 0.46, + "learning_rate": 2.9570817061216737e-06, + "loss": 1.1775, + "step": 15211 + }, + { + "epoch": 0.46, + "learning_rate": 2.9568418954039215e-06, + "loss": 1.1732, + "step": 15212 + }, + { + "epoch": 0.46, + "learning_rate": 2.9566020803372548e-06, + "loss": 1.0865, + "step": 15213 + }, + { + "epoch": 0.46, + "learning_rate": 2.9563622609239555e-06, + "loss": 1.0753, + "step": 15214 + }, + { + "epoch": 0.46, + "learning_rate": 2.956122437166309e-06, + "loss": 1.2009, + "step": 15215 + }, + { + "epoch": 0.46, + "learning_rate": 2.955882609066595e-06, + "loss": 1.0508, + "step": 15216 + }, + { + "epoch": 0.46, + "learning_rate": 2.9556427766270986e-06, + "loss": 1.1472, + "step": 15217 + }, + { + "epoch": 0.46, + "learning_rate": 2.955402939850103e-06, + "loss": 1.1876, + "step": 15218 + }, + { + "epoch": 0.46, + "learning_rate": 2.9551630987378892e-06, + "loss": 1.1252, + "step": 15219 + }, + { + "epoch": 0.46, + "learning_rate": 2.9549232532927437e-06, + "loss": 1.2089, + "step": 15220 + }, + { + "epoch": 0.46, + "learning_rate": 2.954683403516947e-06, + "loss": 1.2148, + "step": 15221 + }, + { + "epoch": 0.46, + "learning_rate": 2.9544435494127832e-06, + "loss": 1.0824, + "step": 15222 + }, + { + "epoch": 0.46, + "learning_rate": 2.9542036909825363e-06, + "loss": 1.1884, + "step": 15223 + }, + { + "epoch": 0.46, + "learning_rate": 2.953963828228489e-06, + "loss": 1.1586, + "step": 15224 + }, + { + "epoch": 0.46, + "learning_rate": 2.953723961152924e-06, + "loss": 1.1826, + "step": 15225 + }, + { + "epoch": 0.46, + "learning_rate": 2.9534840897581254e-06, + "loss": 1.0975, + "step": 15226 + }, + { + "epoch": 0.46, + "learning_rate": 2.9532442140463768e-06, + "loss": 1.1537, + "step": 15227 + }, + { + "epoch": 0.46, + "learning_rate": 2.9530043340199622e-06, + "loss": 1.1786, + "step": 15228 + }, + { + "epoch": 0.46, + "learning_rate": 2.9527644496811636e-06, + "loss": 1.1565, + "step": 15229 + }, + { + "epoch": 0.46, + "learning_rate": 2.9525245610322658e-06, + "loss": 1.1931, + "step": 15230 + }, + { + "epoch": 0.46, + "learning_rate": 2.9522846680755523e-06, + "loss": 1.1738, + "step": 15231 + }, + { + "epoch": 0.46, + "learning_rate": 2.9520447708133065e-06, + "loss": 1.0709, + "step": 15232 + }, + { + "epoch": 0.46, + "learning_rate": 2.951804869247813e-06, + "loss": 1.0923, + "step": 15233 + }, + { + "epoch": 0.46, + "learning_rate": 2.9515649633813536e-06, + "loss": 1.1462, + "step": 15234 + }, + { + "epoch": 0.46, + "learning_rate": 2.9513250532162142e-06, + "loss": 1.1812, + "step": 15235 + }, + { + "epoch": 0.46, + "learning_rate": 2.951085138754677e-06, + "loss": 1.2095, + "step": 15236 + }, + { + "epoch": 0.46, + "learning_rate": 2.9508452199990267e-06, + "loss": 1.2043, + "step": 15237 + }, + { + "epoch": 0.46, + "learning_rate": 2.9506052969515466e-06, + "loss": 1.1269, + "step": 15238 + }, + { + "epoch": 0.46, + "learning_rate": 2.9503653696145218e-06, + "loss": 1.0814, + "step": 15239 + }, + { + "epoch": 0.46, + "learning_rate": 2.950125437990235e-06, + "loss": 1.1186, + "step": 15240 + }, + { + "epoch": 0.46, + "learning_rate": 2.949885502080971e-06, + "loss": 1.1948, + "step": 15241 + }, + { + "epoch": 0.46, + "learning_rate": 2.9496455618890137e-06, + "loss": 1.1764, + "step": 15242 + }, + { + "epoch": 0.46, + "learning_rate": 2.949405617416647e-06, + "loss": 1.1849, + "step": 15243 + }, + { + "epoch": 0.46, + "learning_rate": 2.949165668666156e-06, + "loss": 1.1064, + "step": 15244 + }, + { + "epoch": 0.46, + "learning_rate": 2.9489257156398233e-06, + "loss": 1.1958, + "step": 15245 + }, + { + "epoch": 0.46, + "learning_rate": 2.9486857583399347e-06, + "loss": 1.0884, + "step": 15246 + }, + { + "epoch": 0.46, + "learning_rate": 2.948445796768773e-06, + "loss": 1.1046, + "step": 15247 + }, + { + "epoch": 0.46, + "learning_rate": 2.9482058309286244e-06, + "loss": 1.2487, + "step": 15248 + }, + { + "epoch": 0.46, + "learning_rate": 2.947965860821771e-06, + "loss": 1.1517, + "step": 15249 + }, + { + "epoch": 0.46, + "learning_rate": 2.9477258864504994e-06, + "loss": 1.0751, + "step": 15250 + }, + { + "epoch": 0.46, + "learning_rate": 2.947485907817092e-06, + "loss": 1.1018, + "step": 15251 + }, + { + "epoch": 0.46, + "learning_rate": 2.947245924923835e-06, + "loss": 1.0518, + "step": 15252 + }, + { + "epoch": 0.46, + "learning_rate": 2.947005937773012e-06, + "loss": 1.1943, + "step": 15253 + }, + { + "epoch": 0.46, + "learning_rate": 2.9467659463669074e-06, + "loss": 1.1164, + "step": 15254 + }, + { + "epoch": 0.46, + "learning_rate": 2.9465259507078057e-06, + "loss": 1.0811, + "step": 15255 + }, + { + "epoch": 0.46, + "learning_rate": 2.946285950797993e-06, + "loss": 1.0693, + "step": 15256 + }, + { + "epoch": 0.46, + "learning_rate": 2.946045946639753e-06, + "loss": 1.0799, + "step": 15257 + }, + { + "epoch": 0.46, + "learning_rate": 2.9458059382353697e-06, + "loss": 1.0778, + "step": 15258 + }, + { + "epoch": 0.46, + "learning_rate": 2.9455659255871295e-06, + "loss": 1.0701, + "step": 15259 + }, + { + "epoch": 0.46, + "learning_rate": 2.9453259086973156e-06, + "loss": 1.1718, + "step": 15260 + }, + { + "epoch": 0.46, + "learning_rate": 2.9450858875682144e-06, + "loss": 1.2208, + "step": 15261 + }, + { + "epoch": 0.46, + "learning_rate": 2.9448458622021087e-06, + "loss": 1.2162, + "step": 15262 + }, + { + "epoch": 0.46, + "learning_rate": 2.9446058326012855e-06, + "loss": 1.204, + "step": 15263 + }, + { + "epoch": 0.46, + "learning_rate": 2.9443657987680284e-06, + "loss": 1.0222, + "step": 15264 + }, + { + "epoch": 0.46, + "learning_rate": 2.9441257607046236e-06, + "loss": 1.1031, + "step": 15265 + }, + { + "epoch": 0.46, + "learning_rate": 2.9438857184133546e-06, + "loss": 1.0738, + "step": 15266 + }, + { + "epoch": 0.46, + "learning_rate": 2.943645671896508e-06, + "loss": 1.2951, + "step": 15267 + }, + { + "epoch": 0.46, + "learning_rate": 2.9434056211563674e-06, + "loss": 1.1537, + "step": 15268 + }, + { + "epoch": 0.46, + "learning_rate": 2.9431655661952198e-06, + "loss": 0.9945, + "step": 15269 + }, + { + "epoch": 0.46, + "learning_rate": 2.9429255070153484e-06, + "loss": 1.0731, + "step": 15270 + }, + { + "epoch": 0.46, + "learning_rate": 2.94268544361904e-06, + "loss": 1.1155, + "step": 15271 + }, + { + "epoch": 0.46, + "learning_rate": 2.9424453760085803e-06, + "loss": 1.087, + "step": 15272 + }, + { + "epoch": 0.46, + "learning_rate": 2.9422053041862525e-06, + "loss": 1.1404, + "step": 15273 + }, + { + "epoch": 0.46, + "learning_rate": 2.941965228154344e-06, + "loss": 1.2064, + "step": 15274 + }, + { + "epoch": 0.46, + "learning_rate": 2.9417251479151386e-06, + "loss": 1.2646, + "step": 15275 + }, + { + "epoch": 0.46, + "learning_rate": 2.9414850634709235e-06, + "loss": 1.1467, + "step": 15276 + }, + { + "epoch": 0.46, + "learning_rate": 2.9412449748239824e-06, + "loss": 1.0895, + "step": 15277 + }, + { + "epoch": 0.46, + "learning_rate": 2.9410048819766024e-06, + "loss": 1.0745, + "step": 15278 + }, + { + "epoch": 0.46, + "learning_rate": 2.940764784931067e-06, + "loss": 1.0398, + "step": 15279 + }, + { + "epoch": 0.46, + "learning_rate": 2.9405246836896643e-06, + "loss": 1.2407, + "step": 15280 + }, + { + "epoch": 0.46, + "learning_rate": 2.9402845782546785e-06, + "loss": 1.1907, + "step": 15281 + }, + { + "epoch": 0.46, + "learning_rate": 2.9400444686283953e-06, + "loss": 1.048, + "step": 15282 + }, + { + "epoch": 0.46, + "learning_rate": 2.9398043548131005e-06, + "loss": 1.0909, + "step": 15283 + }, + { + "epoch": 0.46, + "learning_rate": 2.9395642368110807e-06, + "loss": 1.1077, + "step": 15284 + }, + { + "epoch": 0.46, + "learning_rate": 2.939324114624621e-06, + "loss": 1.0922, + "step": 15285 + }, + { + "epoch": 0.46, + "learning_rate": 2.9390839882560067e-06, + "loss": 1.1678, + "step": 15286 + }, + { + "epoch": 0.46, + "learning_rate": 2.9388438577075252e-06, + "loss": 1.199, + "step": 15287 + }, + { + "epoch": 0.46, + "learning_rate": 2.9386037229814607e-06, + "loss": 1.1561, + "step": 15288 + }, + { + "epoch": 0.46, + "learning_rate": 2.9383635840801007e-06, + "loss": 1.1055, + "step": 15289 + }, + { + "epoch": 0.46, + "learning_rate": 2.93812344100573e-06, + "loss": 0.9777, + "step": 15290 + }, + { + "epoch": 0.46, + "learning_rate": 2.9378832937606357e-06, + "loss": 1.157, + "step": 15291 + }, + { + "epoch": 0.46, + "learning_rate": 2.9376431423471023e-06, + "loss": 1.2474, + "step": 15292 + }, + { + "epoch": 0.46, + "learning_rate": 2.9374029867674183e-06, + "loss": 1.2162, + "step": 15293 + }, + { + "epoch": 0.46, + "learning_rate": 2.9371628270238672e-06, + "loss": 1.1478, + "step": 15294 + }, + { + "epoch": 0.46, + "learning_rate": 2.936922663118737e-06, + "loss": 1.2199, + "step": 15295 + }, + { + "epoch": 0.46, + "learning_rate": 2.9366824950543138e-06, + "loss": 1.0107, + "step": 15296 + }, + { + "epoch": 0.46, + "learning_rate": 2.9364423228328832e-06, + "loss": 1.1539, + "step": 15297 + }, + { + "epoch": 0.46, + "learning_rate": 2.936202146456732e-06, + "loss": 1.1076, + "step": 15298 + }, + { + "epoch": 0.46, + "learning_rate": 2.9359619659281464e-06, + "loss": 1.1106, + "step": 15299 + }, + { + "epoch": 0.46, + "learning_rate": 2.9357217812494133e-06, + "loss": 1.073, + "step": 15300 + }, + { + "epoch": 0.46, + "learning_rate": 2.935481592422818e-06, + "loss": 1.1857, + "step": 15301 + }, + { + "epoch": 0.46, + "learning_rate": 2.9352413994506484e-06, + "loss": 1.1838, + "step": 15302 + }, + { + "epoch": 0.46, + "learning_rate": 2.9350012023351898e-06, + "loss": 1.0374, + "step": 15303 + }, + { + "epoch": 0.46, + "learning_rate": 2.9347610010787297e-06, + "loss": 1.0609, + "step": 15304 + }, + { + "epoch": 0.46, + "learning_rate": 2.9345207956835537e-06, + "loss": 1.0557, + "step": 15305 + }, + { + "epoch": 0.46, + "learning_rate": 2.9342805861519498e-06, + "loss": 1.2979, + "step": 15306 + }, + { + "epoch": 0.46, + "learning_rate": 2.9340403724862034e-06, + "loss": 1.1713, + "step": 15307 + }, + { + "epoch": 0.46, + "learning_rate": 2.9338001546886006e-06, + "loss": 1.1947, + "step": 15308 + }, + { + "epoch": 0.46, + "learning_rate": 2.9335599327614306e-06, + "loss": 1.1198, + "step": 15309 + }, + { + "epoch": 0.46, + "learning_rate": 2.9333197067069786e-06, + "loss": 1.1192, + "step": 15310 + }, + { + "epoch": 0.46, + "learning_rate": 2.9330794765275317e-06, + "loss": 1.1532, + "step": 15311 + }, + { + "epoch": 0.46, + "learning_rate": 2.932839242225376e-06, + "loss": 1.105, + "step": 15312 + }, + { + "epoch": 0.46, + "learning_rate": 2.9325990038028e-06, + "loss": 1.1465, + "step": 15313 + }, + { + "epoch": 0.46, + "learning_rate": 2.9323587612620897e-06, + "loss": 1.1036, + "step": 15314 + }, + { + "epoch": 0.46, + "learning_rate": 2.9321185146055327e-06, + "loss": 1.1508, + "step": 15315 + }, + { + "epoch": 0.46, + "learning_rate": 2.931878263835415e-06, + "loss": 1.2097, + "step": 15316 + }, + { + "epoch": 0.46, + "learning_rate": 2.931638008954024e-06, + "loss": 1.1707, + "step": 15317 + }, + { + "epoch": 0.46, + "learning_rate": 2.9313977499636476e-06, + "loss": 1.2238, + "step": 15318 + }, + { + "epoch": 0.46, + "learning_rate": 2.9311574868665724e-06, + "loss": 1.1213, + "step": 15319 + }, + { + "epoch": 0.46, + "learning_rate": 2.930917219665085e-06, + "loss": 1.0572, + "step": 15320 + }, + { + "epoch": 0.46, + "learning_rate": 2.930676948361474e-06, + "loss": 1.0863, + "step": 15321 + }, + { + "epoch": 0.46, + "learning_rate": 2.930436672958025e-06, + "loss": 1.1154, + "step": 15322 + }, + { + "epoch": 0.46, + "learning_rate": 2.9301963934570266e-06, + "loss": 1.129, + "step": 15323 + }, + { + "epoch": 0.46, + "learning_rate": 2.9299561098607653e-06, + "loss": 1.0925, + "step": 15324 + }, + { + "epoch": 0.46, + "learning_rate": 2.929715822171529e-06, + "loss": 1.1025, + "step": 15325 + }, + { + "epoch": 0.46, + "learning_rate": 2.9294755303916054e-06, + "loss": 1.1542, + "step": 15326 + }, + { + "epoch": 0.46, + "learning_rate": 2.9292352345232817e-06, + "loss": 1.01, + "step": 15327 + }, + { + "epoch": 0.46, + "learning_rate": 2.928994934568845e-06, + "loss": 1.1523, + "step": 15328 + }, + { + "epoch": 0.46, + "learning_rate": 2.928754630530583e-06, + "loss": 1.1139, + "step": 15329 + }, + { + "epoch": 0.46, + "learning_rate": 2.9285143224107844e-06, + "loss": 1.1403, + "step": 15330 + }, + { + "epoch": 0.46, + "learning_rate": 2.9282740102117345e-06, + "loss": 1.2197, + "step": 15331 + }, + { + "epoch": 0.46, + "learning_rate": 2.9280336939357235e-06, + "loss": 1.0397, + "step": 15332 + }, + { + "epoch": 0.46, + "learning_rate": 2.9277933735850365e-06, + "loss": 1.0361, + "step": 15333 + }, + { + "epoch": 0.46, + "learning_rate": 2.927553049161964e-06, + "loss": 1.0681, + "step": 15334 + }, + { + "epoch": 0.46, + "learning_rate": 2.9273127206687917e-06, + "loss": 1.0795, + "step": 15335 + }, + { + "epoch": 0.46, + "learning_rate": 2.927072388107808e-06, + "loss": 1.0115, + "step": 15336 + }, + { + "epoch": 0.46, + "learning_rate": 2.926832051481301e-06, + "loss": 1.16, + "step": 15337 + }, + { + "epoch": 0.46, + "learning_rate": 2.9265917107915576e-06, + "loss": 1.1026, + "step": 15338 + }, + { + "epoch": 0.46, + "learning_rate": 2.926351366040868e-06, + "loss": 1.1342, + "step": 15339 + }, + { + "epoch": 0.46, + "learning_rate": 2.9261110172315177e-06, + "loss": 1.0918, + "step": 15340 + }, + { + "epoch": 0.46, + "learning_rate": 2.925870664365797e-06, + "loss": 1.0782, + "step": 15341 + }, + { + "epoch": 0.46, + "learning_rate": 2.925630307445991e-06, + "loss": 1.087, + "step": 15342 + }, + { + "epoch": 0.46, + "learning_rate": 2.925389946474391e-06, + "loss": 1.1384, + "step": 15343 + }, + { + "epoch": 0.46, + "learning_rate": 2.925149581453283e-06, + "loss": 1.1616, + "step": 15344 + }, + { + "epoch": 0.46, + "learning_rate": 2.9249092123849554e-06, + "loss": 1.1396, + "step": 15345 + }, + { + "epoch": 0.46, + "learning_rate": 2.924668839271697e-06, + "loss": 1.0593, + "step": 15346 + }, + { + "epoch": 0.46, + "learning_rate": 2.9244284621157958e-06, + "loss": 1.1718, + "step": 15347 + }, + { + "epoch": 0.46, + "learning_rate": 2.92418808091954e-06, + "loss": 1.1968, + "step": 15348 + }, + { + "epoch": 0.46, + "learning_rate": 2.923947695685218e-06, + "loss": 1.1286, + "step": 15349 + }, + { + "epoch": 0.46, + "learning_rate": 2.923707306415118e-06, + "loss": 1.1546, + "step": 15350 + }, + { + "epoch": 0.46, + "learning_rate": 2.923466913111529e-06, + "loss": 1.1969, + "step": 15351 + }, + { + "epoch": 0.46, + "learning_rate": 2.923226515776738e-06, + "loss": 1.0616, + "step": 15352 + }, + { + "epoch": 0.46, + "learning_rate": 2.9229861144130345e-06, + "loss": 1.1492, + "step": 15353 + }, + { + "epoch": 0.46, + "learning_rate": 2.9227457090227078e-06, + "loss": 1.2054, + "step": 15354 + }, + { + "epoch": 0.46, + "learning_rate": 2.922505299608045e-06, + "loss": 1.1171, + "step": 15355 + }, + { + "epoch": 0.46, + "learning_rate": 2.922264886171336e-06, + "loss": 1.1785, + "step": 15356 + }, + { + "epoch": 0.46, + "learning_rate": 2.9220244687148674e-06, + "loss": 1.1501, + "step": 15357 + }, + { + "epoch": 0.46, + "learning_rate": 2.9217840472409304e-06, + "loss": 1.1006, + "step": 15358 + }, + { + "epoch": 0.46, + "learning_rate": 2.9215436217518113e-06, + "loss": 1.098, + "step": 15359 + }, + { + "epoch": 0.46, + "learning_rate": 2.921303192249801e-06, + "loss": 1.2128, + "step": 15360 + }, + { + "epoch": 0.46, + "learning_rate": 2.921062758737186e-06, + "loss": 1.191, + "step": 15361 + }, + { + "epoch": 0.46, + "learning_rate": 2.920822321216257e-06, + "loss": 1.1768, + "step": 15362 + }, + { + "epoch": 0.46, + "learning_rate": 2.920581879689302e-06, + "loss": 1.1646, + "step": 15363 + }, + { + "epoch": 0.46, + "learning_rate": 2.92034143415861e-06, + "loss": 1.1682, + "step": 15364 + }, + { + "epoch": 0.46, + "learning_rate": 2.9201009846264698e-06, + "loss": 1.1083, + "step": 15365 + }, + { + "epoch": 0.46, + "learning_rate": 2.919860531095171e-06, + "loss": 1.0498, + "step": 15366 + }, + { + "epoch": 0.46, + "learning_rate": 2.919620073567002e-06, + "loss": 1.0893, + "step": 15367 + }, + { + "epoch": 0.46, + "learning_rate": 2.919379612044252e-06, + "loss": 1.1752, + "step": 15368 + }, + { + "epoch": 0.46, + "learning_rate": 2.9191391465292106e-06, + "loss": 1.1844, + "step": 15369 + }, + { + "epoch": 0.46, + "learning_rate": 2.9188986770241657e-06, + "loss": 1.1494, + "step": 15370 + }, + { + "epoch": 0.46, + "learning_rate": 2.9186582035314075e-06, + "loss": 1.1038, + "step": 15371 + }, + { + "epoch": 0.46, + "learning_rate": 2.918417726053224e-06, + "loss": 1.1061, + "step": 15372 + }, + { + "epoch": 0.46, + "learning_rate": 2.9181772445919065e-06, + "loss": 1.1005, + "step": 15373 + }, + { + "epoch": 0.46, + "learning_rate": 2.917936759149743e-06, + "loss": 1.1454, + "step": 15374 + }, + { + "epoch": 0.46, + "learning_rate": 2.9176962697290217e-06, + "loss": 0.9883, + "step": 15375 + }, + { + "epoch": 0.46, + "learning_rate": 2.9174557763320336e-06, + "loss": 1.0516, + "step": 15376 + }, + { + "epoch": 0.46, + "learning_rate": 2.9172152789610677e-06, + "loss": 1.1109, + "step": 15377 + }, + { + "epoch": 0.46, + "learning_rate": 2.9169747776184133e-06, + "loss": 1.1054, + "step": 15378 + }, + { + "epoch": 0.46, + "learning_rate": 2.9167342723063597e-06, + "loss": 1.2042, + "step": 15379 + }, + { + "epoch": 0.46, + "learning_rate": 2.916493763027197e-06, + "loss": 1.1685, + "step": 15380 + }, + { + "epoch": 0.46, + "learning_rate": 2.916253249783213e-06, + "loss": 1.2239, + "step": 15381 + }, + { + "epoch": 0.46, + "learning_rate": 2.9160127325767e-06, + "loss": 1.2192, + "step": 15382 + }, + { + "epoch": 0.46, + "learning_rate": 2.915772211409945e-06, + "loss": 1.0214, + "step": 15383 + }, + { + "epoch": 0.46, + "learning_rate": 2.9155316862852403e-06, + "loss": 1.1834, + "step": 15384 + }, + { + "epoch": 0.46, + "learning_rate": 2.9152911572048726e-06, + "loss": 1.1339, + "step": 15385 + }, + { + "epoch": 0.46, + "learning_rate": 2.915050624171134e-06, + "loss": 1.2709, + "step": 15386 + }, + { + "epoch": 0.46, + "learning_rate": 2.914810087186313e-06, + "loss": 1.4092, + "step": 15387 + }, + { + "epoch": 0.46, + "learning_rate": 2.914569546252699e-06, + "loss": 1.0567, + "step": 15388 + }, + { + "epoch": 0.46, + "learning_rate": 2.914329001372584e-06, + "loss": 1.1176, + "step": 15389 + }, + { + "epoch": 0.46, + "learning_rate": 2.9140884525482554e-06, + "loss": 1.2012, + "step": 15390 + }, + { + "epoch": 0.46, + "learning_rate": 2.9138478997820043e-06, + "loss": 1.1285, + "step": 15391 + }, + { + "epoch": 0.46, + "learning_rate": 2.913607343076121e-06, + "loss": 1.0853, + "step": 15392 + }, + { + "epoch": 0.46, + "learning_rate": 2.9133667824328947e-06, + "loss": 1.1532, + "step": 15393 + }, + { + "epoch": 0.46, + "learning_rate": 2.9131262178546154e-06, + "loss": 1.1221, + "step": 15394 + }, + { + "epoch": 0.46, + "learning_rate": 2.9128856493435744e-06, + "loss": 1.1426, + "step": 15395 + }, + { + "epoch": 0.46, + "learning_rate": 2.91264507690206e-06, + "loss": 1.1436, + "step": 15396 + }, + { + "epoch": 0.46, + "learning_rate": 2.9124045005323637e-06, + "loss": 1.2122, + "step": 15397 + }, + { + "epoch": 0.46, + "learning_rate": 2.9121639202367748e-06, + "loss": 1.027, + "step": 15398 + }, + { + "epoch": 0.46, + "learning_rate": 2.911923336017584e-06, + "loss": 1.0868, + "step": 15399 + }, + { + "epoch": 0.46, + "learning_rate": 2.9116827478770816e-06, + "loss": 1.1002, + "step": 15400 + }, + { + "epoch": 0.46, + "learning_rate": 2.911442155817558e-06, + "loss": 1.1552, + "step": 15401 + }, + { + "epoch": 0.46, + "learning_rate": 2.9112015598413024e-06, + "loss": 1.1176, + "step": 15402 + }, + { + "epoch": 0.46, + "learning_rate": 2.910960959950606e-06, + "loss": 1.1057, + "step": 15403 + }, + { + "epoch": 0.46, + "learning_rate": 2.9107203561477603e-06, + "loss": 1.108, + "step": 15404 + }, + { + "epoch": 0.46, + "learning_rate": 2.910479748435054e-06, + "loss": 1.2258, + "step": 15405 + }, + { + "epoch": 0.46, + "learning_rate": 2.9102391368147777e-06, + "loss": 1.2386, + "step": 15406 + }, + { + "epoch": 0.46, + "learning_rate": 2.9099985212892225e-06, + "loss": 1.1736, + "step": 15407 + }, + { + "epoch": 0.46, + "learning_rate": 2.9097579018606792e-06, + "loss": 1.0826, + "step": 15408 + }, + { + "epoch": 0.46, + "learning_rate": 2.909517278531438e-06, + "loss": 1.1401, + "step": 15409 + }, + { + "epoch": 0.46, + "learning_rate": 2.90927665130379e-06, + "loss": 1.0833, + "step": 15410 + }, + { + "epoch": 0.46, + "learning_rate": 2.9090360201800244e-06, + "loss": 1.1562, + "step": 15411 + }, + { + "epoch": 0.46, + "learning_rate": 2.908795385162434e-06, + "loss": 1.2131, + "step": 15412 + }, + { + "epoch": 0.46, + "learning_rate": 2.9085547462533077e-06, + "loss": 0.9659, + "step": 15413 + }, + { + "epoch": 0.46, + "learning_rate": 2.9083141034549374e-06, + "loss": 1.0551, + "step": 15414 + }, + { + "epoch": 0.46, + "learning_rate": 2.908073456769613e-06, + "loss": 0.9518, + "step": 15415 + }, + { + "epoch": 0.46, + "learning_rate": 2.9078328061996255e-06, + "loss": 1.1272, + "step": 15416 + }, + { + "epoch": 0.46, + "learning_rate": 2.907592151747267e-06, + "loss": 1.0624, + "step": 15417 + }, + { + "epoch": 0.46, + "learning_rate": 2.9073514934148268e-06, + "loss": 1.1208, + "step": 15418 + }, + { + "epoch": 0.46, + "learning_rate": 2.907110831204597e-06, + "loss": 1.1256, + "step": 15419 + }, + { + "epoch": 0.46, + "learning_rate": 2.9068701651188673e-06, + "loss": 1.1167, + "step": 15420 + }, + { + "epoch": 0.46, + "learning_rate": 2.906629495159931e-06, + "loss": 1.1276, + "step": 15421 + }, + { + "epoch": 0.46, + "learning_rate": 2.9063888213300767e-06, + "loss": 1.205, + "step": 15422 + }, + { + "epoch": 0.46, + "learning_rate": 2.9061481436315976e-06, + "loss": 1.1494, + "step": 15423 + }, + { + "epoch": 0.46, + "learning_rate": 2.9059074620667828e-06, + "loss": 1.1948, + "step": 15424 + }, + { + "epoch": 0.46, + "learning_rate": 2.905666776637925e-06, + "loss": 1.1508, + "step": 15425 + }, + { + "epoch": 0.46, + "learning_rate": 2.9054260873473145e-06, + "loss": 1.1298, + "step": 15426 + }, + { + "epoch": 0.46, + "learning_rate": 2.905185394197243e-06, + "loss": 1.1162, + "step": 15427 + }, + { + "epoch": 0.46, + "learning_rate": 2.904944697190002e-06, + "loss": 1.1188, + "step": 15428 + }, + { + "epoch": 0.46, + "learning_rate": 2.904703996327882e-06, + "loss": 1.1188, + "step": 15429 + }, + { + "epoch": 0.46, + "learning_rate": 2.9044632916131754e-06, + "loss": 1.0731, + "step": 15430 + }, + { + "epoch": 0.46, + "learning_rate": 2.9042225830481724e-06, + "loss": 1.2458, + "step": 15431 + }, + { + "epoch": 0.46, + "learning_rate": 2.903981870635165e-06, + "loss": 1.2482, + "step": 15432 + }, + { + "epoch": 0.46, + "learning_rate": 2.903741154376446e-06, + "loss": 1.1992, + "step": 15433 + }, + { + "epoch": 0.46, + "learning_rate": 2.9035004342743043e-06, + "loss": 1.1049, + "step": 15434 + }, + { + "epoch": 0.46, + "learning_rate": 2.9032597103310336e-06, + "loss": 1.1496, + "step": 15435 + }, + { + "epoch": 0.47, + "learning_rate": 2.903018982548924e-06, + "loss": 1.1624, + "step": 15436 + }, + { + "epoch": 0.47, + "learning_rate": 2.9027782509302684e-06, + "loss": 1.1592, + "step": 15437 + }, + { + "epoch": 0.47, + "learning_rate": 2.9025375154773577e-06, + "loss": 1.1997, + "step": 15438 + }, + { + "epoch": 0.47, + "learning_rate": 2.9022967761924835e-06, + "loss": 1.0994, + "step": 15439 + }, + { + "epoch": 0.47, + "learning_rate": 2.9020560330779387e-06, + "loss": 1.0758, + "step": 15440 + }, + { + "epoch": 0.47, + "learning_rate": 2.901815286136013e-06, + "loss": 1.1151, + "step": 15441 + }, + { + "epoch": 0.47, + "learning_rate": 2.9015745353689993e-06, + "loss": 1.1336, + "step": 15442 + }, + { + "epoch": 0.47, + "learning_rate": 2.90133378077919e-06, + "loss": 1.1876, + "step": 15443 + }, + { + "epoch": 0.47, + "learning_rate": 2.901093022368876e-06, + "loss": 1.0344, + "step": 15444 + }, + { + "epoch": 0.47, + "learning_rate": 2.90085226014035e-06, + "loss": 1.2045, + "step": 15445 + }, + { + "epoch": 0.47, + "learning_rate": 2.900611494095903e-06, + "loss": 1.1277, + "step": 15446 + }, + { + "epoch": 0.47, + "learning_rate": 2.9003707242378277e-06, + "loss": 1.0372, + "step": 15447 + }, + { + "epoch": 0.47, + "learning_rate": 2.900129950568416e-06, + "loss": 1.1934, + "step": 15448 + }, + { + "epoch": 0.47, + "learning_rate": 2.8998891730899604e-06, + "loss": 1.0757, + "step": 15449 + }, + { + "epoch": 0.47, + "learning_rate": 2.8996483918047512e-06, + "loss": 1.0126, + "step": 15450 + }, + { + "epoch": 0.47, + "learning_rate": 2.8994076067150834e-06, + "loss": 1.1448, + "step": 15451 + }, + { + "epoch": 0.47, + "learning_rate": 2.899166817823246e-06, + "loss": 1.2203, + "step": 15452 + }, + { + "epoch": 0.47, + "learning_rate": 2.8989260251315342e-06, + "loss": 1.2487, + "step": 15453 + }, + { + "epoch": 0.47, + "learning_rate": 2.898685228642238e-06, + "loss": 1.1958, + "step": 15454 + }, + { + "epoch": 0.47, + "learning_rate": 2.89844442835765e-06, + "loss": 1.1293, + "step": 15455 + }, + { + "epoch": 0.47, + "learning_rate": 2.898203624280064e-06, + "loss": 1.1465, + "step": 15456 + }, + { + "epoch": 0.47, + "learning_rate": 2.89796281641177e-06, + "loss": 1.067, + "step": 15457 + }, + { + "epoch": 0.47, + "learning_rate": 2.8977220047550625e-06, + "loss": 1.0596, + "step": 15458 + }, + { + "epoch": 0.47, + "learning_rate": 2.897481189312233e-06, + "loss": 1.0548, + "step": 15459 + }, + { + "epoch": 0.47, + "learning_rate": 2.8972403700855733e-06, + "loss": 1.0717, + "step": 15460 + }, + { + "epoch": 0.47, + "learning_rate": 2.896999547077377e-06, + "loss": 1.1292, + "step": 15461 + }, + { + "epoch": 0.47, + "learning_rate": 2.8967587202899374e-06, + "loss": 1.2329, + "step": 15462 + }, + { + "epoch": 0.47, + "learning_rate": 2.896517889725544e-06, + "loss": 1.0721, + "step": 15463 + }, + { + "epoch": 0.47, + "learning_rate": 2.8962770553864927e-06, + "loss": 1.1569, + "step": 15464 + }, + { + "epoch": 0.47, + "learning_rate": 2.896036217275074e-06, + "loss": 1.1213, + "step": 15465 + }, + { + "epoch": 0.47, + "learning_rate": 2.895795375393582e-06, + "loss": 1.1948, + "step": 15466 + }, + { + "epoch": 0.47, + "learning_rate": 2.8955545297443077e-06, + "loss": 1.0972, + "step": 15467 + }, + { + "epoch": 0.47, + "learning_rate": 2.8953136803295446e-06, + "loss": 1.2265, + "step": 15468 + }, + { + "epoch": 0.47, + "learning_rate": 2.8950728271515865e-06, + "loss": 0.9622, + "step": 15469 + }, + { + "epoch": 0.47, + "learning_rate": 2.8948319702127246e-06, + "loss": 1.1498, + "step": 15470 + }, + { + "epoch": 0.47, + "learning_rate": 2.8945911095152536e-06, + "loss": 1.0801, + "step": 15471 + }, + { + "epoch": 0.47, + "learning_rate": 2.894350245061464e-06, + "loss": 1.0844, + "step": 15472 + }, + { + "epoch": 0.47, + "learning_rate": 2.894109376853651e-06, + "loss": 1.2139, + "step": 15473 + }, + { + "epoch": 0.47, + "learning_rate": 2.8938685048941056e-06, + "loss": 1.1483, + "step": 15474 + }, + { + "epoch": 0.47, + "learning_rate": 2.8936276291851227e-06, + "loss": 1.0436, + "step": 15475 + }, + { + "epoch": 0.47, + "learning_rate": 2.8933867497289936e-06, + "loss": 1.1721, + "step": 15476 + }, + { + "epoch": 0.47, + "learning_rate": 2.893145866528013e-06, + "loss": 1.0829, + "step": 15477 + }, + { + "epoch": 0.47, + "learning_rate": 2.892904979584472e-06, + "loss": 1.1601, + "step": 15478 + }, + { + "epoch": 0.47, + "learning_rate": 2.892664088900666e-06, + "loss": 1.134, + "step": 15479 + }, + { + "epoch": 0.47, + "learning_rate": 2.8924231944788863e-06, + "loss": 1.0319, + "step": 15480 + }, + { + "epoch": 0.47, + "learning_rate": 2.8921822963214263e-06, + "loss": 1.0905, + "step": 15481 + }, + { + "epoch": 0.47, + "learning_rate": 2.89194139443058e-06, + "loss": 1.1843, + "step": 15482 + }, + { + "epoch": 0.47, + "learning_rate": 2.891700488808641e-06, + "loss": 1.1782, + "step": 15483 + }, + { + "epoch": 0.47, + "learning_rate": 2.8914595794579016e-06, + "loss": 1.0302, + "step": 15484 + }, + { + "epoch": 0.47, + "learning_rate": 2.891218666380655e-06, + "loss": 1.1299, + "step": 15485 + }, + { + "epoch": 0.47, + "learning_rate": 2.8909777495791965e-06, + "loss": 1.151, + "step": 15486 + }, + { + "epoch": 0.47, + "learning_rate": 2.8907368290558167e-06, + "loss": 1.2505, + "step": 15487 + }, + { + "epoch": 0.47, + "learning_rate": 2.890495904812811e-06, + "loss": 1.1427, + "step": 15488 + }, + { + "epoch": 0.47, + "learning_rate": 2.8902549768524724e-06, + "loss": 1.1201, + "step": 15489 + }, + { + "epoch": 0.47, + "learning_rate": 2.8900140451770946e-06, + "loss": 1.0848, + "step": 15490 + }, + { + "epoch": 0.47, + "learning_rate": 2.88977310978897e-06, + "loss": 1.1512, + "step": 15491 + }, + { + "epoch": 0.47, + "learning_rate": 2.8895321706903946e-06, + "loss": 1.1475, + "step": 15492 + }, + { + "epoch": 0.47, + "learning_rate": 2.88929122788366e-06, + "loss": 1.0983, + "step": 15493 + }, + { + "epoch": 0.47, + "learning_rate": 2.88905028137106e-06, + "loss": 1.105, + "step": 15494 + }, + { + "epoch": 0.47, + "learning_rate": 2.8888093311548887e-06, + "loss": 1.1317, + "step": 15495 + }, + { + "epoch": 0.47, + "learning_rate": 2.88856837723744e-06, + "loss": 1.1132, + "step": 15496 + }, + { + "epoch": 0.47, + "learning_rate": 2.8883274196210077e-06, + "loss": 1.1471, + "step": 15497 + }, + { + "epoch": 0.47, + "learning_rate": 2.8880864583078848e-06, + "loss": 1.149, + "step": 15498 + }, + { + "epoch": 0.47, + "learning_rate": 2.8878454933003662e-06, + "loss": 1.1446, + "step": 15499 + }, + { + "epoch": 0.47, + "learning_rate": 2.8876045246007454e-06, + "loss": 1.0942, + "step": 15500 + }, + { + "epoch": 0.47, + "learning_rate": 2.8873635522113157e-06, + "loss": 1.0443, + "step": 15501 + }, + { + "epoch": 0.47, + "learning_rate": 2.887122576134372e-06, + "loss": 0.9877, + "step": 15502 + }, + { + "epoch": 0.47, + "learning_rate": 2.8868815963722074e-06, + "loss": 1.2141, + "step": 15503 + }, + { + "epoch": 0.47, + "learning_rate": 2.886640612927117e-06, + "loss": 1.1041, + "step": 15504 + }, + { + "epoch": 0.47, + "learning_rate": 2.8863996258013938e-06, + "loss": 1.1407, + "step": 15505 + }, + { + "epoch": 0.47, + "learning_rate": 2.886158634997332e-06, + "loss": 1.2051, + "step": 15506 + }, + { + "epoch": 0.47, + "learning_rate": 2.885917640517226e-06, + "loss": 1.0466, + "step": 15507 + }, + { + "epoch": 0.47, + "learning_rate": 2.8856766423633703e-06, + "loss": 1.1061, + "step": 15508 + }, + { + "epoch": 0.47, + "learning_rate": 2.8854356405380587e-06, + "loss": 1.2193, + "step": 15509 + }, + { + "epoch": 0.47, + "learning_rate": 2.8851946350435854e-06, + "loss": 1.09, + "step": 15510 + }, + { + "epoch": 0.47, + "learning_rate": 2.8849536258822442e-06, + "loss": 1.1592, + "step": 15511 + }, + { + "epoch": 0.47, + "learning_rate": 2.8847126130563307e-06, + "loss": 1.1537, + "step": 15512 + }, + { + "epoch": 0.47, + "learning_rate": 2.884471596568138e-06, + "loss": 1.0901, + "step": 15513 + }, + { + "epoch": 0.47, + "learning_rate": 2.88423057641996e-06, + "loss": 1.0948, + "step": 15514 + }, + { + "epoch": 0.47, + "learning_rate": 2.8839895526140926e-06, + "loss": 1.1092, + "step": 15515 + }, + { + "epoch": 0.47, + "learning_rate": 2.8837485251528303e-06, + "loss": 1.1887, + "step": 15516 + }, + { + "epoch": 0.47, + "learning_rate": 2.883507494038466e-06, + "loss": 1.0682, + "step": 15517 + }, + { + "epoch": 0.47, + "learning_rate": 2.883266459273296e-06, + "loss": 1.1047, + "step": 15518 + }, + { + "epoch": 0.47, + "learning_rate": 2.883025420859613e-06, + "loss": 1.1804, + "step": 15519 + }, + { + "epoch": 0.47, + "learning_rate": 2.8827843787997135e-06, + "loss": 1.1248, + "step": 15520 + }, + { + "epoch": 0.47, + "learning_rate": 2.8825433330958895e-06, + "loss": 1.1284, + "step": 15521 + }, + { + "epoch": 0.47, + "learning_rate": 2.8823022837504384e-06, + "loss": 1.0198, + "step": 15522 + }, + { + "epoch": 0.47, + "learning_rate": 2.882061230765653e-06, + "loss": 1.219, + "step": 15523 + }, + { + "epoch": 0.47, + "learning_rate": 2.881820174143829e-06, + "loss": 1.223, + "step": 15524 + }, + { + "epoch": 0.47, + "learning_rate": 2.881579113887261e-06, + "loss": 1.2468, + "step": 15525 + }, + { + "epoch": 0.47, + "learning_rate": 2.8813380499982437e-06, + "loss": 1.0466, + "step": 15526 + }, + { + "epoch": 0.47, + "learning_rate": 2.8810969824790718e-06, + "loss": 1.1426, + "step": 15527 + }, + { + "epoch": 0.47, + "learning_rate": 2.88085591133204e-06, + "loss": 1.1066, + "step": 15528 + }, + { + "epoch": 0.47, + "learning_rate": 2.880614836559443e-06, + "loss": 1.1606, + "step": 15529 + }, + { + "epoch": 0.47, + "learning_rate": 2.880373758163576e-06, + "loss": 1.1298, + "step": 15530 + }, + { + "epoch": 0.47, + "learning_rate": 2.8801326761467346e-06, + "loss": 1.0627, + "step": 15531 + }, + { + "epoch": 0.47, + "learning_rate": 2.879891590511213e-06, + "loss": 1.093, + "step": 15532 + }, + { + "epoch": 0.47, + "learning_rate": 2.879650501259307e-06, + "loss": 1.1445, + "step": 15533 + }, + { + "epoch": 0.47, + "learning_rate": 2.87940940839331e-06, + "loss": 1.0542, + "step": 15534 + }, + { + "epoch": 0.47, + "learning_rate": 2.8791683119155183e-06, + "loss": 1.082, + "step": 15535 + }, + { + "epoch": 0.47, + "learning_rate": 2.8789272118282273e-06, + "loss": 1.1683, + "step": 15536 + }, + { + "epoch": 0.47, + "learning_rate": 2.8786861081337313e-06, + "loss": 1.2582, + "step": 15537 + }, + { + "epoch": 0.47, + "learning_rate": 2.8784450008343266e-06, + "loss": 1.0462, + "step": 15538 + }, + { + "epoch": 0.47, + "learning_rate": 2.878203889932308e-06, + "loss": 1.1447, + "step": 15539 + }, + { + "epoch": 0.47, + "learning_rate": 2.87796277542997e-06, + "loss": 1.0589, + "step": 15540 + }, + { + "epoch": 0.47, + "learning_rate": 2.877721657329608e-06, + "loss": 1.0918, + "step": 15541 + }, + { + "epoch": 0.47, + "learning_rate": 2.8774805356335177e-06, + "loss": 1.2114, + "step": 15542 + }, + { + "epoch": 0.47, + "learning_rate": 2.877239410343995e-06, + "loss": 1.081, + "step": 15543 + }, + { + "epoch": 0.47, + "learning_rate": 2.8769982814633352e-06, + "loss": 1.0557, + "step": 15544 + }, + { + "epoch": 0.47, + "learning_rate": 2.8767571489938324e-06, + "loss": 1.1317, + "step": 15545 + }, + { + "epoch": 0.47, + "learning_rate": 2.876516012937784e-06, + "loss": 1.1727, + "step": 15546 + }, + { + "epoch": 0.47, + "learning_rate": 2.8762748732974836e-06, + "loss": 1.0241, + "step": 15547 + }, + { + "epoch": 0.47, + "learning_rate": 2.8760337300752278e-06, + "loss": 1.1697, + "step": 15548 + }, + { + "epoch": 0.47, + "learning_rate": 2.8757925832733125e-06, + "loss": 1.2377, + "step": 15549 + }, + { + "epoch": 0.47, + "learning_rate": 2.875551432894032e-06, + "loss": 1.2383, + "step": 15550 + }, + { + "epoch": 0.47, + "learning_rate": 2.8753102789396836e-06, + "loss": 1.0278, + "step": 15551 + }, + { + "epoch": 0.47, + "learning_rate": 2.8750691214125613e-06, + "loss": 1.1058, + "step": 15552 + }, + { + "epoch": 0.47, + "learning_rate": 2.8748279603149626e-06, + "loss": 1.0067, + "step": 15553 + }, + { + "epoch": 0.47, + "learning_rate": 2.8745867956491813e-06, + "loss": 1.1114, + "step": 15554 + }, + { + "epoch": 0.47, + "learning_rate": 2.874345627417514e-06, + "loss": 1.1281, + "step": 15555 + }, + { + "epoch": 0.47, + "learning_rate": 2.874104455622257e-06, + "loss": 1.0629, + "step": 15556 + }, + { + "epoch": 0.47, + "learning_rate": 2.873863280265706e-06, + "loss": 1.1688, + "step": 15557 + }, + { + "epoch": 0.47, + "learning_rate": 2.8736221013501566e-06, + "loss": 1.1263, + "step": 15558 + }, + { + "epoch": 0.47, + "learning_rate": 2.873380918877905e-06, + "loss": 1.2072, + "step": 15559 + }, + { + "epoch": 0.47, + "learning_rate": 2.8731397328512463e-06, + "loss": 1.2432, + "step": 15560 + }, + { + "epoch": 0.47, + "learning_rate": 2.8728985432724765e-06, + "loss": 1.1444, + "step": 15561 + }, + { + "epoch": 0.47, + "learning_rate": 2.8726573501438937e-06, + "loss": 1.2194, + "step": 15562 + }, + { + "epoch": 0.47, + "learning_rate": 2.872416153467791e-06, + "loss": 1.0408, + "step": 15563 + }, + { + "epoch": 0.47, + "learning_rate": 2.872174953246467e-06, + "loss": 1.247, + "step": 15564 + }, + { + "epoch": 0.47, + "learning_rate": 2.8719337494822158e-06, + "loss": 1.0413, + "step": 15565 + }, + { + "epoch": 0.47, + "learning_rate": 2.871692542177335e-06, + "loss": 1.2166, + "step": 15566 + }, + { + "epoch": 0.47, + "learning_rate": 2.8714513313341203e-06, + "loss": 1.0969, + "step": 15567 + }, + { + "epoch": 0.47, + "learning_rate": 2.871210116954868e-06, + "loss": 1.2177, + "step": 15568 + }, + { + "epoch": 0.47, + "learning_rate": 2.870968899041873e-06, + "loss": 1.1101, + "step": 15569 + }, + { + "epoch": 0.47, + "learning_rate": 2.8707276775974337e-06, + "loss": 1.0975, + "step": 15570 + }, + { + "epoch": 0.47, + "learning_rate": 2.8704864526238447e-06, + "loss": 1.1304, + "step": 15571 + }, + { + "epoch": 0.47, + "learning_rate": 2.8702452241234036e-06, + "loss": 1.1483, + "step": 15572 + }, + { + "epoch": 0.47, + "learning_rate": 2.8700039920984063e-06, + "loss": 1.105, + "step": 15573 + }, + { + "epoch": 0.47, + "learning_rate": 2.8697627565511487e-06, + "loss": 1.1235, + "step": 15574 + }, + { + "epoch": 0.47, + "learning_rate": 2.869521517483929e-06, + "loss": 1.2334, + "step": 15575 + }, + { + "epoch": 0.47, + "learning_rate": 2.869280274899041e-06, + "loss": 1.0373, + "step": 15576 + }, + { + "epoch": 0.47, + "learning_rate": 2.8690390287987835e-06, + "loss": 1.1134, + "step": 15577 + }, + { + "epoch": 0.47, + "learning_rate": 2.868797779185452e-06, + "loss": 1.0865, + "step": 15578 + }, + { + "epoch": 0.47, + "learning_rate": 2.8685565260613434e-06, + "loss": 1.1311, + "step": 15579 + }, + { + "epoch": 0.47, + "learning_rate": 2.868315269428754e-06, + "loss": 1.0549, + "step": 15580 + }, + { + "epoch": 0.47, + "learning_rate": 2.8680740092899806e-06, + "loss": 1.2762, + "step": 15581 + }, + { + "epoch": 0.47, + "learning_rate": 2.86783274564732e-06, + "loss": 1.1279, + "step": 15582 + }, + { + "epoch": 0.47, + "learning_rate": 2.867591478503068e-06, + "loss": 0.9926, + "step": 15583 + }, + { + "epoch": 0.47, + "learning_rate": 2.8673502078595235e-06, + "loss": 1.0461, + "step": 15584 + }, + { + "epoch": 0.47, + "learning_rate": 2.867108933718981e-06, + "loss": 1.1714, + "step": 15585 + }, + { + "epoch": 0.47, + "learning_rate": 2.866867656083739e-06, + "loss": 1.0934, + "step": 15586 + }, + { + "epoch": 0.47, + "learning_rate": 2.866626374956093e-06, + "loss": 1.2943, + "step": 15587 + }, + { + "epoch": 0.47, + "learning_rate": 2.8663850903383407e-06, + "loss": 1.0835, + "step": 15588 + }, + { + "epoch": 0.47, + "learning_rate": 2.8661438022327785e-06, + "loss": 1.1624, + "step": 15589 + }, + { + "epoch": 0.47, + "learning_rate": 2.8659025106417045e-06, + "loss": 0.9821, + "step": 15590 + }, + { + "epoch": 0.47, + "learning_rate": 2.865661215567414e-06, + "loss": 1.0766, + "step": 15591 + }, + { + "epoch": 0.47, + "learning_rate": 2.8654199170122056e-06, + "loss": 1.0657, + "step": 15592 + }, + { + "epoch": 0.47, + "learning_rate": 2.8651786149783746e-06, + "loss": 1.1094, + "step": 15593 + }, + { + "epoch": 0.47, + "learning_rate": 2.86493730946822e-06, + "loss": 1.0826, + "step": 15594 + }, + { + "epoch": 0.47, + "learning_rate": 2.8646960004840367e-06, + "loss": 1.1003, + "step": 15595 + }, + { + "epoch": 0.47, + "learning_rate": 2.8644546880281243e-06, + "loss": 1.0663, + "step": 15596 + }, + { + "epoch": 0.47, + "learning_rate": 2.864213372102778e-06, + "loss": 0.964, + "step": 15597 + }, + { + "epoch": 0.47, + "learning_rate": 2.8639720527102967e-06, + "loss": 1.2181, + "step": 15598 + }, + { + "epoch": 0.47, + "learning_rate": 2.863730729852976e-06, + "loss": 1.1063, + "step": 15599 + }, + { + "epoch": 0.47, + "learning_rate": 2.8634894035331145e-06, + "loss": 1.2817, + "step": 15600 + }, + { + "epoch": 0.47, + "learning_rate": 2.8632480737530082e-06, + "loss": 1.1011, + "step": 15601 + }, + { + "epoch": 0.47, + "learning_rate": 2.863006740514955e-06, + "loss": 1.1407, + "step": 15602 + }, + { + "epoch": 0.47, + "learning_rate": 2.862765403821254e-06, + "loss": 1.1599, + "step": 15603 + }, + { + "epoch": 0.47, + "learning_rate": 2.8625240636742004e-06, + "loss": 1.0958, + "step": 15604 + }, + { + "epoch": 0.47, + "learning_rate": 2.8622827200760916e-06, + "loss": 1.1354, + "step": 15605 + }, + { + "epoch": 0.47, + "learning_rate": 2.8620413730292264e-06, + "loss": 1.2686, + "step": 15606 + }, + { + "epoch": 0.47, + "learning_rate": 2.8618000225359022e-06, + "loss": 1.1317, + "step": 15607 + }, + { + "epoch": 0.47, + "learning_rate": 2.8615586685984146e-06, + "loss": 1.2047, + "step": 15608 + }, + { + "epoch": 0.47, + "learning_rate": 2.861317311219064e-06, + "loss": 1.0989, + "step": 15609 + }, + { + "epoch": 0.47, + "learning_rate": 2.861075950400146e-06, + "loss": 1.1967, + "step": 15610 + }, + { + "epoch": 0.47, + "learning_rate": 2.8608345861439584e-06, + "loss": 1.1412, + "step": 15611 + }, + { + "epoch": 0.47, + "learning_rate": 2.8605932184527996e-06, + "loss": 1.1491, + "step": 15612 + }, + { + "epoch": 0.47, + "learning_rate": 2.8603518473289678e-06, + "loss": 1.2304, + "step": 15613 + }, + { + "epoch": 0.47, + "learning_rate": 2.860110472774759e-06, + "loss": 1.0798, + "step": 15614 + }, + { + "epoch": 0.47, + "learning_rate": 2.8598690947924716e-06, + "loss": 1.1926, + "step": 15615 + }, + { + "epoch": 0.47, + "learning_rate": 2.8596277133844053e-06, + "loss": 1.1512, + "step": 15616 + }, + { + "epoch": 0.47, + "learning_rate": 2.859386328552855e-06, + "loss": 1.2949, + "step": 15617 + }, + { + "epoch": 0.47, + "learning_rate": 2.859144940300121e-06, + "loss": 1.2212, + "step": 15618 + }, + { + "epoch": 0.47, + "learning_rate": 2.8589035486284993e-06, + "loss": 1.173, + "step": 15619 + }, + { + "epoch": 0.47, + "learning_rate": 2.8586621535402894e-06, + "loss": 1.1373, + "step": 15620 + }, + { + "epoch": 0.47, + "learning_rate": 2.858420755037788e-06, + "loss": 0.9487, + "step": 15621 + }, + { + "epoch": 0.47, + "learning_rate": 2.8581793531232937e-06, + "loss": 1.0055, + "step": 15622 + }, + { + "epoch": 0.47, + "learning_rate": 2.8579379477991043e-06, + "loss": 1.1744, + "step": 15623 + }, + { + "epoch": 0.47, + "learning_rate": 2.8576965390675183e-06, + "loss": 1.162, + "step": 15624 + }, + { + "epoch": 0.47, + "learning_rate": 2.857455126930833e-06, + "loss": 1.1237, + "step": 15625 + }, + { + "epoch": 0.47, + "learning_rate": 2.8572137113913477e-06, + "loss": 1.0577, + "step": 15626 + }, + { + "epoch": 0.47, + "learning_rate": 2.85697229245136e-06, + "loss": 1.1014, + "step": 15627 + }, + { + "epoch": 0.47, + "learning_rate": 2.8567308701131675e-06, + "loss": 1.074, + "step": 15628 + }, + { + "epoch": 0.47, + "learning_rate": 2.856489444379069e-06, + "loss": 1.1333, + "step": 15629 + }, + { + "epoch": 0.47, + "learning_rate": 2.8562480152513626e-06, + "loss": 1.1923, + "step": 15630 + }, + { + "epoch": 0.47, + "learning_rate": 2.8560065827323474e-06, + "loss": 1.2382, + "step": 15631 + }, + { + "epoch": 0.47, + "learning_rate": 2.8557651468243204e-06, + "loss": 1.0582, + "step": 15632 + }, + { + "epoch": 0.47, + "learning_rate": 2.8555237075295804e-06, + "loss": 1.1489, + "step": 15633 + }, + { + "epoch": 0.47, + "learning_rate": 2.855282264850426e-06, + "loss": 1.1724, + "step": 15634 + }, + { + "epoch": 0.47, + "learning_rate": 2.8550408187891567e-06, + "loss": 1.1995, + "step": 15635 + }, + { + "epoch": 0.47, + "learning_rate": 2.854799369348068e-06, + "loss": 1.1514, + "step": 15636 + }, + { + "epoch": 0.47, + "learning_rate": 2.854557916529461e-06, + "loss": 1.1815, + "step": 15637 + }, + { + "epoch": 0.47, + "learning_rate": 2.8543164603356333e-06, + "loss": 1.0981, + "step": 15638 + }, + { + "epoch": 0.47, + "learning_rate": 2.854075000768884e-06, + "loss": 1.1769, + "step": 15639 + }, + { + "epoch": 0.47, + "learning_rate": 2.8538335378315103e-06, + "loss": 1.0524, + "step": 15640 + }, + { + "epoch": 0.47, + "learning_rate": 2.853592071525812e-06, + "loss": 1.1013, + "step": 15641 + }, + { + "epoch": 0.47, + "learning_rate": 2.853350601854088e-06, + "loss": 1.1372, + "step": 15642 + }, + { + "epoch": 0.47, + "learning_rate": 2.8531091288186365e-06, + "loss": 1.1807, + "step": 15643 + }, + { + "epoch": 0.47, + "learning_rate": 2.8528676524217557e-06, + "loss": 1.1328, + "step": 15644 + }, + { + "epoch": 0.47, + "learning_rate": 2.852626172665745e-06, + "loss": 1.1471, + "step": 15645 + }, + { + "epoch": 0.47, + "learning_rate": 2.8523846895529027e-06, + "loss": 1.153, + "step": 15646 + }, + { + "epoch": 0.47, + "learning_rate": 2.852143203085528e-06, + "loss": 1.174, + "step": 15647 + }, + { + "epoch": 0.47, + "learning_rate": 2.8519017132659204e-06, + "loss": 1.0992, + "step": 15648 + }, + { + "epoch": 0.47, + "learning_rate": 2.8516602200963765e-06, + "loss": 1.0385, + "step": 15649 + }, + { + "epoch": 0.47, + "learning_rate": 2.851418723579198e-06, + "loss": 1.1651, + "step": 15650 + }, + { + "epoch": 0.47, + "learning_rate": 2.8511772237166818e-06, + "loss": 1.038, + "step": 15651 + }, + { + "epoch": 0.47, + "learning_rate": 2.8509357205111277e-06, + "loss": 1.0757, + "step": 15652 + }, + { + "epoch": 0.47, + "learning_rate": 2.8506942139648342e-06, + "loss": 1.0245, + "step": 15653 + }, + { + "epoch": 0.47, + "learning_rate": 2.8504527040801005e-06, + "loss": 1.1276, + "step": 15654 + }, + { + "epoch": 0.47, + "learning_rate": 2.850211190859227e-06, + "loss": 1.1207, + "step": 15655 + }, + { + "epoch": 0.47, + "learning_rate": 2.8499696743045106e-06, + "loss": 1.1945, + "step": 15656 + }, + { + "epoch": 0.47, + "learning_rate": 2.849728154418252e-06, + "loss": 1.2106, + "step": 15657 + }, + { + "epoch": 0.47, + "learning_rate": 2.8494866312027495e-06, + "loss": 1.1016, + "step": 15658 + }, + { + "epoch": 0.47, + "learning_rate": 2.849245104660303e-06, + "loss": 1.1637, + "step": 15659 + }, + { + "epoch": 0.47, + "learning_rate": 2.849003574793211e-06, + "loss": 1.1389, + "step": 15660 + }, + { + "epoch": 0.47, + "learning_rate": 2.8487620416037735e-06, + "loss": 1.0972, + "step": 15661 + }, + { + "epoch": 0.47, + "learning_rate": 2.848520505094289e-06, + "loss": 1.1602, + "step": 15662 + }, + { + "epoch": 0.47, + "learning_rate": 2.8482789652670574e-06, + "loss": 1.2797, + "step": 15663 + }, + { + "epoch": 0.47, + "learning_rate": 2.848037422124377e-06, + "loss": 1.1127, + "step": 15664 + }, + { + "epoch": 0.47, + "learning_rate": 2.847795875668548e-06, + "loss": 1.1205, + "step": 15665 + }, + { + "epoch": 0.47, + "learning_rate": 2.84755432590187e-06, + "loss": 1.1664, + "step": 15666 + }, + { + "epoch": 0.47, + "learning_rate": 2.8473127728266427e-06, + "loss": 1.2198, + "step": 15667 + }, + { + "epoch": 0.47, + "learning_rate": 2.8470712164451645e-06, + "loss": 1.183, + "step": 15668 + }, + { + "epoch": 0.47, + "learning_rate": 2.846829656759736e-06, + "loss": 1.2456, + "step": 15669 + }, + { + "epoch": 0.47, + "learning_rate": 2.8465880937726566e-06, + "loss": 1.0652, + "step": 15670 + }, + { + "epoch": 0.47, + "learning_rate": 2.846346527486224e-06, + "loss": 1.1077, + "step": 15671 + }, + { + "epoch": 0.47, + "learning_rate": 2.8461049579027404e-06, + "loss": 1.0833, + "step": 15672 + }, + { + "epoch": 0.47, + "learning_rate": 2.8458633850245036e-06, + "loss": 1.1633, + "step": 15673 + }, + { + "epoch": 0.47, + "learning_rate": 2.845621808853815e-06, + "loss": 1.2062, + "step": 15674 + }, + { + "epoch": 0.47, + "learning_rate": 2.845380229392972e-06, + "loss": 1.1697, + "step": 15675 + }, + { + "epoch": 0.47, + "learning_rate": 2.8451386466442773e-06, + "loss": 1.1102, + "step": 15676 + }, + { + "epoch": 0.47, + "learning_rate": 2.8448970606100268e-06, + "loss": 1.1168, + "step": 15677 + }, + { + "epoch": 0.47, + "learning_rate": 2.8446554712925232e-06, + "loss": 1.0455, + "step": 15678 + }, + { + "epoch": 0.47, + "learning_rate": 2.8444138786940655e-06, + "loss": 1.1006, + "step": 15679 + }, + { + "epoch": 0.47, + "learning_rate": 2.8441722828169542e-06, + "loss": 1.194, + "step": 15680 + }, + { + "epoch": 0.47, + "learning_rate": 2.8439306836634877e-06, + "loss": 1.1567, + "step": 15681 + }, + { + "epoch": 0.47, + "learning_rate": 2.843689081235967e-06, + "loss": 1.1198, + "step": 15682 + }, + { + "epoch": 0.47, + "learning_rate": 2.843447475536692e-06, + "loss": 1.1751, + "step": 15683 + }, + { + "epoch": 0.47, + "learning_rate": 2.843205866567962e-06, + "loss": 1.1116, + "step": 15684 + }, + { + "epoch": 0.47, + "learning_rate": 2.842964254332078e-06, + "loss": 1.0313, + "step": 15685 + }, + { + "epoch": 0.47, + "learning_rate": 2.8427226388313388e-06, + "loss": 1.1708, + "step": 15686 + }, + { + "epoch": 0.47, + "learning_rate": 2.8424810200680465e-06, + "loss": 1.1591, + "step": 15687 + }, + { + "epoch": 0.47, + "learning_rate": 2.8422393980444985e-06, + "loss": 1.1716, + "step": 15688 + }, + { + "epoch": 0.47, + "learning_rate": 2.8419977727629967e-06, + "loss": 1.1936, + "step": 15689 + }, + { + "epoch": 0.47, + "learning_rate": 2.8417561442258408e-06, + "loss": 1.0726, + "step": 15690 + }, + { + "epoch": 0.47, + "learning_rate": 2.8415145124353313e-06, + "loss": 1.1803, + "step": 15691 + }, + { + "epoch": 0.47, + "learning_rate": 2.841272877393767e-06, + "loss": 1.1077, + "step": 15692 + }, + { + "epoch": 0.47, + "learning_rate": 2.84103123910345e-06, + "loss": 1.1981, + "step": 15693 + }, + { + "epoch": 0.47, + "learning_rate": 2.8407895975666793e-06, + "loss": 1.0876, + "step": 15694 + }, + { + "epoch": 0.47, + "learning_rate": 2.8405479527857565e-06, + "loss": 1.1046, + "step": 15695 + }, + { + "epoch": 0.47, + "learning_rate": 2.8403063047629816e-06, + "loss": 1.0863, + "step": 15696 + }, + { + "epoch": 0.47, + "learning_rate": 2.8400646535006538e-06, + "loss": 1.1383, + "step": 15697 + }, + { + "epoch": 0.47, + "learning_rate": 2.8398229990010745e-06, + "loss": 1.1161, + "step": 15698 + }, + { + "epoch": 0.47, + "learning_rate": 2.8395813412665433e-06, + "loss": 1.2491, + "step": 15699 + }, + { + "epoch": 0.47, + "learning_rate": 2.8393396802993626e-06, + "loss": 1.2007, + "step": 15700 + }, + { + "epoch": 0.47, + "learning_rate": 2.8390980161018304e-06, + "loss": 1.1821, + "step": 15701 + }, + { + "epoch": 0.47, + "learning_rate": 2.838856348676249e-06, + "loss": 1.0787, + "step": 15702 + }, + { + "epoch": 0.47, + "learning_rate": 2.8386146780249183e-06, + "loss": 1.1014, + "step": 15703 + }, + { + "epoch": 0.47, + "learning_rate": 2.8383730041501397e-06, + "loss": 1.3087, + "step": 15704 + }, + { + "epoch": 0.47, + "learning_rate": 2.8381313270542116e-06, + "loss": 1.2269, + "step": 15705 + }, + { + "epoch": 0.47, + "learning_rate": 2.8378896467394368e-06, + "loss": 1.2182, + "step": 15706 + }, + { + "epoch": 0.47, + "learning_rate": 2.837647963208115e-06, + "loss": 1.015, + "step": 15707 + }, + { + "epoch": 0.47, + "learning_rate": 2.837406276462547e-06, + "loss": 1.1423, + "step": 15708 + }, + { + "epoch": 0.47, + "learning_rate": 2.8371645865050347e-06, + "loss": 1.0801, + "step": 15709 + }, + { + "epoch": 0.47, + "learning_rate": 2.8369228933378766e-06, + "loss": 1.0839, + "step": 15710 + }, + { + "epoch": 0.47, + "learning_rate": 2.836681196963376e-06, + "loss": 1.1504, + "step": 15711 + }, + { + "epoch": 0.47, + "learning_rate": 2.8364394973838322e-06, + "loss": 1.0372, + "step": 15712 + }, + { + "epoch": 0.47, + "learning_rate": 2.8361977946015466e-06, + "loss": 1.1924, + "step": 15713 + }, + { + "epoch": 0.47, + "learning_rate": 2.83595608861882e-06, + "loss": 1.1296, + "step": 15714 + }, + { + "epoch": 0.47, + "learning_rate": 2.8357143794379533e-06, + "loss": 1.1696, + "step": 15715 + }, + { + "epoch": 0.47, + "learning_rate": 2.8354726670612463e-06, + "loss": 1.1274, + "step": 15716 + }, + { + "epoch": 0.47, + "learning_rate": 2.8352309514910027e-06, + "loss": 1.1025, + "step": 15717 + }, + { + "epoch": 0.47, + "learning_rate": 2.834989232729521e-06, + "loss": 1.1508, + "step": 15718 + }, + { + "epoch": 0.47, + "learning_rate": 2.834747510779103e-06, + "loss": 1.1436, + "step": 15719 + }, + { + "epoch": 0.47, + "learning_rate": 2.8345057856420495e-06, + "loss": 1.0414, + "step": 15720 + }, + { + "epoch": 0.47, + "learning_rate": 2.834264057320663e-06, + "loss": 1.0894, + "step": 15721 + }, + { + "epoch": 0.47, + "learning_rate": 2.8340223258172427e-06, + "loss": 0.9772, + "step": 15722 + }, + { + "epoch": 0.47, + "learning_rate": 2.8337805911340915e-06, + "loss": 1.1258, + "step": 15723 + }, + { + "epoch": 0.47, + "learning_rate": 2.8335388532735098e-06, + "loss": 1.1698, + "step": 15724 + }, + { + "epoch": 0.47, + "learning_rate": 2.8332971122377983e-06, + "loss": 1.1793, + "step": 15725 + }, + { + "epoch": 0.47, + "learning_rate": 2.83305536802926e-06, + "loss": 1.1547, + "step": 15726 + }, + { + "epoch": 0.47, + "learning_rate": 2.832813620650194e-06, + "loss": 1.1132, + "step": 15727 + }, + { + "epoch": 0.47, + "learning_rate": 2.832571870102903e-06, + "loss": 1.1866, + "step": 15728 + }, + { + "epoch": 0.47, + "learning_rate": 2.8323301163896876e-06, + "loss": 1.094, + "step": 15729 + }, + { + "epoch": 0.47, + "learning_rate": 2.8320883595128503e-06, + "loss": 1.1392, + "step": 15730 + }, + { + "epoch": 0.47, + "learning_rate": 2.8318465994746907e-06, + "loss": 1.1655, + "step": 15731 + }, + { + "epoch": 0.47, + "learning_rate": 2.8316048362775124e-06, + "loss": 1.0966, + "step": 15732 + }, + { + "epoch": 0.47, + "learning_rate": 2.831363069923615e-06, + "loss": 1.0826, + "step": 15733 + }, + { + "epoch": 0.47, + "learning_rate": 2.8311213004153003e-06, + "loss": 0.9972, + "step": 15734 + }, + { + "epoch": 0.47, + "learning_rate": 2.8308795277548705e-06, + "loss": 1.1285, + "step": 15735 + }, + { + "epoch": 0.47, + "learning_rate": 2.8306377519446275e-06, + "loss": 1.2134, + "step": 15736 + }, + { + "epoch": 0.47, + "learning_rate": 2.8303959729868724e-06, + "loss": 1.0726, + "step": 15737 + }, + { + "epoch": 0.47, + "learning_rate": 2.8301541908839065e-06, + "loss": 1.1449, + "step": 15738 + }, + { + "epoch": 0.47, + "learning_rate": 2.8299124056380324e-06, + "loss": 1.1572, + "step": 15739 + }, + { + "epoch": 0.47, + "learning_rate": 2.82967061725155e-06, + "loss": 1.0914, + "step": 15740 + }, + { + "epoch": 0.47, + "learning_rate": 2.8294288257267626e-06, + "loss": 1.1031, + "step": 15741 + }, + { + "epoch": 0.47, + "learning_rate": 2.829187031065971e-06, + "loss": 1.1276, + "step": 15742 + }, + { + "epoch": 0.47, + "learning_rate": 2.8289452332714785e-06, + "loss": 1.1263, + "step": 15743 + }, + { + "epoch": 0.47, + "learning_rate": 2.8287034323455847e-06, + "loss": 1.064, + "step": 15744 + }, + { + "epoch": 0.47, + "learning_rate": 2.8284616282905935e-06, + "loss": 1.0815, + "step": 15745 + }, + { + "epoch": 0.47, + "learning_rate": 2.8282198211088053e-06, + "loss": 1.0972, + "step": 15746 + }, + { + "epoch": 0.47, + "learning_rate": 2.8279780108025217e-06, + "loss": 1.1523, + "step": 15747 + }, + { + "epoch": 0.47, + "learning_rate": 2.8277361973740463e-06, + "loss": 1.0793, + "step": 15748 + }, + { + "epoch": 0.47, + "learning_rate": 2.8274943808256792e-06, + "loss": 1.1396, + "step": 15749 + }, + { + "epoch": 0.47, + "learning_rate": 2.8272525611597248e-06, + "loss": 1.0883, + "step": 15750 + }, + { + "epoch": 0.47, + "learning_rate": 2.8270107383784827e-06, + "loss": 1.0867, + "step": 15751 + }, + { + "epoch": 0.47, + "learning_rate": 2.826768912484256e-06, + "loss": 1.166, + "step": 15752 + }, + { + "epoch": 0.47, + "learning_rate": 2.8265270834793466e-06, + "loss": 1.0722, + "step": 15753 + }, + { + "epoch": 0.47, + "learning_rate": 2.8262852513660575e-06, + "loss": 1.1102, + "step": 15754 + }, + { + "epoch": 0.47, + "learning_rate": 2.826043416146689e-06, + "loss": 1.1786, + "step": 15755 + }, + { + "epoch": 0.47, + "learning_rate": 2.825801577823545e-06, + "loss": 1.1751, + "step": 15756 + }, + { + "epoch": 0.47, + "learning_rate": 2.8255597363989256e-06, + "loss": 1.0936, + "step": 15757 + }, + { + "epoch": 0.47, + "learning_rate": 2.8253178918751355e-06, + "loss": 1.1324, + "step": 15758 + }, + { + "epoch": 0.47, + "learning_rate": 2.825076044254475e-06, + "loss": 1.1893, + "step": 15759 + }, + { + "epoch": 0.47, + "learning_rate": 2.824834193539247e-06, + "loss": 1.058, + "step": 15760 + }, + { + "epoch": 0.47, + "learning_rate": 2.824592339731754e-06, + "loss": 1.2367, + "step": 15761 + }, + { + "epoch": 0.47, + "learning_rate": 2.8243504828342984e-06, + "loss": 1.1476, + "step": 15762 + }, + { + "epoch": 0.47, + "learning_rate": 2.824108622849183e-06, + "loss": 1.0305, + "step": 15763 + }, + { + "epoch": 0.47, + "learning_rate": 2.823866759778709e-06, + "loss": 1.1476, + "step": 15764 + }, + { + "epoch": 0.47, + "learning_rate": 2.8236248936251797e-06, + "loss": 1.1052, + "step": 15765 + }, + { + "epoch": 0.47, + "learning_rate": 2.823383024390897e-06, + "loss": 1.1506, + "step": 15766 + }, + { + "epoch": 0.47, + "learning_rate": 2.823141152078164e-06, + "loss": 1.2333, + "step": 15767 + }, + { + "epoch": 0.48, + "learning_rate": 2.822899276689283e-06, + "loss": 1.2029, + "step": 15768 + }, + { + "epoch": 0.48, + "learning_rate": 2.822657398226556e-06, + "loss": 1.1074, + "step": 15769 + }, + { + "epoch": 0.48, + "learning_rate": 2.8224155166922858e-06, + "loss": 1.2382, + "step": 15770 + }, + { + "epoch": 0.48, + "learning_rate": 2.822173632088776e-06, + "loss": 1.0911, + "step": 15771 + }, + { + "epoch": 0.48, + "learning_rate": 2.8219317444183275e-06, + "loss": 1.1519, + "step": 15772 + }, + { + "epoch": 0.48, + "learning_rate": 2.821689853683244e-06, + "loss": 1.0919, + "step": 15773 + }, + { + "epoch": 0.48, + "learning_rate": 2.821447959885828e-06, + "loss": 1.186, + "step": 15774 + }, + { + "epoch": 0.48, + "learning_rate": 2.8212060630283822e-06, + "loss": 1.0684, + "step": 15775 + }, + { + "epoch": 0.48, + "learning_rate": 2.8209641631132096e-06, + "loss": 1.2028, + "step": 15776 + }, + { + "epoch": 0.48, + "learning_rate": 2.8207222601426126e-06, + "loss": 1.1364, + "step": 15777 + }, + { + "epoch": 0.48, + "learning_rate": 2.8204803541188947e-06, + "loss": 1.1792, + "step": 15778 + }, + { + "epoch": 0.48, + "learning_rate": 2.820238445044357e-06, + "loss": 1.2966, + "step": 15779 + }, + { + "epoch": 0.48, + "learning_rate": 2.819996532921305e-06, + "loss": 1.0896, + "step": 15780 + }, + { + "epoch": 0.48, + "learning_rate": 2.819754617752039e-06, + "loss": 1.098, + "step": 15781 + }, + { + "epoch": 0.48, + "learning_rate": 2.819512699538864e-06, + "loss": 1.0439, + "step": 15782 + }, + { + "epoch": 0.48, + "learning_rate": 2.8192707782840812e-06, + "loss": 1.1871, + "step": 15783 + }, + { + "epoch": 0.48, + "learning_rate": 2.8190288539899947e-06, + "loss": 1.1107, + "step": 15784 + }, + { + "epoch": 0.48, + "learning_rate": 2.8187869266589067e-06, + "loss": 1.1133, + "step": 15785 + }, + { + "epoch": 0.48, + "learning_rate": 2.8185449962931216e-06, + "loss": 1.1372, + "step": 15786 + }, + { + "epoch": 0.48, + "learning_rate": 2.8183030628949408e-06, + "loss": 1.2356, + "step": 15787 + }, + { + "epoch": 0.48, + "learning_rate": 2.818061126466668e-06, + "loss": 1.1266, + "step": 15788 + }, + { + "epoch": 0.48, + "learning_rate": 2.8178191870106063e-06, + "loss": 1.1439, + "step": 15789 + }, + { + "epoch": 0.48, + "learning_rate": 2.8175772445290593e-06, + "loss": 1.0853, + "step": 15790 + }, + { + "epoch": 0.48, + "learning_rate": 2.817335299024331e-06, + "loss": 1.0125, + "step": 15791 + }, + { + "epoch": 0.48, + "learning_rate": 2.817093350498722e-06, + "loss": 1.3207, + "step": 15792 + }, + { + "epoch": 0.48, + "learning_rate": 2.8168513989545377e-06, + "loss": 1.1824, + "step": 15793 + }, + { + "epoch": 0.48, + "learning_rate": 2.8166094443940806e-06, + "loss": 1.0826, + "step": 15794 + }, + { + "epoch": 0.48, + "learning_rate": 2.8163674868196546e-06, + "loss": 1.1281, + "step": 15795 + }, + { + "epoch": 0.48, + "learning_rate": 2.8161255262335614e-06, + "loss": 1.1685, + "step": 15796 + }, + { + "epoch": 0.48, + "learning_rate": 2.8158835626381066e-06, + "loss": 1.1527, + "step": 15797 + }, + { + "epoch": 0.48, + "learning_rate": 2.8156415960355914e-06, + "loss": 1.0707, + "step": 15798 + }, + { + "epoch": 0.48, + "learning_rate": 2.8153996264283207e-06, + "loss": 1.0466, + "step": 15799 + }, + { + "epoch": 0.48, + "learning_rate": 2.815157653818597e-06, + "loss": 1.1263, + "step": 15800 + }, + { + "epoch": 0.48, + "learning_rate": 2.8149156782087244e-06, + "loss": 1.2389, + "step": 15801 + }, + { + "epoch": 0.48, + "learning_rate": 2.8146736996010066e-06, + "loss": 1.033, + "step": 15802 + }, + { + "epoch": 0.48, + "learning_rate": 2.814431717997746e-06, + "loss": 1.0972, + "step": 15803 + }, + { + "epoch": 0.48, + "learning_rate": 2.814189733401248e-06, + "loss": 1.1805, + "step": 15804 + }, + { + "epoch": 0.48, + "learning_rate": 2.813947745813814e-06, + "loss": 1.196, + "step": 15805 + }, + { + "epoch": 0.48, + "learning_rate": 2.8137057552377495e-06, + "loss": 1.0582, + "step": 15806 + }, + { + "epoch": 0.48, + "learning_rate": 2.8134637616753567e-06, + "loss": 1.1791, + "step": 15807 + }, + { + "epoch": 0.48, + "learning_rate": 2.8132217651289405e-06, + "loss": 1.145, + "step": 15808 + }, + { + "epoch": 0.48, + "learning_rate": 2.8129797656008036e-06, + "loss": 1.1486, + "step": 15809 + }, + { + "epoch": 0.48, + "learning_rate": 2.81273776309325e-06, + "loss": 1.1284, + "step": 15810 + }, + { + "epoch": 0.48, + "learning_rate": 2.8124957576085834e-06, + "loss": 1.082, + "step": 15811 + }, + { + "epoch": 0.48, + "learning_rate": 2.8122537491491083e-06, + "loss": 1.0887, + "step": 15812 + }, + { + "epoch": 0.48, + "learning_rate": 2.812011737717127e-06, + "loss": 1.1171, + "step": 15813 + }, + { + "epoch": 0.48, + "learning_rate": 2.8117697233149445e-06, + "loss": 1.1827, + "step": 15814 + }, + { + "epoch": 0.48, + "learning_rate": 2.811527705944865e-06, + "loss": 0.9893, + "step": 15815 + }, + { + "epoch": 0.48, + "learning_rate": 2.811285685609191e-06, + "loss": 1.1826, + "step": 15816 + }, + { + "epoch": 0.48, + "learning_rate": 2.811043662310227e-06, + "loss": 1.2837, + "step": 15817 + }, + { + "epoch": 0.48, + "learning_rate": 2.8108016360502776e-06, + "loss": 1.2025, + "step": 15818 + }, + { + "epoch": 0.48, + "learning_rate": 2.8105596068316466e-06, + "loss": 1.1143, + "step": 15819 + }, + { + "epoch": 0.48, + "learning_rate": 2.8103175746566373e-06, + "loss": 1.1549, + "step": 15820 + }, + { + "epoch": 0.48, + "learning_rate": 2.810075539527555e-06, + "loss": 1.0789, + "step": 15821 + }, + { + "epoch": 0.48, + "learning_rate": 2.8098335014467015e-06, + "loss": 1.1497, + "step": 15822 + }, + { + "epoch": 0.48, + "learning_rate": 2.8095914604163833e-06, + "loss": 1.0611, + "step": 15823 + }, + { + "epoch": 0.48, + "learning_rate": 2.809349416438903e-06, + "loss": 1.1604, + "step": 15824 + }, + { + "epoch": 0.48, + "learning_rate": 2.809107369516566e-06, + "loss": 1.1637, + "step": 15825 + }, + { + "epoch": 0.48, + "learning_rate": 2.8088653196516745e-06, + "loss": 1.0883, + "step": 15826 + }, + { + "epoch": 0.48, + "learning_rate": 2.8086232668465345e-06, + "loss": 1.0762, + "step": 15827 + }, + { + "epoch": 0.48, + "learning_rate": 2.8083812111034505e-06, + "loss": 1.1531, + "step": 15828 + }, + { + "epoch": 0.48, + "learning_rate": 2.8081391524247248e-06, + "loss": 1.2607, + "step": 15829 + }, + { + "epoch": 0.48, + "learning_rate": 2.8078970908126625e-06, + "loss": 1.2229, + "step": 15830 + }, + { + "epoch": 0.48, + "learning_rate": 2.8076550262695686e-06, + "loss": 1.1131, + "step": 15831 + }, + { + "epoch": 0.48, + "learning_rate": 2.8074129587977473e-06, + "loss": 1.0975, + "step": 15832 + }, + { + "epoch": 0.48, + "learning_rate": 2.8071708883995025e-06, + "loss": 1.1271, + "step": 15833 + }, + { + "epoch": 0.48, + "learning_rate": 2.806928815077139e-06, + "loss": 1.2087, + "step": 15834 + }, + { + "epoch": 0.48, + "learning_rate": 2.806686738832961e-06, + "loss": 1.1649, + "step": 15835 + }, + { + "epoch": 0.48, + "learning_rate": 2.8064446596692727e-06, + "loss": 1.121, + "step": 15836 + }, + { + "epoch": 0.48, + "learning_rate": 2.806202577588379e-06, + "loss": 1.0818, + "step": 15837 + }, + { + "epoch": 0.48, + "learning_rate": 2.8059604925925844e-06, + "loss": 1.2614, + "step": 15838 + }, + { + "epoch": 0.48, + "learning_rate": 2.805718404684193e-06, + "loss": 1.1164, + "step": 15839 + }, + { + "epoch": 0.48, + "learning_rate": 2.8054763138655093e-06, + "loss": 1.0414, + "step": 15840 + }, + { + "epoch": 0.48, + "learning_rate": 2.8052342201388387e-06, + "loss": 1.2001, + "step": 15841 + }, + { + "epoch": 0.48, + "learning_rate": 2.804992123506485e-06, + "loss": 1.1055, + "step": 15842 + }, + { + "epoch": 0.48, + "learning_rate": 2.804750023970753e-06, + "loss": 1.2184, + "step": 15843 + }, + { + "epoch": 0.48, + "learning_rate": 2.804507921533948e-06, + "loss": 1.2592, + "step": 15844 + }, + { + "epoch": 0.48, + "learning_rate": 2.8042658161983743e-06, + "loss": 1.17, + "step": 15845 + }, + { + "epoch": 0.48, + "learning_rate": 2.804023707966336e-06, + "loss": 1.0128, + "step": 15846 + }, + { + "epoch": 0.48, + "learning_rate": 2.8037815968401393e-06, + "loss": 0.9963, + "step": 15847 + }, + { + "epoch": 0.48, + "learning_rate": 2.8035394828220876e-06, + "loss": 1.007, + "step": 15848 + }, + { + "epoch": 0.48, + "learning_rate": 2.803297365914487e-06, + "loss": 1.2304, + "step": 15849 + }, + { + "epoch": 0.48, + "learning_rate": 2.8030552461196404e-06, + "loss": 1.0334, + "step": 15850 + }, + { + "epoch": 0.48, + "learning_rate": 2.8028131234398544e-06, + "loss": 1.1462, + "step": 15851 + }, + { + "epoch": 0.48, + "learning_rate": 2.8025709978774327e-06, + "loss": 1.1263, + "step": 15852 + }, + { + "epoch": 0.48, + "learning_rate": 2.802328869434681e-06, + "loss": 1.1093, + "step": 15853 + }, + { + "epoch": 0.48, + "learning_rate": 2.802086738113905e-06, + "loss": 1.1143, + "step": 15854 + }, + { + "epoch": 0.48, + "learning_rate": 2.8018446039174075e-06, + "loss": 1.1556, + "step": 15855 + }, + { + "epoch": 0.48, + "learning_rate": 2.8016024668474957e-06, + "loss": 1.1443, + "step": 15856 + }, + { + "epoch": 0.48, + "learning_rate": 2.8013603269064733e-06, + "loss": 1.1166, + "step": 15857 + }, + { + "epoch": 0.48, + "learning_rate": 2.8011181840966453e-06, + "loss": 1.1925, + "step": 15858 + }, + { + "epoch": 0.48, + "learning_rate": 2.8008760384203175e-06, + "loss": 1.1765, + "step": 15859 + }, + { + "epoch": 0.48, + "learning_rate": 2.8006338898797953e-06, + "loss": 1.1426, + "step": 15860 + }, + { + "epoch": 0.48, + "learning_rate": 2.8003917384773825e-06, + "loss": 1.2002, + "step": 15861 + }, + { + "epoch": 0.48, + "learning_rate": 2.800149584215385e-06, + "loss": 1.1816, + "step": 15862 + }, + { + "epoch": 0.48, + "learning_rate": 2.7999074270961086e-06, + "loss": 1.0948, + "step": 15863 + }, + { + "epoch": 0.48, + "learning_rate": 2.7996652671218584e-06, + "loss": 1.1857, + "step": 15864 + }, + { + "epoch": 0.48, + "learning_rate": 2.7994231042949375e-06, + "loss": 1.1375, + "step": 15865 + }, + { + "epoch": 0.48, + "learning_rate": 2.7991809386176542e-06, + "loss": 1.1251, + "step": 15866 + }, + { + "epoch": 0.48, + "learning_rate": 2.798938770092312e-06, + "loss": 1.083, + "step": 15867 + }, + { + "epoch": 0.48, + "learning_rate": 2.7986965987212165e-06, + "loss": 1.0687, + "step": 15868 + }, + { + "epoch": 0.48, + "learning_rate": 2.798454424506674e-06, + "loss": 1.0422, + "step": 15869 + }, + { + "epoch": 0.48, + "learning_rate": 2.798212247450988e-06, + "loss": 1.124, + "step": 15870 + }, + { + "epoch": 0.48, + "learning_rate": 2.797970067556466e-06, + "loss": 1.0912, + "step": 15871 + }, + { + "epoch": 0.48, + "learning_rate": 2.797727884825412e-06, + "loss": 1.0186, + "step": 15872 + }, + { + "epoch": 0.48, + "learning_rate": 2.7974856992601317e-06, + "loss": 1.2622, + "step": 15873 + }, + { + "epoch": 0.48, + "learning_rate": 2.7972435108629315e-06, + "loss": 1.2587, + "step": 15874 + }, + { + "epoch": 0.48, + "learning_rate": 2.7970013196361157e-06, + "loss": 1.2162, + "step": 15875 + }, + { + "epoch": 0.48, + "learning_rate": 2.7967591255819903e-06, + "loss": 1.1089, + "step": 15876 + }, + { + "epoch": 0.48, + "learning_rate": 2.7965169287028614e-06, + "loss": 1.1506, + "step": 15877 + }, + { + "epoch": 0.48, + "learning_rate": 2.7962747290010337e-06, + "loss": 1.102, + "step": 15878 + }, + { + "epoch": 0.48, + "learning_rate": 2.796032526478814e-06, + "loss": 1.1649, + "step": 15879 + }, + { + "epoch": 0.48, + "learning_rate": 2.7957903211385067e-06, + "loss": 1.2628, + "step": 15880 + }, + { + "epoch": 0.48, + "learning_rate": 2.795548112982418e-06, + "loss": 1.1657, + "step": 15881 + }, + { + "epoch": 0.48, + "learning_rate": 2.7953059020128535e-06, + "loss": 1.1932, + "step": 15882 + }, + { + "epoch": 0.48, + "learning_rate": 2.7950636882321193e-06, + "loss": 1.1118, + "step": 15883 + }, + { + "epoch": 0.48, + "learning_rate": 2.79482147164252e-06, + "loss": 1.1571, + "step": 15884 + }, + { + "epoch": 0.48, + "learning_rate": 2.7945792522463634e-06, + "loss": 1.1457, + "step": 15885 + }, + { + "epoch": 0.48, + "learning_rate": 2.7943370300459544e-06, + "loss": 1.2512, + "step": 15886 + }, + { + "epoch": 0.48, + "learning_rate": 2.794094805043598e-06, + "loss": 1.0766, + "step": 15887 + }, + { + "epoch": 0.48, + "learning_rate": 2.7938525772416008e-06, + "loss": 1.2145, + "step": 15888 + }, + { + "epoch": 0.48, + "learning_rate": 2.793610346642268e-06, + "loss": 1.0289, + "step": 15889 + }, + { + "epoch": 0.48, + "learning_rate": 2.7933681132479076e-06, + "loss": 1.0585, + "step": 15890 + }, + { + "epoch": 0.48, + "learning_rate": 2.7931258770608226e-06, + "loss": 1.1281, + "step": 15891 + }, + { + "epoch": 0.48, + "learning_rate": 2.7928836380833215e-06, + "loss": 1.1946, + "step": 15892 + }, + { + "epoch": 0.48, + "learning_rate": 2.7926413963177085e-06, + "loss": 1.1229, + "step": 15893 + }, + { + "epoch": 0.48, + "learning_rate": 2.79239915176629e-06, + "loss": 1.0831, + "step": 15894 + }, + { + "epoch": 0.48, + "learning_rate": 2.7921569044313736e-06, + "loss": 1.1061, + "step": 15895 + }, + { + "epoch": 0.48, + "learning_rate": 2.791914654315263e-06, + "loss": 1.081, + "step": 15896 + }, + { + "epoch": 0.48, + "learning_rate": 2.791672401420266e-06, + "loss": 1.0427, + "step": 15897 + }, + { + "epoch": 0.48, + "learning_rate": 2.7914301457486882e-06, + "loss": 1.1341, + "step": 15898 + }, + { + "epoch": 0.48, + "learning_rate": 2.7911878873028353e-06, + "loss": 1.001, + "step": 15899 + }, + { + "epoch": 0.48, + "learning_rate": 2.790945626085014e-06, + "loss": 1.1184, + "step": 15900 + }, + { + "epoch": 0.48, + "learning_rate": 2.7907033620975315e-06, + "loss": 1.2368, + "step": 15901 + }, + { + "epoch": 0.48, + "learning_rate": 2.7904610953426924e-06, + "loss": 1.0264, + "step": 15902 + }, + { + "epoch": 0.48, + "learning_rate": 2.7902188258228035e-06, + "loss": 1.1085, + "step": 15903 + }, + { + "epoch": 0.48, + "learning_rate": 2.7899765535401715e-06, + "loss": 1.1982, + "step": 15904 + }, + { + "epoch": 0.48, + "learning_rate": 2.7897342784971022e-06, + "loss": 1.1452, + "step": 15905 + }, + { + "epoch": 0.48, + "learning_rate": 2.789492000695902e-06, + "loss": 1.2686, + "step": 15906 + }, + { + "epoch": 0.48, + "learning_rate": 2.789249720138877e-06, + "loss": 1.0075, + "step": 15907 + }, + { + "epoch": 0.48, + "learning_rate": 2.7890074368283345e-06, + "loss": 1.1171, + "step": 15908 + }, + { + "epoch": 0.48, + "learning_rate": 2.7887651507665804e-06, + "loss": 1.0785, + "step": 15909 + }, + { + "epoch": 0.48, + "learning_rate": 2.7885228619559206e-06, + "loss": 1.1324, + "step": 15910 + }, + { + "epoch": 0.48, + "learning_rate": 2.7882805703986625e-06, + "loss": 1.0767, + "step": 15911 + }, + { + "epoch": 0.48, + "learning_rate": 2.788038276097112e-06, + "loss": 1.2861, + "step": 15912 + }, + { + "epoch": 0.48, + "learning_rate": 2.787795979053576e-06, + "loss": 1.0555, + "step": 15913 + }, + { + "epoch": 0.48, + "learning_rate": 2.787553679270361e-06, + "loss": 1.0328, + "step": 15914 + }, + { + "epoch": 0.48, + "learning_rate": 2.7873113767497734e-06, + "loss": 1.0788, + "step": 15915 + }, + { + "epoch": 0.48, + "learning_rate": 2.78706907149412e-06, + "loss": 1.1522, + "step": 15916 + }, + { + "epoch": 0.48, + "learning_rate": 2.7868267635057066e-06, + "loss": 1.2133, + "step": 15917 + }, + { + "epoch": 0.48, + "learning_rate": 2.786584452786842e-06, + "loss": 1.1829, + "step": 15918 + }, + { + "epoch": 0.48, + "learning_rate": 2.78634213933983e-06, + "loss": 1.231, + "step": 15919 + }, + { + "epoch": 0.48, + "learning_rate": 2.7860998231669788e-06, + "loss": 1.092, + "step": 15920 + }, + { + "epoch": 0.48, + "learning_rate": 2.785857504270596e-06, + "loss": 1.0593, + "step": 15921 + }, + { + "epoch": 0.48, + "learning_rate": 2.7856151826529865e-06, + "loss": 1.0176, + "step": 15922 + }, + { + "epoch": 0.48, + "learning_rate": 2.785372858316459e-06, + "loss": 1.0851, + "step": 15923 + }, + { + "epoch": 0.48, + "learning_rate": 2.7851305312633185e-06, + "loss": 1.1845, + "step": 15924 + }, + { + "epoch": 0.48, + "learning_rate": 2.7848882014958727e-06, + "loss": 1.0592, + "step": 15925 + }, + { + "epoch": 0.48, + "learning_rate": 2.7846458690164285e-06, + "loss": 1.1414, + "step": 15926 + }, + { + "epoch": 0.48, + "learning_rate": 2.7844035338272932e-06, + "loss": 1.1316, + "step": 15927 + }, + { + "epoch": 0.48, + "learning_rate": 2.784161195930773e-06, + "loss": 1.0996, + "step": 15928 + }, + { + "epoch": 0.48, + "learning_rate": 2.7839188553291753e-06, + "loss": 1.1293, + "step": 15929 + }, + { + "epoch": 0.48, + "learning_rate": 2.7836765120248067e-06, + "loss": 1.2014, + "step": 15930 + }, + { + "epoch": 0.48, + "learning_rate": 2.7834341660199743e-06, + "loss": 1.1342, + "step": 15931 + }, + { + "epoch": 0.48, + "learning_rate": 2.783191817316985e-06, + "loss": 0.9939, + "step": 15932 + }, + { + "epoch": 0.48, + "learning_rate": 2.7829494659181454e-06, + "loss": 1.1471, + "step": 15933 + }, + { + "epoch": 0.48, + "learning_rate": 2.782707111825764e-06, + "loss": 1.0997, + "step": 15934 + }, + { + "epoch": 0.48, + "learning_rate": 2.782464755042147e-06, + "loss": 1.114, + "step": 15935 + }, + { + "epoch": 0.48, + "learning_rate": 2.7822223955696015e-06, + "loss": 1.1665, + "step": 15936 + }, + { + "epoch": 0.48, + "learning_rate": 2.7819800334104346e-06, + "loss": 1.1671, + "step": 15937 + }, + { + "epoch": 0.48, + "learning_rate": 2.781737668566954e-06, + "loss": 1.1064, + "step": 15938 + }, + { + "epoch": 0.48, + "learning_rate": 2.781495301041466e-06, + "loss": 1.1514, + "step": 15939 + }, + { + "epoch": 0.48, + "learning_rate": 2.781252930836278e-06, + "loss": 1.1168, + "step": 15940 + }, + { + "epoch": 0.48, + "learning_rate": 2.781010557953698e-06, + "loss": 1.0792, + "step": 15941 + }, + { + "epoch": 0.48, + "learning_rate": 2.7807681823960325e-06, + "loss": 1.1866, + "step": 15942 + }, + { + "epoch": 0.48, + "learning_rate": 2.7805258041655893e-06, + "loss": 1.0875, + "step": 15943 + }, + { + "epoch": 0.48, + "learning_rate": 2.7802834232646758e-06, + "loss": 1.0889, + "step": 15944 + }, + { + "epoch": 0.48, + "learning_rate": 2.780041039695599e-06, + "loss": 1.1226, + "step": 15945 + }, + { + "epoch": 0.48, + "learning_rate": 2.779798653460667e-06, + "loss": 1.1023, + "step": 15946 + }, + { + "epoch": 0.48, + "learning_rate": 2.7795562645621853e-06, + "loss": 1.0813, + "step": 15947 + }, + { + "epoch": 0.48, + "learning_rate": 2.7793138730024632e-06, + "loss": 1.1802, + "step": 15948 + }, + { + "epoch": 0.48, + "learning_rate": 2.7790714787838073e-06, + "loss": 1.1487, + "step": 15949 + }, + { + "epoch": 0.48, + "learning_rate": 2.7788290819085257e-06, + "loss": 1.0972, + "step": 15950 + }, + { + "epoch": 0.48, + "learning_rate": 2.778586682378926e-06, + "loss": 1.0242, + "step": 15951 + }, + { + "epoch": 0.48, + "learning_rate": 2.7783442801973145e-06, + "loss": 1.115, + "step": 15952 + }, + { + "epoch": 0.48, + "learning_rate": 2.7781018753659994e-06, + "loss": 1.0715, + "step": 15953 + }, + { + "epoch": 0.48, + "learning_rate": 2.7778594678872883e-06, + "loss": 1.0953, + "step": 15954 + }, + { + "epoch": 0.48, + "learning_rate": 2.77761705776349e-06, + "loss": 1.0111, + "step": 15955 + }, + { + "epoch": 0.48, + "learning_rate": 2.7773746449969097e-06, + "loss": 1.1254, + "step": 15956 + }, + { + "epoch": 0.48, + "learning_rate": 2.777132229589857e-06, + "loss": 1.0551, + "step": 15957 + }, + { + "epoch": 0.48, + "learning_rate": 2.7768898115446384e-06, + "loss": 1.1159, + "step": 15958 + }, + { + "epoch": 0.48, + "learning_rate": 2.776647390863563e-06, + "loss": 1.2104, + "step": 15959 + }, + { + "epoch": 0.48, + "learning_rate": 2.776404967548937e-06, + "loss": 1.0636, + "step": 15960 + }, + { + "epoch": 0.48, + "learning_rate": 2.776162541603069e-06, + "loss": 1.1579, + "step": 15961 + }, + { + "epoch": 0.48, + "learning_rate": 2.7759201130282676e-06, + "loss": 1.2128, + "step": 15962 + }, + { + "epoch": 0.48, + "learning_rate": 2.775677681826838e-06, + "loss": 1.0276, + "step": 15963 + }, + { + "epoch": 0.48, + "learning_rate": 2.775435248001091e-06, + "loss": 1.109, + "step": 15964 + }, + { + "epoch": 0.48, + "learning_rate": 2.7751928115533323e-06, + "loss": 1.1409, + "step": 15965 + }, + { + "epoch": 0.48, + "learning_rate": 2.7749503724858705e-06, + "loss": 1.1539, + "step": 15966 + }, + { + "epoch": 0.48, + "learning_rate": 2.7747079308010137e-06, + "loss": 1.1566, + "step": 15967 + }, + { + "epoch": 0.48, + "learning_rate": 2.77446548650107e-06, + "loss": 1.1265, + "step": 15968 + }, + { + "epoch": 0.48, + "learning_rate": 2.774223039588347e-06, + "loss": 1.0158, + "step": 15969 + }, + { + "epoch": 0.48, + "learning_rate": 2.7739805900651526e-06, + "loss": 1.041, + "step": 15970 + }, + { + "epoch": 0.48, + "learning_rate": 2.7737381379337954e-06, + "loss": 1.17, + "step": 15971 + }, + { + "epoch": 0.48, + "learning_rate": 2.7734956831965827e-06, + "loss": 1.1996, + "step": 15972 + }, + { + "epoch": 0.48, + "learning_rate": 2.773253225855822e-06, + "loss": 1.177, + "step": 15973 + }, + { + "epoch": 0.48, + "learning_rate": 2.7730107659138227e-06, + "loss": 1.1345, + "step": 15974 + }, + { + "epoch": 0.48, + "learning_rate": 2.772768303372893e-06, + "loss": 1.1562, + "step": 15975 + }, + { + "epoch": 0.48, + "learning_rate": 2.7725258382353397e-06, + "loss": 1.0854, + "step": 15976 + }, + { + "epoch": 0.48, + "learning_rate": 2.7722833705034723e-06, + "loss": 1.2116, + "step": 15977 + }, + { + "epoch": 0.48, + "learning_rate": 2.7720409001795977e-06, + "loss": 1.0856, + "step": 15978 + }, + { + "epoch": 0.48, + "learning_rate": 2.7717984272660253e-06, + "loss": 1.2396, + "step": 15979 + }, + { + "epoch": 0.48, + "learning_rate": 2.7715559517650624e-06, + "loss": 1.0737, + "step": 15980 + }, + { + "epoch": 0.48, + "learning_rate": 2.7713134736790177e-06, + "loss": 1.2092, + "step": 15981 + }, + { + "epoch": 0.48, + "learning_rate": 2.771070993010199e-06, + "loss": 1.1055, + "step": 15982 + }, + { + "epoch": 0.48, + "learning_rate": 2.7708285097609157e-06, + "loss": 1.124, + "step": 15983 + }, + { + "epoch": 0.48, + "learning_rate": 2.7705860239334748e-06, + "loss": 1.1552, + "step": 15984 + }, + { + "epoch": 0.48, + "learning_rate": 2.770343535530186e-06, + "loss": 1.1707, + "step": 15985 + }, + { + "epoch": 0.48, + "learning_rate": 2.7701010445533564e-06, + "loss": 1.1041, + "step": 15986 + }, + { + "epoch": 0.48, + "learning_rate": 2.769858551005295e-06, + "loss": 1.2188, + "step": 15987 + }, + { + "epoch": 0.48, + "learning_rate": 2.7696160548883107e-06, + "loss": 1.0878, + "step": 15988 + }, + { + "epoch": 0.48, + "learning_rate": 2.7693735562047104e-06, + "loss": 1.0731, + "step": 15989 + }, + { + "epoch": 0.48, + "learning_rate": 2.7691310549568047e-06, + "loss": 1.1761, + "step": 15990 + }, + { + "epoch": 0.48, + "learning_rate": 2.7688885511469e-06, + "loss": 1.1047, + "step": 15991 + }, + { + "epoch": 0.48, + "learning_rate": 2.7686460447773067e-06, + "loss": 1.1591, + "step": 15992 + }, + { + "epoch": 0.48, + "learning_rate": 2.7684035358503316e-06, + "loss": 1.1494, + "step": 15993 + }, + { + "epoch": 0.48, + "learning_rate": 2.7681610243682845e-06, + "loss": 1.2322, + "step": 15994 + }, + { + "epoch": 0.48, + "learning_rate": 2.7679185103334733e-06, + "loss": 1.1709, + "step": 15995 + }, + { + "epoch": 0.48, + "learning_rate": 2.7676759937482073e-06, + "loss": 1.0615, + "step": 15996 + }, + { + "epoch": 0.48, + "learning_rate": 2.7674334746147948e-06, + "loss": 1.2061, + "step": 15997 + }, + { + "epoch": 0.48, + "learning_rate": 2.7671909529355447e-06, + "loss": 0.9898, + "step": 15998 + }, + { + "epoch": 0.48, + "learning_rate": 2.7669484287127647e-06, + "loss": 1.1786, + "step": 15999 + }, + { + "epoch": 0.48, + "learning_rate": 2.766705901948764e-06, + "loss": 1.0267, + "step": 16000 + }, + { + "epoch": 0.48, + "learning_rate": 2.7664633726458523e-06, + "loss": 1.1178, + "step": 16001 + }, + { + "epoch": 0.48, + "learning_rate": 2.7662208408063373e-06, + "loss": 1.0682, + "step": 16002 + }, + { + "epoch": 0.48, + "learning_rate": 2.7659783064325286e-06, + "loss": 1.0961, + "step": 16003 + }, + { + "epoch": 0.48, + "learning_rate": 2.765735769526734e-06, + "loss": 1.0317, + "step": 16004 + }, + { + "epoch": 0.48, + "learning_rate": 2.765493230091263e-06, + "loss": 1.1462, + "step": 16005 + }, + { + "epoch": 0.48, + "learning_rate": 2.765250688128424e-06, + "loss": 1.269, + "step": 16006 + }, + { + "epoch": 0.48, + "learning_rate": 2.765008143640526e-06, + "loss": 1.1854, + "step": 16007 + }, + { + "epoch": 0.48, + "learning_rate": 2.7647655966298786e-06, + "loss": 1.1203, + "step": 16008 + }, + { + "epoch": 0.48, + "learning_rate": 2.7645230470987905e-06, + "loss": 1.0847, + "step": 16009 + }, + { + "epoch": 0.48, + "learning_rate": 2.76428049504957e-06, + "loss": 1.1017, + "step": 16010 + }, + { + "epoch": 0.48, + "learning_rate": 2.764037940484527e-06, + "loss": 1.0447, + "step": 16011 + }, + { + "epoch": 0.48, + "learning_rate": 2.7637953834059693e-06, + "loss": 1.1434, + "step": 16012 + }, + { + "epoch": 0.48, + "learning_rate": 2.7635528238162066e-06, + "loss": 1.1839, + "step": 16013 + }, + { + "epoch": 0.48, + "learning_rate": 2.7633102617175484e-06, + "loss": 1.1732, + "step": 16014 + }, + { + "epoch": 0.48, + "learning_rate": 2.7630676971123033e-06, + "loss": 1.1641, + "step": 16015 + }, + { + "epoch": 0.48, + "learning_rate": 2.7628251300027803e-06, + "loss": 1.1755, + "step": 16016 + }, + { + "epoch": 0.48, + "learning_rate": 2.762582560391288e-06, + "loss": 1.1737, + "step": 16017 + }, + { + "epoch": 0.48, + "learning_rate": 2.7623399882801375e-06, + "loss": 1.1424, + "step": 16018 + }, + { + "epoch": 0.48, + "learning_rate": 2.7620974136716353e-06, + "loss": 1.1116, + "step": 16019 + }, + { + "epoch": 0.48, + "learning_rate": 2.761854836568093e-06, + "loss": 1.2014, + "step": 16020 + }, + { + "epoch": 0.48, + "learning_rate": 2.7616122569718186e-06, + "loss": 1.1093, + "step": 16021 + }, + { + "epoch": 0.48, + "learning_rate": 2.761369674885121e-06, + "loss": 1.1188, + "step": 16022 + }, + { + "epoch": 0.48, + "learning_rate": 2.76112709031031e-06, + "loss": 1.2332, + "step": 16023 + }, + { + "epoch": 0.48, + "learning_rate": 2.7608845032496955e-06, + "loss": 1.1252, + "step": 16024 + }, + { + "epoch": 0.48, + "learning_rate": 2.760641913705586e-06, + "loss": 1.005, + "step": 16025 + }, + { + "epoch": 0.48, + "learning_rate": 2.76039932168029e-06, + "loss": 1.1461, + "step": 16026 + }, + { + "epoch": 0.48, + "learning_rate": 2.7601567271761194e-06, + "loss": 1.0936, + "step": 16027 + }, + { + "epoch": 0.48, + "learning_rate": 2.7599141301953807e-06, + "loss": 1.1173, + "step": 16028 + }, + { + "epoch": 0.48, + "learning_rate": 2.759671530740386e-06, + "loss": 1.1788, + "step": 16029 + }, + { + "epoch": 0.48, + "learning_rate": 2.7594289288134423e-06, + "loss": 1.1644, + "step": 16030 + }, + { + "epoch": 0.48, + "learning_rate": 2.759186324416861e-06, + "loss": 1.1646, + "step": 16031 + }, + { + "epoch": 0.48, + "learning_rate": 2.75894371755295e-06, + "loss": 1.075, + "step": 16032 + }, + { + "epoch": 0.48, + "learning_rate": 2.75870110822402e-06, + "loss": 1.1077, + "step": 16033 + }, + { + "epoch": 0.48, + "learning_rate": 2.7584584964323796e-06, + "loss": 1.1254, + "step": 16034 + }, + { + "epoch": 0.48, + "learning_rate": 2.7582158821803383e-06, + "loss": 1.1395, + "step": 16035 + }, + { + "epoch": 0.48, + "learning_rate": 2.7579732654702066e-06, + "loss": 1.1824, + "step": 16036 + }, + { + "epoch": 0.48, + "learning_rate": 2.7577306463042948e-06, + "loss": 1.105, + "step": 16037 + }, + { + "epoch": 0.48, + "learning_rate": 2.75748802468491e-06, + "loss": 1.1101, + "step": 16038 + }, + { + "epoch": 0.48, + "learning_rate": 2.757245400614364e-06, + "loss": 1.0481, + "step": 16039 + }, + { + "epoch": 0.48, + "learning_rate": 2.7570027740949652e-06, + "loss": 1.0468, + "step": 16040 + }, + { + "epoch": 0.48, + "learning_rate": 2.7567601451290236e-06, + "loss": 1.0306, + "step": 16041 + }, + { + "epoch": 0.48, + "learning_rate": 2.75651751371885e-06, + "loss": 1.147, + "step": 16042 + }, + { + "epoch": 0.48, + "learning_rate": 2.756274879866752e-06, + "loss": 1.1215, + "step": 16043 + }, + { + "epoch": 0.48, + "learning_rate": 2.756032243575042e-06, + "loss": 1.2065, + "step": 16044 + }, + { + "epoch": 0.48, + "learning_rate": 2.755789604846027e-06, + "loss": 1.2151, + "step": 16045 + }, + { + "epoch": 0.48, + "learning_rate": 2.7555469636820194e-06, + "loss": 1.1773, + "step": 16046 + }, + { + "epoch": 0.48, + "learning_rate": 2.755304320085327e-06, + "loss": 0.9988, + "step": 16047 + }, + { + "epoch": 0.48, + "learning_rate": 2.7550616740582595e-06, + "loss": 1.0742, + "step": 16048 + }, + { + "epoch": 0.48, + "learning_rate": 2.754819025603129e-06, + "loss": 1.1843, + "step": 16049 + }, + { + "epoch": 0.48, + "learning_rate": 2.754576374722244e-06, + "loss": 1.1708, + "step": 16050 + }, + { + "epoch": 0.48, + "learning_rate": 2.7543337214179145e-06, + "loss": 1.0774, + "step": 16051 + }, + { + "epoch": 0.48, + "learning_rate": 2.7540910656924504e-06, + "loss": 1.084, + "step": 16052 + }, + { + "epoch": 0.48, + "learning_rate": 2.7538484075481613e-06, + "loss": 1.0947, + "step": 16053 + }, + { + "epoch": 0.48, + "learning_rate": 2.753605746987358e-06, + "loss": 1.1231, + "step": 16054 + }, + { + "epoch": 0.48, + "learning_rate": 2.7533630840123503e-06, + "loss": 1.2329, + "step": 16055 + }, + { + "epoch": 0.48, + "learning_rate": 2.753120418625448e-06, + "loss": 1.1182, + "step": 16056 + }, + { + "epoch": 0.48, + "learning_rate": 2.752877750828961e-06, + "loss": 1.0246, + "step": 16057 + }, + { + "epoch": 0.48, + "learning_rate": 2.7526350806251996e-06, + "loss": 1.1885, + "step": 16058 + }, + { + "epoch": 0.48, + "learning_rate": 2.7523924080164745e-06, + "loss": 1.1606, + "step": 16059 + }, + { + "epoch": 0.48, + "learning_rate": 2.7521497330050947e-06, + "loss": 1.1003, + "step": 16060 + }, + { + "epoch": 0.48, + "learning_rate": 2.7519070555933704e-06, + "loss": 1.1291, + "step": 16061 + }, + { + "epoch": 0.48, + "learning_rate": 2.751664375783613e-06, + "loss": 1.1488, + "step": 16062 + }, + { + "epoch": 0.48, + "learning_rate": 2.751421693578131e-06, + "loss": 1.1351, + "step": 16063 + }, + { + "epoch": 0.48, + "learning_rate": 2.7511790089792367e-06, + "loss": 1.036, + "step": 16064 + }, + { + "epoch": 0.48, + "learning_rate": 2.750936321989239e-06, + "loss": 1.1066, + "step": 16065 + }, + { + "epoch": 0.48, + "learning_rate": 2.7506936326104477e-06, + "loss": 0.9763, + "step": 16066 + }, + { + "epoch": 0.48, + "learning_rate": 2.7504509408451742e-06, + "loss": 1.1485, + "step": 16067 + }, + { + "epoch": 0.48, + "learning_rate": 2.7502082466957287e-06, + "loss": 1.2507, + "step": 16068 + }, + { + "epoch": 0.48, + "learning_rate": 2.7499655501644206e-06, + "loss": 1.185, + "step": 16069 + }, + { + "epoch": 0.48, + "learning_rate": 2.749722851253561e-06, + "loss": 1.142, + "step": 16070 + }, + { + "epoch": 0.48, + "learning_rate": 2.7494801499654604e-06, + "loss": 1.0369, + "step": 16071 + }, + { + "epoch": 0.48, + "learning_rate": 2.7492374463024293e-06, + "loss": 1.1508, + "step": 16072 + }, + { + "epoch": 0.48, + "learning_rate": 2.7489947402667767e-06, + "loss": 1.1635, + "step": 16073 + }, + { + "epoch": 0.48, + "learning_rate": 2.748752031860815e-06, + "loss": 1.2188, + "step": 16074 + }, + { + "epoch": 0.48, + "learning_rate": 2.748509321086853e-06, + "loss": 1.2054, + "step": 16075 + }, + { + "epoch": 0.48, + "learning_rate": 2.748266607947202e-06, + "loss": 1.1135, + "step": 16076 + }, + { + "epoch": 0.48, + "learning_rate": 2.7480238924441727e-06, + "loss": 1.1978, + "step": 16077 + }, + { + "epoch": 0.48, + "learning_rate": 2.747781174580076e-06, + "loss": 1.1237, + "step": 16078 + }, + { + "epoch": 0.48, + "learning_rate": 2.747538454357221e-06, + "loss": 1.2153, + "step": 16079 + }, + { + "epoch": 0.48, + "learning_rate": 2.747295731777919e-06, + "loss": 1.1854, + "step": 16080 + }, + { + "epoch": 0.48, + "learning_rate": 2.7470530068444816e-06, + "loss": 1.0599, + "step": 16081 + }, + { + "epoch": 0.48, + "learning_rate": 2.746810279559218e-06, + "loss": 1.1895, + "step": 16082 + }, + { + "epoch": 0.48, + "learning_rate": 2.74656754992444e-06, + "loss": 1.1599, + "step": 16083 + }, + { + "epoch": 0.48, + "learning_rate": 2.7463248179424567e-06, + "loss": 1.0601, + "step": 16084 + }, + { + "epoch": 0.48, + "learning_rate": 2.746082083615581e-06, + "loss": 1.211, + "step": 16085 + }, + { + "epoch": 0.48, + "learning_rate": 2.7458393469461212e-06, + "loss": 1.1449, + "step": 16086 + }, + { + "epoch": 0.48, + "learning_rate": 2.74559660793639e-06, + "loss": 1.2852, + "step": 16087 + }, + { + "epoch": 0.48, + "learning_rate": 2.745353866588697e-06, + "loss": 1.0952, + "step": 16088 + }, + { + "epoch": 0.48, + "learning_rate": 2.7451111229053534e-06, + "loss": 1.1298, + "step": 16089 + }, + { + "epoch": 0.48, + "learning_rate": 2.7448683768886695e-06, + "loss": 1.1102, + "step": 16090 + }, + { + "epoch": 0.48, + "learning_rate": 2.7446256285409578e-06, + "loss": 1.0709, + "step": 16091 + }, + { + "epoch": 0.48, + "learning_rate": 2.7443828778645267e-06, + "loss": 1.1812, + "step": 16092 + }, + { + "epoch": 0.48, + "learning_rate": 2.7441401248616883e-06, + "loss": 1.1577, + "step": 16093 + }, + { + "epoch": 0.48, + "learning_rate": 2.743897369534755e-06, + "loss": 1.1987, + "step": 16094 + }, + { + "epoch": 0.48, + "learning_rate": 2.7436546118860345e-06, + "loss": 1.0576, + "step": 16095 + }, + { + "epoch": 0.48, + "learning_rate": 2.7434118519178404e-06, + "loss": 1.1311, + "step": 16096 + }, + { + "epoch": 0.48, + "learning_rate": 2.7431690896324827e-06, + "loss": 1.1349, + "step": 16097 + }, + { + "epoch": 0.48, + "learning_rate": 2.7429263250322725e-06, + "loss": 1.0914, + "step": 16098 + }, + { + "epoch": 0.48, + "learning_rate": 2.74268355811952e-06, + "loss": 1.0321, + "step": 16099 + }, + { + "epoch": 0.49, + "learning_rate": 2.7424407888965377e-06, + "loss": 1.167, + "step": 16100 + }, + { + "epoch": 0.49, + "learning_rate": 2.742198017365635e-06, + "loss": 1.0995, + "step": 16101 + }, + { + "epoch": 0.49, + "learning_rate": 2.7419552435291234e-06, + "loss": 1.1304, + "step": 16102 + }, + { + "epoch": 0.49, + "learning_rate": 2.7417124673893158e-06, + "loss": 1.2036, + "step": 16103 + }, + { + "epoch": 0.49, + "learning_rate": 2.7414696889485216e-06, + "loss": 1.0356, + "step": 16104 + }, + { + "epoch": 0.49, + "learning_rate": 2.7412269082090514e-06, + "loss": 1.1152, + "step": 16105 + }, + { + "epoch": 0.49, + "learning_rate": 2.740984125173218e-06, + "loss": 1.2353, + "step": 16106 + }, + { + "epoch": 0.49, + "learning_rate": 2.7407413398433314e-06, + "loss": 1.0413, + "step": 16107 + }, + { + "epoch": 0.49, + "learning_rate": 2.740498552221703e-06, + "loss": 1.0149, + "step": 16108 + }, + { + "epoch": 0.49, + "learning_rate": 2.740255762310645e-06, + "loss": 1.119, + "step": 16109 + }, + { + "epoch": 0.49, + "learning_rate": 2.740012970112467e-06, + "loss": 1.165, + "step": 16110 + }, + { + "epoch": 0.49, + "learning_rate": 2.7397701756294826e-06, + "loss": 1.1661, + "step": 16111 + }, + { + "epoch": 0.49, + "learning_rate": 2.7395273788640005e-06, + "loss": 1.2197, + "step": 16112 + }, + { + "epoch": 0.49, + "learning_rate": 2.739284579818333e-06, + "loss": 1.1774, + "step": 16113 + }, + { + "epoch": 0.49, + "learning_rate": 2.7390417784947914e-06, + "loss": 1.153, + "step": 16114 + }, + { + "epoch": 0.49, + "learning_rate": 2.7387989748956884e-06, + "loss": 1.0751, + "step": 16115 + }, + { + "epoch": 0.49, + "learning_rate": 2.7385561690233324e-06, + "loss": 1.1922, + "step": 16116 + }, + { + "epoch": 0.49, + "learning_rate": 2.738313360880038e-06, + "loss": 1.2065, + "step": 16117 + }, + { + "epoch": 0.49, + "learning_rate": 2.738070550468114e-06, + "loss": 1.0917, + "step": 16118 + }, + { + "epoch": 0.49, + "learning_rate": 2.737827737789873e-06, + "loss": 1.1201, + "step": 16119 + }, + { + "epoch": 0.49, + "learning_rate": 2.737584922847628e-06, + "loss": 1.1282, + "step": 16120 + }, + { + "epoch": 0.49, + "learning_rate": 2.7373421056436876e-06, + "loss": 1.1486, + "step": 16121 + }, + { + "epoch": 0.49, + "learning_rate": 2.7370992861803657e-06, + "loss": 1.0176, + "step": 16122 + }, + { + "epoch": 0.49, + "learning_rate": 2.736856464459972e-06, + "loss": 1.1735, + "step": 16123 + }, + { + "epoch": 0.49, + "learning_rate": 2.7366136404848193e-06, + "loss": 1.1764, + "step": 16124 + }, + { + "epoch": 0.49, + "learning_rate": 2.736370814257218e-06, + "loss": 1.188, + "step": 16125 + }, + { + "epoch": 0.49, + "learning_rate": 2.7361279857794814e-06, + "loss": 1.1405, + "step": 16126 + }, + { + "epoch": 0.49, + "learning_rate": 2.7358851550539195e-06, + "loss": 1.0406, + "step": 16127 + }, + { + "epoch": 0.49, + "learning_rate": 2.735642322082845e-06, + "loss": 1.0134, + "step": 16128 + }, + { + "epoch": 0.49, + "learning_rate": 2.7353994868685685e-06, + "loss": 1.0696, + "step": 16129 + }, + { + "epoch": 0.49, + "learning_rate": 2.735156649413402e-06, + "loss": 1.2159, + "step": 16130 + }, + { + "epoch": 0.49, + "learning_rate": 2.7349138097196577e-06, + "loss": 1.0328, + "step": 16131 + }, + { + "epoch": 0.49, + "learning_rate": 2.734670967789648e-06, + "loss": 1.2195, + "step": 16132 + }, + { + "epoch": 0.49, + "learning_rate": 2.7344281236256826e-06, + "loss": 1.1967, + "step": 16133 + }, + { + "epoch": 0.49, + "learning_rate": 2.7341852772300743e-06, + "loss": 1.1661, + "step": 16134 + }, + { + "epoch": 0.49, + "learning_rate": 2.733942428605136e-06, + "loss": 1.0835, + "step": 16135 + }, + { + "epoch": 0.49, + "learning_rate": 2.7336995777531773e-06, + "loss": 1.1985, + "step": 16136 + }, + { + "epoch": 0.49, + "learning_rate": 2.733456724676512e-06, + "loss": 1.1201, + "step": 16137 + }, + { + "epoch": 0.49, + "learning_rate": 2.7332138693774508e-06, + "loss": 1.1113, + "step": 16138 + }, + { + "epoch": 0.49, + "learning_rate": 2.732971011858306e-06, + "loss": 1.1176, + "step": 16139 + }, + { + "epoch": 0.49, + "learning_rate": 2.732728152121389e-06, + "loss": 1.1664, + "step": 16140 + }, + { + "epoch": 0.49, + "learning_rate": 2.732485290169013e-06, + "loss": 0.9858, + "step": 16141 + }, + { + "epoch": 0.49, + "learning_rate": 2.732242426003488e-06, + "loss": 1.071, + "step": 16142 + }, + { + "epoch": 0.49, + "learning_rate": 2.731999559627127e-06, + "loss": 1.0351, + "step": 16143 + }, + { + "epoch": 0.49, + "learning_rate": 2.7317566910422428e-06, + "loss": 1.1217, + "step": 16144 + }, + { + "epoch": 0.49, + "learning_rate": 2.7315138202511454e-06, + "loss": 1.1962, + "step": 16145 + }, + { + "epoch": 0.49, + "learning_rate": 2.7312709472561484e-06, + "loss": 1.0366, + "step": 16146 + }, + { + "epoch": 0.49, + "learning_rate": 2.7310280720595633e-06, + "loss": 1.0448, + "step": 16147 + }, + { + "epoch": 0.49, + "learning_rate": 2.7307851946637025e-06, + "loss": 1.1024, + "step": 16148 + }, + { + "epoch": 0.49, + "learning_rate": 2.730542315070878e-06, + "loss": 1.1063, + "step": 16149 + }, + { + "epoch": 0.49, + "learning_rate": 2.7302994332834014e-06, + "loss": 1.1545, + "step": 16150 + }, + { + "epoch": 0.49, + "learning_rate": 2.730056549303585e-06, + "loss": 1.0533, + "step": 16151 + }, + { + "epoch": 0.49, + "learning_rate": 2.7298136631337412e-06, + "loss": 1.1269, + "step": 16152 + }, + { + "epoch": 0.49, + "learning_rate": 2.7295707747761818e-06, + "loss": 1.1809, + "step": 16153 + }, + { + "epoch": 0.49, + "learning_rate": 2.7293278842332193e-06, + "loss": 1.1437, + "step": 16154 + }, + { + "epoch": 0.49, + "learning_rate": 2.729084991507166e-06, + "loss": 1.0942, + "step": 16155 + }, + { + "epoch": 0.49, + "learning_rate": 2.7288420966003336e-06, + "loss": 1.1827, + "step": 16156 + }, + { + "epoch": 0.49, + "learning_rate": 2.728599199515035e-06, + "loss": 1.124, + "step": 16157 + }, + { + "epoch": 0.49, + "learning_rate": 2.7283563002535816e-06, + "loss": 1.0665, + "step": 16158 + }, + { + "epoch": 0.49, + "learning_rate": 2.7281133988182862e-06, + "loss": 1.0693, + "step": 16159 + }, + { + "epoch": 0.49, + "learning_rate": 2.727870495211461e-06, + "loss": 1.1979, + "step": 16160 + }, + { + "epoch": 0.49, + "learning_rate": 2.7276275894354194e-06, + "loss": 1.2285, + "step": 16161 + }, + { + "epoch": 0.49, + "learning_rate": 2.727384681492472e-06, + "loss": 1.1289, + "step": 16162 + }, + { + "epoch": 0.49, + "learning_rate": 2.7271417713849326e-06, + "loss": 1.1462, + "step": 16163 + }, + { + "epoch": 0.49, + "learning_rate": 2.7268988591151125e-06, + "loss": 0.9995, + "step": 16164 + }, + { + "epoch": 0.49, + "learning_rate": 2.7266559446853246e-06, + "loss": 1.0909, + "step": 16165 + }, + { + "epoch": 0.49, + "learning_rate": 2.7264130280978807e-06, + "loss": 1.0823, + "step": 16166 + }, + { + "epoch": 0.49, + "learning_rate": 2.7261701093550946e-06, + "loss": 1.1763, + "step": 16167 + }, + { + "epoch": 0.49, + "learning_rate": 2.7259271884592773e-06, + "loss": 1.3292, + "step": 16168 + }, + { + "epoch": 0.49, + "learning_rate": 2.725684265412743e-06, + "loss": 1.0997, + "step": 16169 + }, + { + "epoch": 0.49, + "learning_rate": 2.7254413402178025e-06, + "loss": 1.1576, + "step": 16170 + }, + { + "epoch": 0.49, + "learning_rate": 2.725198412876769e-06, + "loss": 1.1338, + "step": 16171 + }, + { + "epoch": 0.49, + "learning_rate": 2.724955483391955e-06, + "loss": 1.1196, + "step": 16172 + }, + { + "epoch": 0.49, + "learning_rate": 2.724712551765673e-06, + "loss": 1.2173, + "step": 16173 + }, + { + "epoch": 0.49, + "learning_rate": 2.724469618000236e-06, + "loss": 1.1686, + "step": 16174 + }, + { + "epoch": 0.49, + "learning_rate": 2.724226682097956e-06, + "loss": 1.1, + "step": 16175 + }, + { + "epoch": 0.49, + "learning_rate": 2.7239837440611473e-06, + "loss": 1.1018, + "step": 16176 + }, + { + "epoch": 0.49, + "learning_rate": 2.72374080389212e-06, + "loss": 1.1727, + "step": 16177 + }, + { + "epoch": 0.49, + "learning_rate": 2.723497861593188e-06, + "loss": 1.0082, + "step": 16178 + }, + { + "epoch": 0.49, + "learning_rate": 2.7232549171666644e-06, + "loss": 1.0677, + "step": 16179 + }, + { + "epoch": 0.49, + "learning_rate": 2.7230119706148617e-06, + "loss": 1.1005, + "step": 16180 + }, + { + "epoch": 0.49, + "learning_rate": 2.722769021940092e-06, + "loss": 1.1389, + "step": 16181 + }, + { + "epoch": 0.49, + "learning_rate": 2.722526071144669e-06, + "loss": 1.0229, + "step": 16182 + }, + { + "epoch": 0.49, + "learning_rate": 2.7222831182309047e-06, + "loss": 1.1027, + "step": 16183 + }, + { + "epoch": 0.49, + "learning_rate": 2.722040163201112e-06, + "loss": 1.0336, + "step": 16184 + }, + { + "epoch": 0.49, + "learning_rate": 2.7217972060576035e-06, + "loss": 1.0279, + "step": 16185 + }, + { + "epoch": 0.49, + "learning_rate": 2.721554246802693e-06, + "loss": 0.9888, + "step": 16186 + }, + { + "epoch": 0.49, + "learning_rate": 2.7213112854386926e-06, + "loss": 1.1224, + "step": 16187 + }, + { + "epoch": 0.49, + "learning_rate": 2.721068321967915e-06, + "loss": 1.1281, + "step": 16188 + }, + { + "epoch": 0.49, + "learning_rate": 2.7208253563926747e-06, + "loss": 1.1609, + "step": 16189 + }, + { + "epoch": 0.49, + "learning_rate": 2.7205823887152815e-06, + "loss": 1.0848, + "step": 16190 + }, + { + "epoch": 0.49, + "learning_rate": 2.720339418938052e-06, + "loss": 1.1535, + "step": 16191 + }, + { + "epoch": 0.49, + "learning_rate": 2.720096447063296e-06, + "loss": 1.0323, + "step": 16192 + }, + { + "epoch": 0.49, + "learning_rate": 2.719853473093329e-06, + "loss": 1.0972, + "step": 16193 + }, + { + "epoch": 0.49, + "learning_rate": 2.719610497030462e-06, + "loss": 1.0518, + "step": 16194 + }, + { + "epoch": 0.49, + "learning_rate": 2.7193675188770093e-06, + "loss": 1.1384, + "step": 16195 + }, + { + "epoch": 0.49, + "learning_rate": 2.7191245386352834e-06, + "loss": 1.2073, + "step": 16196 + }, + { + "epoch": 0.49, + "learning_rate": 2.718881556307597e-06, + "loss": 1.1428, + "step": 16197 + }, + { + "epoch": 0.49, + "learning_rate": 2.7186385718962637e-06, + "loss": 1.1469, + "step": 16198 + }, + { + "epoch": 0.49, + "learning_rate": 2.7183955854035964e-06, + "loss": 1.0115, + "step": 16199 + }, + { + "epoch": 0.49, + "learning_rate": 2.7181525968319084e-06, + "loss": 1.1637, + "step": 16200 + }, + { + "epoch": 0.49, + "learning_rate": 2.7179096061835133e-06, + "loss": 1.153, + "step": 16201 + }, + { + "epoch": 0.49, + "learning_rate": 2.7176666134607234e-06, + "loss": 1.2159, + "step": 16202 + }, + { + "epoch": 0.49, + "learning_rate": 2.7174236186658513e-06, + "loss": 1.1008, + "step": 16203 + }, + { + "epoch": 0.49, + "learning_rate": 2.7171806218012126e-06, + "loss": 1.1016, + "step": 16204 + }, + { + "epoch": 0.49, + "learning_rate": 2.716937622869118e-06, + "loss": 1.1647, + "step": 16205 + }, + { + "epoch": 0.49, + "learning_rate": 2.716694621871882e-06, + "loss": 1.0443, + "step": 16206 + }, + { + "epoch": 0.49, + "learning_rate": 2.7164516188118173e-06, + "loss": 1.1197, + "step": 16207 + }, + { + "epoch": 0.49, + "learning_rate": 2.716208613691238e-06, + "loss": 1.2527, + "step": 16208 + }, + { + "epoch": 0.49, + "learning_rate": 2.715965606512456e-06, + "loss": 1.1545, + "step": 16209 + }, + { + "epoch": 0.49, + "learning_rate": 2.7157225972777864e-06, + "loss": 0.9782, + "step": 16210 + }, + { + "epoch": 0.49, + "learning_rate": 2.715479585989541e-06, + "loss": 1.0524, + "step": 16211 + }, + { + "epoch": 0.49, + "learning_rate": 2.7152365726500334e-06, + "loss": 1.0975, + "step": 16212 + }, + { + "epoch": 0.49, + "learning_rate": 2.714993557261578e-06, + "loss": 1.1462, + "step": 16213 + }, + { + "epoch": 0.49, + "learning_rate": 2.714750539826486e-06, + "loss": 1.0798, + "step": 16214 + }, + { + "epoch": 0.49, + "learning_rate": 2.714507520347074e-06, + "loss": 1.0593, + "step": 16215 + }, + { + "epoch": 0.49, + "learning_rate": 2.7142644988256527e-06, + "loss": 1.0996, + "step": 16216 + }, + { + "epoch": 0.49, + "learning_rate": 2.7140214752645376e-06, + "loss": 1.1531, + "step": 16217 + }, + { + "epoch": 0.49, + "learning_rate": 2.71377844966604e-06, + "loss": 1.184, + "step": 16218 + }, + { + "epoch": 0.49, + "learning_rate": 2.713535422032476e-06, + "loss": 1.1413, + "step": 16219 + }, + { + "epoch": 0.49, + "learning_rate": 2.7132923923661565e-06, + "loss": 1.1027, + "step": 16220 + }, + { + "epoch": 0.49, + "learning_rate": 2.713049360669396e-06, + "loss": 1.2507, + "step": 16221 + }, + { + "epoch": 0.49, + "learning_rate": 2.7128063269445086e-06, + "loss": 1.1148, + "step": 16222 + }, + { + "epoch": 0.49, + "learning_rate": 2.7125632911938075e-06, + "loss": 1.065, + "step": 16223 + }, + { + "epoch": 0.49, + "learning_rate": 2.7123202534196065e-06, + "loss": 1.2606, + "step": 16224 + }, + { + "epoch": 0.49, + "learning_rate": 2.712077213624218e-06, + "loss": 1.0832, + "step": 16225 + }, + { + "epoch": 0.49, + "learning_rate": 2.711834171809958e-06, + "loss": 1.1629, + "step": 16226 + }, + { + "epoch": 0.49, + "learning_rate": 2.711591127979137e-06, + "loss": 1.1162, + "step": 16227 + }, + { + "epoch": 0.49, + "learning_rate": 2.711348082134071e-06, + "loss": 1.2245, + "step": 16228 + }, + { + "epoch": 0.49, + "learning_rate": 2.7111050342770734e-06, + "loss": 1.0168, + "step": 16229 + }, + { + "epoch": 0.49, + "learning_rate": 2.7108619844104577e-06, + "loss": 1.2194, + "step": 16230 + }, + { + "epoch": 0.49, + "learning_rate": 2.710618932536537e-06, + "loss": 1.2864, + "step": 16231 + }, + { + "epoch": 0.49, + "learning_rate": 2.710375878657626e-06, + "loss": 1.1174, + "step": 16232 + }, + { + "epoch": 0.49, + "learning_rate": 2.710132822776037e-06, + "loss": 1.1466, + "step": 16233 + }, + { + "epoch": 0.49, + "learning_rate": 2.709889764894086e-06, + "loss": 1.0679, + "step": 16234 + }, + { + "epoch": 0.49, + "learning_rate": 2.7096467050140847e-06, + "loss": 1.2128, + "step": 16235 + }, + { + "epoch": 0.49, + "learning_rate": 2.709403643138348e-06, + "loss": 1.1299, + "step": 16236 + }, + { + "epoch": 0.49, + "learning_rate": 2.7091605792691893e-06, + "loss": 1.1202, + "step": 16237 + }, + { + "epoch": 0.49, + "learning_rate": 2.708917513408923e-06, + "loss": 1.1326, + "step": 16238 + }, + { + "epoch": 0.49, + "learning_rate": 2.7086744455598625e-06, + "loss": 1.1417, + "step": 16239 + }, + { + "epoch": 0.49, + "learning_rate": 2.708431375724321e-06, + "loss": 0.9979, + "step": 16240 + }, + { + "epoch": 0.49, + "learning_rate": 2.7081883039046136e-06, + "loss": 1.075, + "step": 16241 + }, + { + "epoch": 0.49, + "learning_rate": 2.707945230103054e-06, + "loss": 1.1306, + "step": 16242 + }, + { + "epoch": 0.49, + "learning_rate": 2.7077021543219563e-06, + "loss": 1.2521, + "step": 16243 + }, + { + "epoch": 0.49, + "learning_rate": 2.707459076563633e-06, + "loss": 1.0849, + "step": 16244 + }, + { + "epoch": 0.49, + "learning_rate": 2.7072159968304007e-06, + "loss": 1.2342, + "step": 16245 + }, + { + "epoch": 0.49, + "learning_rate": 2.7069729151245712e-06, + "loss": 0.9863, + "step": 16246 + }, + { + "epoch": 0.49, + "learning_rate": 2.7067298314484592e-06, + "loss": 1.0994, + "step": 16247 + }, + { + "epoch": 0.49, + "learning_rate": 2.706486745804379e-06, + "loss": 1.0363, + "step": 16248 + }, + { + "epoch": 0.49, + "learning_rate": 2.7062436581946437e-06, + "loss": 1.1758, + "step": 16249 + }, + { + "epoch": 0.49, + "learning_rate": 2.706000568621569e-06, + "loss": 1.1384, + "step": 16250 + }, + { + "epoch": 0.49, + "learning_rate": 2.705757477087468e-06, + "loss": 1.1237, + "step": 16251 + }, + { + "epoch": 0.49, + "learning_rate": 2.705514383594654e-06, + "loss": 1.071, + "step": 16252 + }, + { + "epoch": 0.49, + "learning_rate": 2.705271288145443e-06, + "loss": 1.2394, + "step": 16253 + }, + { + "epoch": 0.49, + "learning_rate": 2.7050281907421473e-06, + "loss": 1.0516, + "step": 16254 + }, + { + "epoch": 0.49, + "learning_rate": 2.704785091387082e-06, + "loss": 1.2152, + "step": 16255 + }, + { + "epoch": 0.49, + "learning_rate": 2.7045419900825626e-06, + "loss": 1.2141, + "step": 16256 + }, + { + "epoch": 0.49, + "learning_rate": 2.7042988868309004e-06, + "loss": 1.1366, + "step": 16257 + }, + { + "epoch": 0.49, + "learning_rate": 2.7040557816344125e-06, + "loss": 1.1832, + "step": 16258 + }, + { + "epoch": 0.49, + "learning_rate": 2.7038126744954112e-06, + "loss": 1.1533, + "step": 16259 + }, + { + "epoch": 0.49, + "learning_rate": 2.703569565416212e-06, + "loss": 1.1017, + "step": 16260 + }, + { + "epoch": 0.49, + "learning_rate": 2.703326454399128e-06, + "loss": 1.1273, + "step": 16261 + }, + { + "epoch": 0.49, + "learning_rate": 2.703083341446474e-06, + "loss": 1.1221, + "step": 16262 + }, + { + "epoch": 0.49, + "learning_rate": 2.7028402265605645e-06, + "loss": 1.1063, + "step": 16263 + }, + { + "epoch": 0.49, + "learning_rate": 2.702597109743714e-06, + "loss": 1.0961, + "step": 16264 + }, + { + "epoch": 0.49, + "learning_rate": 2.7023539909982367e-06, + "loss": 1.1641, + "step": 16265 + }, + { + "epoch": 0.49, + "learning_rate": 2.702110870326446e-06, + "loss": 1.0535, + "step": 16266 + }, + { + "epoch": 0.49, + "learning_rate": 2.701867747730658e-06, + "loss": 1.0539, + "step": 16267 + }, + { + "epoch": 0.49, + "learning_rate": 2.701624623213186e-06, + "loss": 1.3209, + "step": 16268 + }, + { + "epoch": 0.49, + "learning_rate": 2.701381496776344e-06, + "loss": 1.2203, + "step": 16269 + }, + { + "epoch": 0.49, + "learning_rate": 2.701138368422448e-06, + "loss": 1.1614, + "step": 16270 + }, + { + "epoch": 0.49, + "learning_rate": 2.700895238153811e-06, + "loss": 1.0237, + "step": 16271 + }, + { + "epoch": 0.49, + "learning_rate": 2.7006521059727488e-06, + "loss": 1.0729, + "step": 16272 + }, + { + "epoch": 0.49, + "learning_rate": 2.700408971881575e-06, + "loss": 1.1751, + "step": 16273 + }, + { + "epoch": 0.49, + "learning_rate": 2.700165835882604e-06, + "loss": 1.1071, + "step": 16274 + }, + { + "epoch": 0.49, + "learning_rate": 2.6999226979781514e-06, + "loss": 1.0557, + "step": 16275 + }, + { + "epoch": 0.49, + "learning_rate": 2.6996795581705297e-06, + "loss": 1.1005, + "step": 16276 + }, + { + "epoch": 0.49, + "learning_rate": 2.6994364164620564e-06, + "loss": 1.1377, + "step": 16277 + }, + { + "epoch": 0.49, + "learning_rate": 2.699193272855043e-06, + "loss": 1.1104, + "step": 16278 + }, + { + "epoch": 0.49, + "learning_rate": 2.6989501273518058e-06, + "loss": 1.2094, + "step": 16279 + }, + { + "epoch": 0.49, + "learning_rate": 2.69870697995466e-06, + "loss": 1.1356, + "step": 16280 + }, + { + "epoch": 0.49, + "learning_rate": 2.698463830665919e-06, + "loss": 1.1298, + "step": 16281 + }, + { + "epoch": 0.49, + "learning_rate": 2.6982206794878973e-06, + "loss": 1.0122, + "step": 16282 + }, + { + "epoch": 0.49, + "learning_rate": 2.6979775264229107e-06, + "loss": 1.1778, + "step": 16283 + }, + { + "epoch": 0.49, + "learning_rate": 2.697734371473274e-06, + "loss": 1.165, + "step": 16284 + }, + { + "epoch": 0.49, + "learning_rate": 2.6974912146413006e-06, + "loss": 1.2074, + "step": 16285 + }, + { + "epoch": 0.49, + "learning_rate": 2.6972480559293062e-06, + "loss": 1.1784, + "step": 16286 + }, + { + "epoch": 0.49, + "learning_rate": 2.697004895339605e-06, + "loss": 1.1812, + "step": 16287 + }, + { + "epoch": 0.49, + "learning_rate": 2.6967617328745127e-06, + "loss": 1.1143, + "step": 16288 + }, + { + "epoch": 0.49, + "learning_rate": 2.6965185685363433e-06, + "loss": 1.1572, + "step": 16289 + }, + { + "epoch": 0.49, + "learning_rate": 2.696275402327412e-06, + "loss": 1.0795, + "step": 16290 + }, + { + "epoch": 0.49, + "learning_rate": 2.696032234250032e-06, + "loss": 1.1423, + "step": 16291 + }, + { + "epoch": 0.49, + "learning_rate": 2.695789064306521e-06, + "loss": 1.2546, + "step": 16292 + }, + { + "epoch": 0.49, + "learning_rate": 2.6955458924991924e-06, + "loss": 1.0999, + "step": 16293 + }, + { + "epoch": 0.49, + "learning_rate": 2.6953027188303597e-06, + "loss": 1.1105, + "step": 16294 + }, + { + "epoch": 0.49, + "learning_rate": 2.69505954330234e-06, + "loss": 1.0972, + "step": 16295 + }, + { + "epoch": 0.49, + "learning_rate": 2.6948163659174476e-06, + "loss": 1.1732, + "step": 16296 + }, + { + "epoch": 0.49, + "learning_rate": 2.6945731866779973e-06, + "loss": 1.2339, + "step": 16297 + }, + { + "epoch": 0.49, + "learning_rate": 2.6943300055863036e-06, + "loss": 1.1475, + "step": 16298 + }, + { + "epoch": 0.49, + "learning_rate": 2.6940868226446827e-06, + "loss": 1.1474, + "step": 16299 + }, + { + "epoch": 0.49, + "learning_rate": 2.693843637855448e-06, + "loss": 1.1157, + "step": 16300 + }, + { + "epoch": 0.49, + "learning_rate": 2.693600451220915e-06, + "loss": 1.1985, + "step": 16301 + }, + { + "epoch": 0.49, + "learning_rate": 2.693357262743399e-06, + "loss": 1.114, + "step": 16302 + }, + { + "epoch": 0.49, + "learning_rate": 2.693114072425216e-06, + "loss": 1.2533, + "step": 16303 + }, + { + "epoch": 0.49, + "learning_rate": 2.6928708802686788e-06, + "loss": 1.2197, + "step": 16304 + }, + { + "epoch": 0.49, + "learning_rate": 2.6926276862761036e-06, + "loss": 1.0855, + "step": 16305 + }, + { + "epoch": 0.49, + "learning_rate": 2.692384490449807e-06, + "loss": 1.1702, + "step": 16306 + }, + { + "epoch": 0.49, + "learning_rate": 2.6921412927921015e-06, + "loss": 1.1601, + "step": 16307 + }, + { + "epoch": 0.49, + "learning_rate": 2.6918980933053035e-06, + "loss": 1.0528, + "step": 16308 + }, + { + "epoch": 0.49, + "learning_rate": 2.6916548919917286e-06, + "loss": 1.0484, + "step": 16309 + }, + { + "epoch": 0.49, + "learning_rate": 2.6914116888536913e-06, + "loss": 1.2371, + "step": 16310 + }, + { + "epoch": 0.49, + "learning_rate": 2.6911684838935066e-06, + "loss": 1.1931, + "step": 16311 + }, + { + "epoch": 0.49, + "learning_rate": 2.69092527711349e-06, + "loss": 1.2063, + "step": 16312 + }, + { + "epoch": 0.49, + "learning_rate": 2.6906820685159567e-06, + "loss": 1.1242, + "step": 16313 + }, + { + "epoch": 0.49, + "learning_rate": 2.6904388581032226e-06, + "loss": 1.1718, + "step": 16314 + }, + { + "epoch": 0.49, + "learning_rate": 2.690195645877602e-06, + "loss": 1.033, + "step": 16315 + }, + { + "epoch": 0.49, + "learning_rate": 2.6899524318414103e-06, + "loss": 1.0667, + "step": 16316 + }, + { + "epoch": 0.49, + "learning_rate": 2.6897092159969628e-06, + "loss": 1.1906, + "step": 16317 + }, + { + "epoch": 0.49, + "learning_rate": 2.6894659983465753e-06, + "loss": 1.0877, + "step": 16318 + }, + { + "epoch": 0.49, + "learning_rate": 2.6892227788925625e-06, + "loss": 1.2109, + "step": 16319 + }, + { + "epoch": 0.49, + "learning_rate": 2.6889795576372397e-06, + "loss": 1.1696, + "step": 16320 + }, + { + "epoch": 0.49, + "learning_rate": 2.688736334582923e-06, + "loss": 1.1514, + "step": 16321 + }, + { + "epoch": 0.49, + "learning_rate": 2.688493109731927e-06, + "loss": 1.0701, + "step": 16322 + }, + { + "epoch": 0.49, + "learning_rate": 2.6882498830865673e-06, + "loss": 1.2657, + "step": 16323 + }, + { + "epoch": 0.49, + "learning_rate": 2.6880066546491594e-06, + "loss": 1.1025, + "step": 16324 + }, + { + "epoch": 0.49, + "learning_rate": 2.687763424422019e-06, + "loss": 1.2386, + "step": 16325 + }, + { + "epoch": 0.49, + "learning_rate": 2.687520192407461e-06, + "loss": 1.1917, + "step": 16326 + }, + { + "epoch": 0.49, + "learning_rate": 2.6872769586078018e-06, + "loss": 1.1006, + "step": 16327 + }, + { + "epoch": 0.49, + "learning_rate": 2.687033723025355e-06, + "loss": 1.0901, + "step": 16328 + }, + { + "epoch": 0.49, + "learning_rate": 2.686790485662438e-06, + "loss": 1.1181, + "step": 16329 + }, + { + "epoch": 0.49, + "learning_rate": 2.686547246521365e-06, + "loss": 1.157, + "step": 16330 + }, + { + "epoch": 0.49, + "learning_rate": 2.6863040056044533e-06, + "loss": 1.186, + "step": 16331 + }, + { + "epoch": 0.49, + "learning_rate": 2.6860607629140156e-06, + "loss": 1.073, + "step": 16332 + }, + { + "epoch": 0.49, + "learning_rate": 2.6858175184523694e-06, + "loss": 1.0871, + "step": 16333 + }, + { + "epoch": 0.49, + "learning_rate": 2.6855742722218303e-06, + "loss": 1.0262, + "step": 16334 + }, + { + "epoch": 0.49, + "learning_rate": 2.6853310242247134e-06, + "loss": 1.141, + "step": 16335 + }, + { + "epoch": 0.49, + "learning_rate": 2.685087774463334e-06, + "loss": 1.1243, + "step": 16336 + }, + { + "epoch": 0.49, + "learning_rate": 2.684844522940009e-06, + "loss": 1.2472, + "step": 16337 + }, + { + "epoch": 0.49, + "learning_rate": 2.6846012696570527e-06, + "loss": 1.0868, + "step": 16338 + }, + { + "epoch": 0.49, + "learning_rate": 2.6843580146167806e-06, + "loss": 1.1002, + "step": 16339 + }, + { + "epoch": 0.49, + "learning_rate": 2.6841147578215105e-06, + "loss": 1.2405, + "step": 16340 + }, + { + "epoch": 0.49, + "learning_rate": 2.6838714992735555e-06, + "loss": 1.1787, + "step": 16341 + }, + { + "epoch": 0.49, + "learning_rate": 2.683628238975233e-06, + "loss": 1.1547, + "step": 16342 + }, + { + "epoch": 0.49, + "learning_rate": 2.6833849769288573e-06, + "loss": 1.112, + "step": 16343 + }, + { + "epoch": 0.49, + "learning_rate": 2.6831417131367456e-06, + "loss": 1.1737, + "step": 16344 + }, + { + "epoch": 0.49, + "learning_rate": 2.6828984476012127e-06, + "loss": 1.111, + "step": 16345 + }, + { + "epoch": 0.49, + "learning_rate": 2.6826551803245743e-06, + "loss": 1.0966, + "step": 16346 + }, + { + "epoch": 0.49, + "learning_rate": 2.682411911309147e-06, + "loss": 1.1732, + "step": 16347 + }, + { + "epoch": 0.49, + "learning_rate": 2.682168640557246e-06, + "loss": 1.1445, + "step": 16348 + }, + { + "epoch": 0.49, + "learning_rate": 2.681925368071187e-06, + "loss": 1.2224, + "step": 16349 + }, + { + "epoch": 0.49, + "learning_rate": 2.6816820938532873e-06, + "loss": 1.209, + "step": 16350 + }, + { + "epoch": 0.49, + "learning_rate": 2.68143881790586e-06, + "loss": 1.1494, + "step": 16351 + }, + { + "epoch": 0.49, + "learning_rate": 2.6811955402312232e-06, + "loss": 1.0744, + "step": 16352 + }, + { + "epoch": 0.49, + "learning_rate": 2.680952260831693e-06, + "loss": 1.0465, + "step": 16353 + }, + { + "epoch": 0.49, + "learning_rate": 2.6807089797095833e-06, + "loss": 1.1115, + "step": 16354 + }, + { + "epoch": 0.49, + "learning_rate": 2.6804656968672115e-06, + "loss": 1.1699, + "step": 16355 + }, + { + "epoch": 0.49, + "learning_rate": 2.6802224123068933e-06, + "loss": 1.2184, + "step": 16356 + }, + { + "epoch": 0.49, + "learning_rate": 2.6799791260309447e-06, + "loss": 1.123, + "step": 16357 + }, + { + "epoch": 0.49, + "learning_rate": 2.679735838041681e-06, + "loss": 1.0979, + "step": 16358 + }, + { + "epoch": 0.49, + "learning_rate": 2.6794925483414187e-06, + "loss": 1.1146, + "step": 16359 + }, + { + "epoch": 0.49, + "learning_rate": 2.679249256932474e-06, + "loss": 1.2062, + "step": 16360 + }, + { + "epoch": 0.49, + "learning_rate": 2.679005963817163e-06, + "loss": 1.027, + "step": 16361 + }, + { + "epoch": 0.49, + "learning_rate": 2.678762668997801e-06, + "loss": 1.1417, + "step": 16362 + }, + { + "epoch": 0.49, + "learning_rate": 2.6785193724767045e-06, + "loss": 1.1116, + "step": 16363 + }, + { + "epoch": 0.49, + "learning_rate": 2.67827607425619e-06, + "loss": 1.0894, + "step": 16364 + }, + { + "epoch": 0.49, + "learning_rate": 2.678032774338572e-06, + "loss": 1.0458, + "step": 16365 + }, + { + "epoch": 0.49, + "learning_rate": 2.677789472726169e-06, + "loss": 1.0014, + "step": 16366 + }, + { + "epoch": 0.49, + "learning_rate": 2.677546169421295e-06, + "loss": 1.1577, + "step": 16367 + }, + { + "epoch": 0.49, + "learning_rate": 2.6773028644262676e-06, + "loss": 1.1682, + "step": 16368 + }, + { + "epoch": 0.49, + "learning_rate": 2.677059557743402e-06, + "loss": 1.1899, + "step": 16369 + }, + { + "epoch": 0.49, + "learning_rate": 2.676816249375015e-06, + "loss": 1.0936, + "step": 16370 + }, + { + "epoch": 0.49, + "learning_rate": 2.676572939323422e-06, + "loss": 1.0131, + "step": 16371 + }, + { + "epoch": 0.49, + "learning_rate": 2.6763296275909394e-06, + "loss": 0.9768, + "step": 16372 + }, + { + "epoch": 0.49, + "learning_rate": 2.676086314179885e-06, + "loss": 1.1167, + "step": 16373 + }, + { + "epoch": 0.49, + "learning_rate": 2.6758429990925727e-06, + "loss": 1.0216, + "step": 16374 + }, + { + "epoch": 0.49, + "learning_rate": 2.67559968233132e-06, + "loss": 1.1259, + "step": 16375 + }, + { + "epoch": 0.49, + "learning_rate": 2.6753563638984424e-06, + "loss": 1.123, + "step": 16376 + }, + { + "epoch": 0.49, + "learning_rate": 2.6751130437962567e-06, + "loss": 1.1638, + "step": 16377 + }, + { + "epoch": 0.49, + "learning_rate": 2.6748697220270797e-06, + "loss": 1.1241, + "step": 16378 + }, + { + "epoch": 0.49, + "learning_rate": 2.6746263985932267e-06, + "loss": 1.2039, + "step": 16379 + }, + { + "epoch": 0.49, + "learning_rate": 2.674383073497015e-06, + "loss": 1.1835, + "step": 16380 + }, + { + "epoch": 0.49, + "learning_rate": 2.6741397467407603e-06, + "loss": 1.1512, + "step": 16381 + }, + { + "epoch": 0.49, + "learning_rate": 2.6738964183267792e-06, + "loss": 1.11, + "step": 16382 + }, + { + "epoch": 0.49, + "learning_rate": 2.673653088257388e-06, + "loss": 1.0912, + "step": 16383 + }, + { + "epoch": 0.49, + "learning_rate": 2.673409756534902e-06, + "loss": 1.0038, + "step": 16384 + }, + { + "epoch": 0.49, + "learning_rate": 2.6731664231616392e-06, + "loss": 1.1285, + "step": 16385 + }, + { + "epoch": 0.49, + "learning_rate": 2.6729230881399165e-06, + "loss": 1.0875, + "step": 16386 + }, + { + "epoch": 0.49, + "learning_rate": 2.6726797514720483e-06, + "loss": 1.2291, + "step": 16387 + }, + { + "epoch": 0.49, + "learning_rate": 2.672436413160352e-06, + "loss": 1.1127, + "step": 16388 + }, + { + "epoch": 0.49, + "learning_rate": 2.6721930732071442e-06, + "loss": 1.1823, + "step": 16389 + }, + { + "epoch": 0.49, + "learning_rate": 2.6719497316147412e-06, + "loss": 1.1365, + "step": 16390 + }, + { + "epoch": 0.49, + "learning_rate": 2.6717063883854598e-06, + "loss": 0.9999, + "step": 16391 + }, + { + "epoch": 0.49, + "learning_rate": 2.671463043521616e-06, + "loss": 1.1047, + "step": 16392 + }, + { + "epoch": 0.49, + "learning_rate": 2.6712196970255267e-06, + "loss": 1.1946, + "step": 16393 + }, + { + "epoch": 0.49, + "learning_rate": 2.670976348899509e-06, + "loss": 1.1218, + "step": 16394 + }, + { + "epoch": 0.49, + "learning_rate": 2.6707329991458774e-06, + "loss": 1.117, + "step": 16395 + }, + { + "epoch": 0.49, + "learning_rate": 2.670489647766951e-06, + "loss": 1.071, + "step": 16396 + }, + { + "epoch": 0.49, + "learning_rate": 2.6702462947650447e-06, + "loss": 1.154, + "step": 16397 + }, + { + "epoch": 0.49, + "learning_rate": 2.670002940142476e-06, + "loss": 1.1116, + "step": 16398 + }, + { + "epoch": 0.49, + "learning_rate": 2.669759583901562e-06, + "loss": 1.133, + "step": 16399 + }, + { + "epoch": 0.49, + "learning_rate": 2.669516226044617e-06, + "loss": 1.1386, + "step": 16400 + }, + { + "epoch": 0.49, + "learning_rate": 2.6692728665739597e-06, + "loss": 1.1048, + "step": 16401 + }, + { + "epoch": 0.49, + "learning_rate": 2.6690295054919063e-06, + "loss": 1.0625, + "step": 16402 + }, + { + "epoch": 0.49, + "learning_rate": 2.668786142800774e-06, + "loss": 1.1882, + "step": 16403 + }, + { + "epoch": 0.49, + "learning_rate": 2.6685427785028783e-06, + "loss": 1.2377, + "step": 16404 + }, + { + "epoch": 0.49, + "learning_rate": 2.668299412600536e-06, + "loss": 1.1736, + "step": 16405 + }, + { + "epoch": 0.49, + "learning_rate": 2.6680560450960646e-06, + "loss": 1.1854, + "step": 16406 + }, + { + "epoch": 0.49, + "learning_rate": 2.6678126759917816e-06, + "loss": 1.0002, + "step": 16407 + }, + { + "epoch": 0.49, + "learning_rate": 2.667569305290002e-06, + "loss": 1.1433, + "step": 16408 + }, + { + "epoch": 0.49, + "learning_rate": 2.6673259329930435e-06, + "loss": 0.9651, + "step": 16409 + }, + { + "epoch": 0.49, + "learning_rate": 2.667082559103222e-06, + "loss": 1.1854, + "step": 16410 + }, + { + "epoch": 0.49, + "learning_rate": 2.6668391836228563e-06, + "loss": 1.0206, + "step": 16411 + }, + { + "epoch": 0.49, + "learning_rate": 2.666595806554261e-06, + "loss": 1.2062, + "step": 16412 + }, + { + "epoch": 0.49, + "learning_rate": 2.666352427899754e-06, + "loss": 1.1327, + "step": 16413 + }, + { + "epoch": 0.49, + "learning_rate": 2.6661090476616527e-06, + "loss": 1.1321, + "step": 16414 + }, + { + "epoch": 0.49, + "learning_rate": 2.6658656658422722e-06, + "loss": 1.212, + "step": 16415 + }, + { + "epoch": 0.49, + "learning_rate": 2.665622282443931e-06, + "loss": 1.222, + "step": 16416 + }, + { + "epoch": 0.49, + "learning_rate": 2.6653788974689453e-06, + "loss": 1.15, + "step": 16417 + }, + { + "epoch": 0.49, + "learning_rate": 2.665135510919632e-06, + "loss": 1.1836, + "step": 16418 + }, + { + "epoch": 0.49, + "learning_rate": 2.6648921227983083e-06, + "loss": 1.1082, + "step": 16419 + }, + { + "epoch": 0.49, + "learning_rate": 2.664648733107291e-06, + "loss": 1.0963, + "step": 16420 + }, + { + "epoch": 0.49, + "learning_rate": 2.664405341848897e-06, + "loss": 1.0835, + "step": 16421 + }, + { + "epoch": 0.49, + "learning_rate": 2.664161949025444e-06, + "loss": 1.1815, + "step": 16422 + }, + { + "epoch": 0.49, + "learning_rate": 2.663918554639247e-06, + "loss": 1.153, + "step": 16423 + }, + { + "epoch": 0.49, + "learning_rate": 2.6636751586926255e-06, + "loss": 1.1642, + "step": 16424 + }, + { + "epoch": 0.49, + "learning_rate": 2.6634317611878945e-06, + "loss": 1.2688, + "step": 16425 + }, + { + "epoch": 0.49, + "learning_rate": 2.6631883621273723e-06, + "loss": 1.1171, + "step": 16426 + }, + { + "epoch": 0.49, + "learning_rate": 2.6629449615133755e-06, + "loss": 1.1241, + "step": 16427 + }, + { + "epoch": 0.49, + "learning_rate": 2.662701559348221e-06, + "loss": 1.0867, + "step": 16428 + }, + { + "epoch": 0.49, + "learning_rate": 2.6624581556342268e-06, + "loss": 1.0283, + "step": 16429 + }, + { + "epoch": 0.49, + "learning_rate": 2.662214750373708e-06, + "loss": 1.1674, + "step": 16430 + }, + { + "epoch": 0.49, + "learning_rate": 2.661971343568983e-06, + "loss": 1.1182, + "step": 16431 + }, + { + "epoch": 0.5, + "learning_rate": 2.6617279352223695e-06, + "loss": 1.0688, + "step": 16432 + }, + { + "epoch": 0.5, + "learning_rate": 2.661484525336183e-06, + "loss": 1.0829, + "step": 16433 + }, + { + "epoch": 0.5, + "learning_rate": 2.6612411139127424e-06, + "loss": 1.0527, + "step": 16434 + }, + { + "epoch": 0.5, + "learning_rate": 2.660997700954364e-06, + "loss": 1.1825, + "step": 16435 + }, + { + "epoch": 0.5, + "learning_rate": 2.660754286463365e-06, + "loss": 1.1137, + "step": 16436 + }, + { + "epoch": 0.5, + "learning_rate": 2.6605108704420627e-06, + "loss": 1.176, + "step": 16437 + }, + { + "epoch": 0.5, + "learning_rate": 2.6602674528927743e-06, + "loss": 1.1696, + "step": 16438 + }, + { + "epoch": 0.5, + "learning_rate": 2.6600240338178164e-06, + "loss": 1.2024, + "step": 16439 + }, + { + "epoch": 0.5, + "learning_rate": 2.659780613219507e-06, + "loss": 1.16, + "step": 16440 + }, + { + "epoch": 0.5, + "learning_rate": 2.6595371911001625e-06, + "loss": 0.9632, + "step": 16441 + }, + { + "epoch": 0.5, + "learning_rate": 2.6592937674621023e-06, + "loss": 1.1301, + "step": 16442 + }, + { + "epoch": 0.5, + "learning_rate": 2.659050342307641e-06, + "loss": 0.9903, + "step": 16443 + }, + { + "epoch": 0.5, + "learning_rate": 2.658806915639098e-06, + "loss": 1.0276, + "step": 16444 + }, + { + "epoch": 0.5, + "learning_rate": 2.6585634874587882e-06, + "loss": 1.1776, + "step": 16445 + }, + { + "epoch": 0.5, + "learning_rate": 2.658320057769031e-06, + "loss": 1.1405, + "step": 16446 + }, + { + "epoch": 0.5, + "learning_rate": 2.658076626572143e-06, + "loss": 1.1509, + "step": 16447 + }, + { + "epoch": 0.5, + "learning_rate": 2.657833193870442e-06, + "loss": 1.0981, + "step": 16448 + }, + { + "epoch": 0.5, + "learning_rate": 2.6575897596662448e-06, + "loss": 1.162, + "step": 16449 + }, + { + "epoch": 0.5, + "learning_rate": 2.65734632396187e-06, + "loss": 1.0261, + "step": 16450 + }, + { + "epoch": 0.5, + "learning_rate": 2.6571028867596327e-06, + "loss": 0.9948, + "step": 16451 + }, + { + "epoch": 0.5, + "learning_rate": 2.6568594480618514e-06, + "loss": 1.1669, + "step": 16452 + }, + { + "epoch": 0.5, + "learning_rate": 2.6566160078708446e-06, + "loss": 1.0821, + "step": 16453 + }, + { + "epoch": 0.5, + "learning_rate": 2.6563725661889285e-06, + "loss": 1.2504, + "step": 16454 + }, + { + "epoch": 0.5, + "learning_rate": 2.656129123018421e-06, + "loss": 1.1358, + "step": 16455 + }, + { + "epoch": 0.5, + "learning_rate": 2.655885678361639e-06, + "loss": 1.1837, + "step": 16456 + }, + { + "epoch": 0.5, + "learning_rate": 2.6556422322209006e-06, + "loss": 1.2019, + "step": 16457 + }, + { + "epoch": 0.5, + "learning_rate": 2.6553987845985235e-06, + "loss": 1.0967, + "step": 16458 + }, + { + "epoch": 0.5, + "learning_rate": 2.655155335496824e-06, + "loss": 1.1907, + "step": 16459 + }, + { + "epoch": 0.5, + "learning_rate": 2.654911884918121e-06, + "loss": 1.2303, + "step": 16460 + }, + { + "epoch": 0.5, + "learning_rate": 2.654668432864732e-06, + "loss": 1.1834, + "step": 16461 + }, + { + "epoch": 0.5, + "learning_rate": 2.6544249793389733e-06, + "loss": 1.2109, + "step": 16462 + }, + { + "epoch": 0.5, + "learning_rate": 2.6541815243431634e-06, + "loss": 1.1489, + "step": 16463 + }, + { + "epoch": 0.5, + "learning_rate": 2.6539380678796194e-06, + "loss": 1.1683, + "step": 16464 + }, + { + "epoch": 0.5, + "learning_rate": 2.653694609950659e-06, + "loss": 1.096, + "step": 16465 + }, + { + "epoch": 0.5, + "learning_rate": 2.6534511505586e-06, + "loss": 1.109, + "step": 16466 + }, + { + "epoch": 0.5, + "learning_rate": 2.6532076897057607e-06, + "loss": 1.1473, + "step": 16467 + }, + { + "epoch": 0.5, + "learning_rate": 2.652964227394458e-06, + "loss": 1.0883, + "step": 16468 + }, + { + "epoch": 0.5, + "learning_rate": 2.6527207636270086e-06, + "loss": 1.1163, + "step": 16469 + }, + { + "epoch": 0.5, + "learning_rate": 2.6524772984057318e-06, + "loss": 1.0175, + "step": 16470 + }, + { + "epoch": 0.5, + "learning_rate": 2.6522338317329438e-06, + "loss": 1.1592, + "step": 16471 + }, + { + "epoch": 0.5, + "learning_rate": 2.6519903636109632e-06, + "loss": 1.1376, + "step": 16472 + }, + { + "epoch": 0.5, + "learning_rate": 2.651746894042108e-06, + "loss": 1.174, + "step": 16473 + }, + { + "epoch": 0.5, + "learning_rate": 2.651503423028695e-06, + "loss": 1.0832, + "step": 16474 + }, + { + "epoch": 0.5, + "learning_rate": 2.6512599505730425e-06, + "loss": 1.1268, + "step": 16475 + }, + { + "epoch": 0.5, + "learning_rate": 2.6510164766774686e-06, + "loss": 1.0908, + "step": 16476 + }, + { + "epoch": 0.5, + "learning_rate": 2.65077300134429e-06, + "loss": 1.1699, + "step": 16477 + }, + { + "epoch": 0.5, + "learning_rate": 2.650529524575825e-06, + "loss": 1.0605, + "step": 16478 + }, + { + "epoch": 0.5, + "learning_rate": 2.6502860463743922e-06, + "loss": 1.0557, + "step": 16479 + }, + { + "epoch": 0.5, + "learning_rate": 2.650042566742308e-06, + "loss": 1.1394, + "step": 16480 + }, + { + "epoch": 0.5, + "learning_rate": 2.649799085681891e-06, + "loss": 1.1137, + "step": 16481 + }, + { + "epoch": 0.5, + "learning_rate": 2.6495556031954588e-06, + "loss": 1.1036, + "step": 16482 + }, + { + "epoch": 0.5, + "learning_rate": 2.649312119285329e-06, + "loss": 1.118, + "step": 16483 + }, + { + "epoch": 0.5, + "learning_rate": 2.6490686339538203e-06, + "loss": 0.9872, + "step": 16484 + }, + { + "epoch": 0.5, + "learning_rate": 2.64882514720325e-06, + "loss": 1.0922, + "step": 16485 + }, + { + "epoch": 0.5, + "learning_rate": 2.6485816590359354e-06, + "loss": 1.1678, + "step": 16486 + }, + { + "epoch": 0.5, + "learning_rate": 2.6483381694541947e-06, + "loss": 1.1927, + "step": 16487 + }, + { + "epoch": 0.5, + "learning_rate": 2.648094678460347e-06, + "loss": 1.1893, + "step": 16488 + }, + { + "epoch": 0.5, + "learning_rate": 2.647851186056709e-06, + "loss": 1.0967, + "step": 16489 + }, + { + "epoch": 0.5, + "learning_rate": 2.6476076922455983e-06, + "loss": 1.1441, + "step": 16490 + }, + { + "epoch": 0.5, + "learning_rate": 2.647364197029334e-06, + "loss": 1.1124, + "step": 16491 + }, + { + "epoch": 0.5, + "learning_rate": 2.647120700410234e-06, + "loss": 1.1, + "step": 16492 + }, + { + "epoch": 0.5, + "learning_rate": 2.646877202390615e-06, + "loss": 1.1007, + "step": 16493 + }, + { + "epoch": 0.5, + "learning_rate": 2.646633702972796e-06, + "loss": 1.1766, + "step": 16494 + }, + { + "epoch": 0.5, + "learning_rate": 2.646390202159095e-06, + "loss": 1.0137, + "step": 16495 + }, + { + "epoch": 0.5, + "learning_rate": 2.6461466999518296e-06, + "loss": 1.0421, + "step": 16496 + }, + { + "epoch": 0.5, + "learning_rate": 2.6459031963533183e-06, + "loss": 1.1744, + "step": 16497 + }, + { + "epoch": 0.5, + "learning_rate": 2.6456596913658788e-06, + "loss": 1.1777, + "step": 16498 + }, + { + "epoch": 0.5, + "learning_rate": 2.6454161849918285e-06, + "loss": 1.3663, + "step": 16499 + }, + { + "epoch": 0.5, + "learning_rate": 2.6451726772334863e-06, + "loss": 1.1062, + "step": 16500 + }, + { + "epoch": 0.5, + "learning_rate": 2.6449291680931705e-06, + "loss": 1.1226, + "step": 16501 + }, + { + "epoch": 0.5, + "learning_rate": 2.644685657573199e-06, + "loss": 1.0723, + "step": 16502 + }, + { + "epoch": 0.5, + "learning_rate": 2.644442145675889e-06, + "loss": 1.2527, + "step": 16503 + }, + { + "epoch": 0.5, + "learning_rate": 2.64419863240356e-06, + "loss": 1.1442, + "step": 16504 + }, + { + "epoch": 0.5, + "learning_rate": 2.643955117758529e-06, + "loss": 1.1694, + "step": 16505 + }, + { + "epoch": 0.5, + "learning_rate": 2.6437116017431154e-06, + "loss": 1.1255, + "step": 16506 + }, + { + "epoch": 0.5, + "learning_rate": 2.6434680843596362e-06, + "loss": 0.9567, + "step": 16507 + }, + { + "epoch": 0.5, + "learning_rate": 2.6432245656104092e-06, + "loss": 0.9895, + "step": 16508 + }, + { + "epoch": 0.5, + "learning_rate": 2.6429810454977544e-06, + "loss": 1.1877, + "step": 16509 + }, + { + "epoch": 0.5, + "learning_rate": 2.6427375240239883e-06, + "loss": 1.129, + "step": 16510 + }, + { + "epoch": 0.5, + "learning_rate": 2.64249400119143e-06, + "loss": 1.1843, + "step": 16511 + }, + { + "epoch": 0.5, + "learning_rate": 2.642250477002397e-06, + "loss": 1.1679, + "step": 16512 + }, + { + "epoch": 0.5, + "learning_rate": 2.6420069514592085e-06, + "loss": 1.1343, + "step": 16513 + }, + { + "epoch": 0.5, + "learning_rate": 2.641763424564182e-06, + "loss": 1.0812, + "step": 16514 + }, + { + "epoch": 0.5, + "learning_rate": 2.6415198963196353e-06, + "loss": 1.0761, + "step": 16515 + }, + { + "epoch": 0.5, + "learning_rate": 2.641276366727888e-06, + "loss": 1.0593, + "step": 16516 + }, + { + "epoch": 0.5, + "learning_rate": 2.641032835791258e-06, + "loss": 1.1437, + "step": 16517 + }, + { + "epoch": 0.5, + "learning_rate": 2.640789303512063e-06, + "loss": 1.1514, + "step": 16518 + }, + { + "epoch": 0.5, + "learning_rate": 2.6405457698926214e-06, + "loss": 1.0845, + "step": 16519 + }, + { + "epoch": 0.5, + "learning_rate": 2.640302234935252e-06, + "loss": 1.1848, + "step": 16520 + }, + { + "epoch": 0.5, + "learning_rate": 2.6400586986422727e-06, + "loss": 1.1628, + "step": 16521 + }, + { + "epoch": 0.5, + "learning_rate": 2.639815161016003e-06, + "loss": 1.0733, + "step": 16522 + }, + { + "epoch": 0.5, + "learning_rate": 2.639571622058759e-06, + "loss": 1.1058, + "step": 16523 + }, + { + "epoch": 0.5, + "learning_rate": 2.6393280817728612e-06, + "loss": 0.9875, + "step": 16524 + }, + { + "epoch": 0.5, + "learning_rate": 2.6390845401606268e-06, + "loss": 1.252, + "step": 16525 + }, + { + "epoch": 0.5, + "learning_rate": 2.6388409972243752e-06, + "loss": 1.1385, + "step": 16526 + }, + { + "epoch": 0.5, + "learning_rate": 2.638597452966423e-06, + "loss": 1.0741, + "step": 16527 + }, + { + "epoch": 0.5, + "learning_rate": 2.6383539073890907e-06, + "loss": 1.0649, + "step": 16528 + }, + { + "epoch": 0.5, + "learning_rate": 2.638110360494695e-06, + "loss": 1.0828, + "step": 16529 + }, + { + "epoch": 0.5, + "learning_rate": 2.637866812285556e-06, + "loss": 1.0912, + "step": 16530 + }, + { + "epoch": 0.5, + "learning_rate": 2.637623262763991e-06, + "loss": 1.0361, + "step": 16531 + }, + { + "epoch": 0.5, + "learning_rate": 2.6373797119323187e-06, + "loss": 1.0995, + "step": 16532 + }, + { + "epoch": 0.5, + "learning_rate": 2.6371361597928585e-06, + "loss": 1.1426, + "step": 16533 + }, + { + "epoch": 0.5, + "learning_rate": 2.636892606347927e-06, + "loss": 1.1117, + "step": 16534 + }, + { + "epoch": 0.5, + "learning_rate": 2.636649051599845e-06, + "loss": 1.1412, + "step": 16535 + }, + { + "epoch": 0.5, + "learning_rate": 2.636405495550929e-06, + "loss": 1.2289, + "step": 16536 + }, + { + "epoch": 0.5, + "learning_rate": 2.6361619382034985e-06, + "loss": 1.1517, + "step": 16537 + }, + { + "epoch": 0.5, + "learning_rate": 2.635918379559872e-06, + "loss": 1.239, + "step": 16538 + }, + { + "epoch": 0.5, + "learning_rate": 2.6356748196223687e-06, + "loss": 1.0403, + "step": 16539 + }, + { + "epoch": 0.5, + "learning_rate": 2.6354312583933052e-06, + "loss": 1.0519, + "step": 16540 + }, + { + "epoch": 0.5, + "learning_rate": 2.6351876958750017e-06, + "loss": 1.154, + "step": 16541 + }, + { + "epoch": 0.5, + "learning_rate": 2.6349441320697764e-06, + "loss": 1.1201, + "step": 16542 + }, + { + "epoch": 0.5, + "learning_rate": 2.6347005669799486e-06, + "loss": 1.18, + "step": 16543 + }, + { + "epoch": 0.5, + "learning_rate": 2.6344570006078357e-06, + "loss": 1.1465, + "step": 16544 + }, + { + "epoch": 0.5, + "learning_rate": 2.6342134329557565e-06, + "loss": 1.079, + "step": 16545 + }, + { + "epoch": 0.5, + "learning_rate": 2.6339698640260315e-06, + "loss": 1.1329, + "step": 16546 + }, + { + "epoch": 0.5, + "learning_rate": 2.6337262938209764e-06, + "loss": 1.1494, + "step": 16547 + }, + { + "epoch": 0.5, + "learning_rate": 2.633482722342913e-06, + "loss": 1.2474, + "step": 16548 + }, + { + "epoch": 0.5, + "learning_rate": 2.633239149594157e-06, + "loss": 1.095, + "step": 16549 + }, + { + "epoch": 0.5, + "learning_rate": 2.6329955755770287e-06, + "loss": 1.1317, + "step": 16550 + }, + { + "epoch": 0.5, + "learning_rate": 2.6327520002938467e-06, + "loss": 1.1766, + "step": 16551 + }, + { + "epoch": 0.5, + "learning_rate": 2.63250842374693e-06, + "loss": 1.0091, + "step": 16552 + }, + { + "epoch": 0.5, + "learning_rate": 2.6322648459385964e-06, + "loss": 1.146, + "step": 16553 + }, + { + "epoch": 0.5, + "learning_rate": 2.6320212668711647e-06, + "loss": 1.1421, + "step": 16554 + }, + { + "epoch": 0.5, + "learning_rate": 2.6317776865469547e-06, + "loss": 1.1824, + "step": 16555 + }, + { + "epoch": 0.5, + "learning_rate": 2.631534104968285e-06, + "loss": 1.1598, + "step": 16556 + }, + { + "epoch": 0.5, + "learning_rate": 2.6312905221374737e-06, + "loss": 1.0858, + "step": 16557 + }, + { + "epoch": 0.5, + "learning_rate": 2.6310469380568394e-06, + "loss": 1.1255, + "step": 16558 + }, + { + "epoch": 0.5, + "learning_rate": 2.6308033527287018e-06, + "loss": 1.1255, + "step": 16559 + }, + { + "epoch": 0.5, + "learning_rate": 2.6305597661553795e-06, + "loss": 1.1444, + "step": 16560 + }, + { + "epoch": 0.5, + "learning_rate": 2.6303161783391906e-06, + "loss": 1.14, + "step": 16561 + }, + { + "epoch": 0.5, + "learning_rate": 2.6300725892824546e-06, + "loss": 1.0586, + "step": 16562 + }, + { + "epoch": 0.5, + "learning_rate": 2.629828998987491e-06, + "loss": 0.9861, + "step": 16563 + }, + { + "epoch": 0.5, + "learning_rate": 2.6295854074566167e-06, + "loss": 1.086, + "step": 16564 + }, + { + "epoch": 0.5, + "learning_rate": 2.6293418146921524e-06, + "loss": 1.1586, + "step": 16565 + }, + { + "epoch": 0.5, + "learning_rate": 2.629098220696416e-06, + "loss": 1.0521, + "step": 16566 + }, + { + "epoch": 0.5, + "learning_rate": 2.6288546254717266e-06, + "loss": 1.1453, + "step": 16567 + }, + { + "epoch": 0.5, + "learning_rate": 2.6286110290204035e-06, + "loss": 1.2411, + "step": 16568 + }, + { + "epoch": 0.5, + "learning_rate": 2.628367431344765e-06, + "loss": 1.2621, + "step": 16569 + }, + { + "epoch": 0.5, + "learning_rate": 2.6281238324471304e-06, + "loss": 1.196, + "step": 16570 + }, + { + "epoch": 0.5, + "learning_rate": 2.6278802323298187e-06, + "loss": 1.0553, + "step": 16571 + }, + { + "epoch": 0.5, + "learning_rate": 2.6276366309951495e-06, + "loss": 1.1459, + "step": 16572 + }, + { + "epoch": 0.5, + "learning_rate": 2.6273930284454404e-06, + "loss": 1.2091, + "step": 16573 + }, + { + "epoch": 0.5, + "learning_rate": 2.627149424683011e-06, + "loss": 1.1449, + "step": 16574 + }, + { + "epoch": 0.5, + "learning_rate": 2.6269058197101806e-06, + "loss": 1.1021, + "step": 16575 + }, + { + "epoch": 0.5, + "learning_rate": 2.626662213529268e-06, + "loss": 1.133, + "step": 16576 + }, + { + "epoch": 0.5, + "learning_rate": 2.626418606142591e-06, + "loss": 1.1454, + "step": 16577 + }, + { + "epoch": 0.5, + "learning_rate": 2.6261749975524715e-06, + "loss": 1.0692, + "step": 16578 + }, + { + "epoch": 0.5, + "learning_rate": 2.6259313877612257e-06, + "loss": 1.0551, + "step": 16579 + }, + { + "epoch": 0.5, + "learning_rate": 2.625687776771174e-06, + "loss": 1.1087, + "step": 16580 + }, + { + "epoch": 0.5, + "learning_rate": 2.6254441645846353e-06, + "loss": 1.1472, + "step": 16581 + }, + { + "epoch": 0.5, + "learning_rate": 2.625200551203928e-06, + "loss": 1.0444, + "step": 16582 + }, + { + "epoch": 0.5, + "learning_rate": 2.624956936631372e-06, + "loss": 1.0944, + "step": 16583 + }, + { + "epoch": 0.5, + "learning_rate": 2.624713320869286e-06, + "loss": 1.1906, + "step": 16584 + }, + { + "epoch": 0.5, + "learning_rate": 2.6244697039199895e-06, + "loss": 1.0756, + "step": 16585 + }, + { + "epoch": 0.5, + "learning_rate": 2.6242260857858017e-06, + "loss": 1.2603, + "step": 16586 + }, + { + "epoch": 0.5, + "learning_rate": 2.623982466469041e-06, + "loss": 1.0677, + "step": 16587 + }, + { + "epoch": 0.5, + "learning_rate": 2.623738845972027e-06, + "loss": 1.0778, + "step": 16588 + }, + { + "epoch": 0.5, + "learning_rate": 2.623495224297079e-06, + "loss": 1.1273, + "step": 16589 + }, + { + "epoch": 0.5, + "learning_rate": 2.623251601446516e-06, + "loss": 1.0131, + "step": 16590 + }, + { + "epoch": 0.5, + "learning_rate": 2.623007977422657e-06, + "loss": 1.1219, + "step": 16591 + }, + { + "epoch": 0.5, + "learning_rate": 2.6227643522278213e-06, + "loss": 1.1732, + "step": 16592 + }, + { + "epoch": 0.5, + "learning_rate": 2.622520725864328e-06, + "loss": 1.229, + "step": 16593 + }, + { + "epoch": 0.5, + "learning_rate": 2.6222770983344963e-06, + "loss": 1.0087, + "step": 16594 + }, + { + "epoch": 0.5, + "learning_rate": 2.622033469640645e-06, + "loss": 1.0571, + "step": 16595 + }, + { + "epoch": 0.5, + "learning_rate": 2.6217898397850942e-06, + "loss": 1.14, + "step": 16596 + }, + { + "epoch": 0.5, + "learning_rate": 2.6215462087701636e-06, + "loss": 1.1188, + "step": 16597 + }, + { + "epoch": 0.5, + "learning_rate": 2.621302576598171e-06, + "loss": 1.1362, + "step": 16598 + }, + { + "epoch": 0.5, + "learning_rate": 2.621058943271436e-06, + "loss": 1.1239, + "step": 16599 + }, + { + "epoch": 0.5, + "learning_rate": 2.620815308792279e-06, + "loss": 1.0438, + "step": 16600 + }, + { + "epoch": 0.5, + "learning_rate": 2.620571673163018e-06, + "loss": 1.2146, + "step": 16601 + }, + { + "epoch": 0.5, + "learning_rate": 2.6203280363859724e-06, + "loss": 1.2043, + "step": 16602 + }, + { + "epoch": 0.5, + "learning_rate": 2.620084398463462e-06, + "loss": 1.2311, + "step": 16603 + }, + { + "epoch": 0.5, + "learning_rate": 2.6198407593978065e-06, + "loss": 1.0746, + "step": 16604 + }, + { + "epoch": 0.5, + "learning_rate": 2.6195971191913237e-06, + "loss": 1.098, + "step": 16605 + }, + { + "epoch": 0.5, + "learning_rate": 2.6193534778463354e-06, + "loss": 1.116, + "step": 16606 + }, + { + "epoch": 0.5, + "learning_rate": 2.619109835365158e-06, + "loss": 1.1925, + "step": 16607 + }, + { + "epoch": 0.5, + "learning_rate": 2.6188661917501136e-06, + "loss": 1.0834, + "step": 16608 + }, + { + "epoch": 0.5, + "learning_rate": 2.6186225470035194e-06, + "loss": 1.0485, + "step": 16609 + }, + { + "epoch": 0.5, + "learning_rate": 2.6183789011276955e-06, + "loss": 1.1027, + "step": 16610 + }, + { + "epoch": 0.5, + "learning_rate": 2.6181352541249617e-06, + "loss": 1.1917, + "step": 16611 + }, + { + "epoch": 0.5, + "learning_rate": 2.6178916059976374e-06, + "loss": 1.082, + "step": 16612 + }, + { + "epoch": 0.5, + "learning_rate": 2.617647956748042e-06, + "loss": 1.2108, + "step": 16613 + }, + { + "epoch": 0.5, + "learning_rate": 2.6174043063784936e-06, + "loss": 1.0815, + "step": 16614 + }, + { + "epoch": 0.5, + "learning_rate": 2.617160654891314e-06, + "loss": 1.183, + "step": 16615 + }, + { + "epoch": 0.5, + "learning_rate": 2.616917002288821e-06, + "loss": 1.1263, + "step": 16616 + }, + { + "epoch": 0.5, + "learning_rate": 2.6166733485733348e-06, + "loss": 1.1918, + "step": 16617 + }, + { + "epoch": 0.5, + "learning_rate": 2.6164296937471738e-06, + "loss": 1.2331, + "step": 16618 + }, + { + "epoch": 0.5, + "learning_rate": 2.616186037812659e-06, + "loss": 1.0633, + "step": 16619 + }, + { + "epoch": 0.5, + "learning_rate": 2.6159423807721085e-06, + "loss": 1.0718, + "step": 16620 + }, + { + "epoch": 0.5, + "learning_rate": 2.615698722627843e-06, + "loss": 1.0929, + "step": 16621 + }, + { + "epoch": 0.5, + "learning_rate": 2.6154550633821803e-06, + "loss": 1.0201, + "step": 16622 + }, + { + "epoch": 0.5, + "learning_rate": 2.6152114030374413e-06, + "loss": 1.154, + "step": 16623 + }, + { + "epoch": 0.5, + "learning_rate": 2.614967741595945e-06, + "loss": 1.2108, + "step": 16624 + }, + { + "epoch": 0.5, + "learning_rate": 2.614724079060012e-06, + "loss": 1.0533, + "step": 16625 + }, + { + "epoch": 0.5, + "learning_rate": 2.614480415431961e-06, + "loss": 1.1174, + "step": 16626 + }, + { + "epoch": 0.5, + "learning_rate": 2.614236750714111e-06, + "loss": 1.1929, + "step": 16627 + }, + { + "epoch": 0.5, + "learning_rate": 2.6139930849087823e-06, + "loss": 1.14, + "step": 16628 + }, + { + "epoch": 0.5, + "learning_rate": 2.613749418018295e-06, + "loss": 1.112, + "step": 16629 + }, + { + "epoch": 0.5, + "learning_rate": 2.6135057500449672e-06, + "loss": 1.2023, + "step": 16630 + }, + { + "epoch": 0.5, + "learning_rate": 2.6132620809911197e-06, + "loss": 1.1484, + "step": 16631 + }, + { + "epoch": 0.5, + "learning_rate": 2.6130184108590717e-06, + "loss": 1.2401, + "step": 16632 + }, + { + "epoch": 0.5, + "learning_rate": 2.6127747396511428e-06, + "loss": 1.1431, + "step": 16633 + }, + { + "epoch": 0.5, + "learning_rate": 2.612531067369653e-06, + "loss": 1.0347, + "step": 16634 + }, + { + "epoch": 0.5, + "learning_rate": 2.6122873940169214e-06, + "loss": 1.0856, + "step": 16635 + }, + { + "epoch": 0.5, + "learning_rate": 2.6120437195952677e-06, + "loss": 1.1741, + "step": 16636 + }, + { + "epoch": 0.5, + "learning_rate": 2.6118000441070115e-06, + "loss": 1.2667, + "step": 16637 + }, + { + "epoch": 0.5, + "learning_rate": 2.611556367554473e-06, + "loss": 1.1116, + "step": 16638 + }, + { + "epoch": 0.5, + "learning_rate": 2.6113126899399716e-06, + "loss": 1.2153, + "step": 16639 + }, + { + "epoch": 0.5, + "learning_rate": 2.611069011265827e-06, + "loss": 1.0347, + "step": 16640 + }, + { + "epoch": 0.5, + "learning_rate": 2.6108253315343598e-06, + "loss": 1.1227, + "step": 16641 + }, + { + "epoch": 0.5, + "learning_rate": 2.6105816507478875e-06, + "loss": 1.0068, + "step": 16642 + }, + { + "epoch": 0.5, + "learning_rate": 2.610337968908732e-06, + "loss": 1.2175, + "step": 16643 + }, + { + "epoch": 0.5, + "learning_rate": 2.610094286019211e-06, + "loss": 1.1491, + "step": 16644 + }, + { + "epoch": 0.5, + "learning_rate": 2.609850602081647e-06, + "loss": 1.1605, + "step": 16645 + }, + { + "epoch": 0.5, + "learning_rate": 2.6096069170983574e-06, + "loss": 1.1201, + "step": 16646 + }, + { + "epoch": 0.5, + "learning_rate": 2.6093632310716633e-06, + "loss": 1.07, + "step": 16647 + }, + { + "epoch": 0.5, + "learning_rate": 2.609119544003883e-06, + "loss": 1.1543, + "step": 16648 + }, + { + "epoch": 0.5, + "learning_rate": 2.608875855897338e-06, + "loss": 1.217, + "step": 16649 + }, + { + "epoch": 0.5, + "learning_rate": 2.6086321667543467e-06, + "loss": 1.1596, + "step": 16650 + }, + { + "epoch": 0.5, + "learning_rate": 2.6083884765772292e-06, + "loss": 1.1191, + "step": 16651 + }, + { + "epoch": 0.5, + "learning_rate": 2.6081447853683062e-06, + "loss": 1.1636, + "step": 16652 + }, + { + "epoch": 0.5, + "learning_rate": 2.6079010931298964e-06, + "loss": 1.1028, + "step": 16653 + }, + { + "epoch": 0.5, + "learning_rate": 2.607657399864321e-06, + "loss": 1.0754, + "step": 16654 + }, + { + "epoch": 0.5, + "learning_rate": 2.6074137055738986e-06, + "loss": 1.1182, + "step": 16655 + }, + { + "epoch": 0.5, + "learning_rate": 2.6071700102609493e-06, + "loss": 1.2564, + "step": 16656 + }, + { + "epoch": 0.5, + "learning_rate": 2.6069263139277933e-06, + "loss": 1.0811, + "step": 16657 + }, + { + "epoch": 0.5, + "learning_rate": 2.6066826165767507e-06, + "loss": 1.0853, + "step": 16658 + }, + { + "epoch": 0.5, + "learning_rate": 2.60643891821014e-06, + "loss": 1.1833, + "step": 16659 + }, + { + "epoch": 0.5, + "learning_rate": 2.6061952188302832e-06, + "loss": 1.1301, + "step": 16660 + }, + { + "epoch": 0.5, + "learning_rate": 2.605951518439498e-06, + "loss": 1.2018, + "step": 16661 + }, + { + "epoch": 0.5, + "learning_rate": 2.6057078170401063e-06, + "loss": 1.1253, + "step": 16662 + }, + { + "epoch": 0.5, + "learning_rate": 2.6054641146344263e-06, + "loss": 1.0452, + "step": 16663 + }, + { + "epoch": 0.5, + "learning_rate": 2.6052204112247785e-06, + "loss": 1.0859, + "step": 16664 + }, + { + "epoch": 0.5, + "learning_rate": 2.6049767068134833e-06, + "loss": 1.1172, + "step": 16665 + }, + { + "epoch": 0.5, + "learning_rate": 2.6047330014028603e-06, + "loss": 1.1082, + "step": 16666 + }, + { + "epoch": 0.5, + "learning_rate": 2.6044892949952304e-06, + "loss": 1.075, + "step": 16667 + }, + { + "epoch": 0.5, + "learning_rate": 2.6042455875929123e-06, + "loss": 1.1638, + "step": 16668 + }, + { + "epoch": 0.5, + "learning_rate": 2.604001879198227e-06, + "loss": 1.2184, + "step": 16669 + }, + { + "epoch": 0.5, + "learning_rate": 2.6037581698134927e-06, + "loss": 1.1907, + "step": 16670 + }, + { + "epoch": 0.5, + "learning_rate": 2.6035144594410316e-06, + "loss": 1.1401, + "step": 16671 + }, + { + "epoch": 0.5, + "learning_rate": 2.603270748083162e-06, + "loss": 1.0405, + "step": 16672 + }, + { + "epoch": 0.5, + "learning_rate": 2.6030270357422057e-06, + "loss": 1.1776, + "step": 16673 + }, + { + "epoch": 0.5, + "learning_rate": 2.60278332242048e-06, + "loss": 1.1821, + "step": 16674 + }, + { + "epoch": 0.5, + "learning_rate": 2.602539608120308e-06, + "loss": 1.2385, + "step": 16675 + }, + { + "epoch": 0.5, + "learning_rate": 2.6022958928440073e-06, + "loss": 1.1855, + "step": 16676 + }, + { + "epoch": 0.5, + "learning_rate": 2.6020521765938995e-06, + "loss": 1.0399, + "step": 16677 + }, + { + "epoch": 0.5, + "learning_rate": 2.6018084593723037e-06, + "loss": 1.0009, + "step": 16678 + }, + { + "epoch": 0.5, + "learning_rate": 2.601564741181541e-06, + "loss": 1.1275, + "step": 16679 + }, + { + "epoch": 0.5, + "learning_rate": 2.6013210220239306e-06, + "loss": 1.1846, + "step": 16680 + }, + { + "epoch": 0.5, + "learning_rate": 2.6010773019017925e-06, + "loss": 1.2061, + "step": 16681 + }, + { + "epoch": 0.5, + "learning_rate": 2.6008335808174478e-06, + "loss": 0.9975, + "step": 16682 + }, + { + "epoch": 0.5, + "learning_rate": 2.6005898587732157e-06, + "loss": 1.2238, + "step": 16683 + }, + { + "epoch": 0.5, + "learning_rate": 2.600346135771417e-06, + "loss": 1.1369, + "step": 16684 + }, + { + "epoch": 0.5, + "learning_rate": 2.6001024118143708e-06, + "loss": 1.2011, + "step": 16685 + }, + { + "epoch": 0.5, + "learning_rate": 2.5998586869043984e-06, + "loss": 1.2015, + "step": 16686 + }, + { + "epoch": 0.5, + "learning_rate": 2.5996149610438187e-06, + "loss": 1.1436, + "step": 16687 + }, + { + "epoch": 0.5, + "learning_rate": 2.599371234234953e-06, + "loss": 1.1035, + "step": 16688 + }, + { + "epoch": 0.5, + "learning_rate": 2.599127506480121e-06, + "loss": 1.0574, + "step": 16689 + }, + { + "epoch": 0.5, + "learning_rate": 2.5988837777816434e-06, + "loss": 1.0038, + "step": 16690 + }, + { + "epoch": 0.5, + "learning_rate": 2.598640048141839e-06, + "loss": 1.0719, + "step": 16691 + }, + { + "epoch": 0.5, + "learning_rate": 2.598396317563029e-06, + "loss": 1.1042, + "step": 16692 + }, + { + "epoch": 0.5, + "learning_rate": 2.598152586047533e-06, + "loss": 1.1343, + "step": 16693 + }, + { + "epoch": 0.5, + "learning_rate": 2.597908853597672e-06, + "loss": 0.9987, + "step": 16694 + }, + { + "epoch": 0.5, + "learning_rate": 2.5976651202157666e-06, + "loss": 1.1093, + "step": 16695 + }, + { + "epoch": 0.5, + "learning_rate": 2.597421385904135e-06, + "loss": 1.0887, + "step": 16696 + }, + { + "epoch": 0.5, + "learning_rate": 2.5971776506651003e-06, + "loss": 1.0652, + "step": 16697 + }, + { + "epoch": 0.5, + "learning_rate": 2.5969339145009802e-06, + "loss": 1.206, + "step": 16698 + }, + { + "epoch": 0.5, + "learning_rate": 2.596690177414096e-06, + "loss": 1.1052, + "step": 16699 + }, + { + "epoch": 0.5, + "learning_rate": 2.596446439406768e-06, + "loss": 1.1631, + "step": 16700 + }, + { + "epoch": 0.5, + "learning_rate": 2.5962027004813166e-06, + "loss": 1.1467, + "step": 16701 + }, + { + "epoch": 0.5, + "learning_rate": 2.5959589606400613e-06, + "loss": 1.1895, + "step": 16702 + }, + { + "epoch": 0.5, + "learning_rate": 2.5957152198853237e-06, + "loss": 1.0811, + "step": 16703 + }, + { + "epoch": 0.5, + "learning_rate": 2.5954714782194222e-06, + "loss": 1.245, + "step": 16704 + }, + { + "epoch": 0.5, + "learning_rate": 2.5952277356446785e-06, + "loss": 1.1161, + "step": 16705 + }, + { + "epoch": 0.5, + "learning_rate": 2.594983992163413e-06, + "loss": 1.238, + "step": 16706 + }, + { + "epoch": 0.5, + "learning_rate": 2.5947402477779454e-06, + "loss": 1.1978, + "step": 16707 + }, + { + "epoch": 0.5, + "learning_rate": 2.5944965024905965e-06, + "loss": 1.1307, + "step": 16708 + }, + { + "epoch": 0.5, + "learning_rate": 2.5942527563036863e-06, + "loss": 1.1084, + "step": 16709 + }, + { + "epoch": 0.5, + "learning_rate": 2.5940090092195353e-06, + "loss": 1.1315, + "step": 16710 + }, + { + "epoch": 0.5, + "learning_rate": 2.5937652612404635e-06, + "loss": 1.1394, + "step": 16711 + }, + { + "epoch": 0.5, + "learning_rate": 2.593521512368792e-06, + "loss": 1.0763, + "step": 16712 + }, + { + "epoch": 0.5, + "learning_rate": 2.5932777626068405e-06, + "loss": 1.1769, + "step": 16713 + }, + { + "epoch": 0.5, + "learning_rate": 2.59303401195693e-06, + "loss": 1.1337, + "step": 16714 + }, + { + "epoch": 0.5, + "learning_rate": 2.59279026042138e-06, + "loss": 1.0856, + "step": 16715 + }, + { + "epoch": 0.5, + "learning_rate": 2.5925465080025118e-06, + "loss": 1.1179, + "step": 16716 + }, + { + "epoch": 0.5, + "learning_rate": 2.5923027547026454e-06, + "loss": 1.157, + "step": 16717 + }, + { + "epoch": 0.5, + "learning_rate": 2.592059000524101e-06, + "loss": 1.2821, + "step": 16718 + }, + { + "epoch": 0.5, + "learning_rate": 2.591815245469199e-06, + "loss": 1.1807, + "step": 16719 + }, + { + "epoch": 0.5, + "learning_rate": 2.5915714895402606e-06, + "loss": 1.0963, + "step": 16720 + }, + { + "epoch": 0.5, + "learning_rate": 2.5913277327396053e-06, + "loss": 1.1583, + "step": 16721 + }, + { + "epoch": 0.5, + "learning_rate": 2.5910839750695537e-06, + "loss": 1.2213, + "step": 16722 + }, + { + "epoch": 0.5, + "learning_rate": 2.5908402165324276e-06, + "loss": 1.212, + "step": 16723 + }, + { + "epoch": 0.5, + "learning_rate": 2.590596457130546e-06, + "loss": 1.1345, + "step": 16724 + }, + { + "epoch": 0.5, + "learning_rate": 2.5903526968662294e-06, + "loss": 1.2047, + "step": 16725 + }, + { + "epoch": 0.5, + "learning_rate": 2.5901089357417987e-06, + "loss": 1.0348, + "step": 16726 + }, + { + "epoch": 0.5, + "learning_rate": 2.589865173759575e-06, + "loss": 1.1439, + "step": 16727 + }, + { + "epoch": 0.5, + "learning_rate": 2.589621410921877e-06, + "loss": 1.057, + "step": 16728 + }, + { + "epoch": 0.5, + "learning_rate": 2.5893776472310274e-06, + "loss": 1.1127, + "step": 16729 + }, + { + "epoch": 0.5, + "learning_rate": 2.589133882689345e-06, + "loss": 1.0104, + "step": 16730 + }, + { + "epoch": 0.5, + "learning_rate": 2.588890117299151e-06, + "loss": 1.267, + "step": 16731 + }, + { + "epoch": 0.5, + "learning_rate": 2.588646351062766e-06, + "loss": 1.1302, + "step": 16732 + }, + { + "epoch": 0.5, + "learning_rate": 2.5884025839825106e-06, + "loss": 1.1801, + "step": 16733 + }, + { + "epoch": 0.5, + "learning_rate": 2.5881588160607045e-06, + "loss": 1.0269, + "step": 16734 + }, + { + "epoch": 0.5, + "learning_rate": 2.5879150472996695e-06, + "loss": 1.1744, + "step": 16735 + }, + { + "epoch": 0.5, + "learning_rate": 2.5876712777017254e-06, + "loss": 1.1754, + "step": 16736 + }, + { + "epoch": 0.5, + "learning_rate": 2.587427507269193e-06, + "loss": 1.1991, + "step": 16737 + }, + { + "epoch": 0.5, + "learning_rate": 2.5871837360043934e-06, + "loss": 1.2144, + "step": 16738 + }, + { + "epoch": 0.5, + "learning_rate": 2.586939963909646e-06, + "loss": 1.1179, + "step": 16739 + }, + { + "epoch": 0.5, + "learning_rate": 2.5866961909872725e-06, + "loss": 1.0918, + "step": 16740 + }, + { + "epoch": 0.5, + "learning_rate": 2.5864524172395924e-06, + "loss": 1.0362, + "step": 16741 + }, + { + "epoch": 0.5, + "learning_rate": 2.5862086426689275e-06, + "loss": 1.1778, + "step": 16742 + }, + { + "epoch": 0.5, + "learning_rate": 2.5859648672775973e-06, + "loss": 1.1042, + "step": 16743 + }, + { + "epoch": 0.5, + "learning_rate": 2.585721091067923e-06, + "loss": 1.2343, + "step": 16744 + }, + { + "epoch": 0.5, + "learning_rate": 2.5854773140422256e-06, + "loss": 1.1088, + "step": 16745 + }, + { + "epoch": 0.5, + "learning_rate": 2.5852335362028254e-06, + "loss": 1.1133, + "step": 16746 + }, + { + "epoch": 0.5, + "learning_rate": 2.584989757552042e-06, + "loss": 1.1143, + "step": 16747 + }, + { + "epoch": 0.5, + "learning_rate": 2.584745978092198e-06, + "loss": 1.0395, + "step": 16748 + }, + { + "epoch": 0.5, + "learning_rate": 2.584502197825613e-06, + "loss": 1.1476, + "step": 16749 + }, + { + "epoch": 0.5, + "learning_rate": 2.5842584167546076e-06, + "loss": 1.1534, + "step": 16750 + }, + { + "epoch": 0.5, + "learning_rate": 2.5840146348815026e-06, + "loss": 1.164, + "step": 16751 + }, + { + "epoch": 0.5, + "learning_rate": 2.5837708522086186e-06, + "loss": 1.0822, + "step": 16752 + }, + { + "epoch": 0.5, + "learning_rate": 2.5835270687382776e-06, + "loss": 1.2137, + "step": 16753 + }, + { + "epoch": 0.5, + "learning_rate": 2.583283284472798e-06, + "loss": 1.0349, + "step": 16754 + }, + { + "epoch": 0.5, + "learning_rate": 2.583039499414502e-06, + "loss": 1.0617, + "step": 16755 + }, + { + "epoch": 0.5, + "learning_rate": 2.5827957135657093e-06, + "loss": 1.1553, + "step": 16756 + }, + { + "epoch": 0.5, + "learning_rate": 2.582551926928742e-06, + "loss": 1.0775, + "step": 16757 + }, + { + "epoch": 0.5, + "learning_rate": 2.5823081395059203e-06, + "loss": 1.2025, + "step": 16758 + }, + { + "epoch": 0.5, + "learning_rate": 2.5820643512995636e-06, + "loss": 1.1393, + "step": 16759 + }, + { + "epoch": 0.5, + "learning_rate": 2.5818205623119947e-06, + "loss": 1.113, + "step": 16760 + }, + { + "epoch": 0.5, + "learning_rate": 2.5815767725455333e-06, + "loss": 1.3136, + "step": 16761 + }, + { + "epoch": 0.5, + "learning_rate": 2.5813329820025e-06, + "loss": 1.1371, + "step": 16762 + }, + { + "epoch": 0.5, + "learning_rate": 2.5810891906852163e-06, + "loss": 0.9639, + "step": 16763 + }, + { + "epoch": 0.51, + "learning_rate": 2.5808453985960025e-06, + "loss": 1.2301, + "step": 16764 + }, + { + "epoch": 0.51, + "learning_rate": 2.5806016057371797e-06, + "loss": 1.1335, + "step": 16765 + }, + { + "epoch": 0.51, + "learning_rate": 2.580357812111068e-06, + "loss": 0.9995, + "step": 16766 + }, + { + "epoch": 0.51, + "learning_rate": 2.5801140177199886e-06, + "loss": 1.0784, + "step": 16767 + }, + { + "epoch": 0.51, + "learning_rate": 2.579870222566263e-06, + "loss": 1.1646, + "step": 16768 + }, + { + "epoch": 0.51, + "learning_rate": 2.579626426652211e-06, + "loss": 1.17, + "step": 16769 + }, + { + "epoch": 0.51, + "learning_rate": 2.579382629980153e-06, + "loss": 1.1572, + "step": 16770 + }, + { + "epoch": 0.51, + "learning_rate": 2.5791388325524114e-06, + "loss": 1.1202, + "step": 16771 + }, + { + "epoch": 0.51, + "learning_rate": 2.5788950343713058e-06, + "loss": 1.1255, + "step": 16772 + }, + { + "epoch": 0.51, + "learning_rate": 2.5786512354391584e-06, + "loss": 1.1921, + "step": 16773 + }, + { + "epoch": 0.51, + "learning_rate": 2.578407435758288e-06, + "loss": 1.1093, + "step": 16774 + }, + { + "epoch": 0.51, + "learning_rate": 2.5781636353310167e-06, + "loss": 1.0077, + "step": 16775 + }, + { + "epoch": 0.51, + "learning_rate": 2.577919834159666e-06, + "loss": 1.0513, + "step": 16776 + }, + { + "epoch": 0.51, + "learning_rate": 2.5776760322465554e-06, + "loss": 1.1013, + "step": 16777 + }, + { + "epoch": 0.51, + "learning_rate": 2.5774322295940064e-06, + "loss": 1.1082, + "step": 16778 + }, + { + "epoch": 0.51, + "learning_rate": 2.57718842620434e-06, + "loss": 1.2587, + "step": 16779 + }, + { + "epoch": 0.51, + "learning_rate": 2.576944622079877e-06, + "loss": 1.1735, + "step": 16780 + }, + { + "epoch": 0.51, + "learning_rate": 2.5767008172229384e-06, + "loss": 1.1837, + "step": 16781 + }, + { + "epoch": 0.51, + "learning_rate": 2.5764570116358446e-06, + "loss": 1.1198, + "step": 16782 + }, + { + "epoch": 0.51, + "learning_rate": 2.576213205320918e-06, + "loss": 1.1951, + "step": 16783 + }, + { + "epoch": 0.51, + "learning_rate": 2.575969398280477e-06, + "loss": 1.0488, + "step": 16784 + }, + { + "epoch": 0.51, + "learning_rate": 2.575725590516844e-06, + "loss": 1.2521, + "step": 16785 + }, + { + "epoch": 0.51, + "learning_rate": 2.57548178203234e-06, + "loss": 1.1577, + "step": 16786 + }, + { + "epoch": 0.51, + "learning_rate": 2.575237972829286e-06, + "loss": 1.1749, + "step": 16787 + }, + { + "epoch": 0.51, + "learning_rate": 2.5749941629100028e-06, + "loss": 1.0553, + "step": 16788 + }, + { + "epoch": 0.51, + "learning_rate": 2.574750352276811e-06, + "loss": 1.036, + "step": 16789 + }, + { + "epoch": 0.51, + "learning_rate": 2.5745065409320324e-06, + "loss": 1.1171, + "step": 16790 + }, + { + "epoch": 0.51, + "learning_rate": 2.5742627288779865e-06, + "loss": 1.1718, + "step": 16791 + }, + { + "epoch": 0.51, + "learning_rate": 2.5740189161169967e-06, + "loss": 1.1383, + "step": 16792 + }, + { + "epoch": 0.51, + "learning_rate": 2.5737751026513805e-06, + "loss": 1.1277, + "step": 16793 + }, + { + "epoch": 0.51, + "learning_rate": 2.5735312884834623e-06, + "loss": 1.1516, + "step": 16794 + }, + { + "epoch": 0.51, + "learning_rate": 2.573287473615561e-06, + "loss": 1.0837, + "step": 16795 + }, + { + "epoch": 0.51, + "learning_rate": 2.573043658049999e-06, + "loss": 1.0162, + "step": 16796 + }, + { + "epoch": 0.51, + "learning_rate": 2.572799841789096e-06, + "loss": 1.2064, + "step": 16797 + }, + { + "epoch": 0.51, + "learning_rate": 2.5725560248351735e-06, + "loss": 1.2227, + "step": 16798 + }, + { + "epoch": 0.51, + "learning_rate": 2.5723122071905526e-06, + "loss": 1.2068, + "step": 16799 + }, + { + "epoch": 0.51, + "learning_rate": 2.5720683888575544e-06, + "loss": 0.9722, + "step": 16800 + }, + { + "epoch": 0.51, + "learning_rate": 2.5718245698384997e-06, + "loss": 1.1746, + "step": 16801 + }, + { + "epoch": 0.51, + "learning_rate": 2.57158075013571e-06, + "loss": 1.1303, + "step": 16802 + }, + { + "epoch": 0.51, + "learning_rate": 2.5713369297515057e-06, + "loss": 1.1706, + "step": 16803 + }, + { + "epoch": 0.51, + "learning_rate": 2.5710931086882077e-06, + "loss": 1.201, + "step": 16804 + }, + { + "epoch": 0.51, + "learning_rate": 2.570849286948139e-06, + "loss": 1.2168, + "step": 16805 + }, + { + "epoch": 0.51, + "learning_rate": 2.570605464533618e-06, + "loss": 1.0879, + "step": 16806 + }, + { + "epoch": 0.51, + "learning_rate": 2.570361641446968e-06, + "loss": 1.1945, + "step": 16807 + }, + { + "epoch": 0.51, + "learning_rate": 2.5701178176905084e-06, + "loss": 1.0551, + "step": 16808 + }, + { + "epoch": 0.51, + "learning_rate": 2.569873993266561e-06, + "loss": 1.1772, + "step": 16809 + }, + { + "epoch": 0.51, + "learning_rate": 2.5696301681774467e-06, + "loss": 1.059, + "step": 16810 + }, + { + "epoch": 0.51, + "learning_rate": 2.569386342425487e-06, + "loss": 1.2003, + "step": 16811 + }, + { + "epoch": 0.51, + "learning_rate": 2.5691425160130025e-06, + "loss": 1.0834, + "step": 16812 + }, + { + "epoch": 0.51, + "learning_rate": 2.5688986889423144e-06, + "loss": 1.1256, + "step": 16813 + }, + { + "epoch": 0.51, + "learning_rate": 2.5686548612157445e-06, + "loss": 1.1407, + "step": 16814 + }, + { + "epoch": 0.51, + "learning_rate": 2.5684110328356133e-06, + "loss": 1.0648, + "step": 16815 + }, + { + "epoch": 0.51, + "learning_rate": 2.5681672038042417e-06, + "loss": 1.1103, + "step": 16816 + }, + { + "epoch": 0.51, + "learning_rate": 2.5679233741239505e-06, + "loss": 1.1175, + "step": 16817 + }, + { + "epoch": 0.51, + "learning_rate": 2.567679543797063e-06, + "loss": 1.1467, + "step": 16818 + }, + { + "epoch": 0.51, + "learning_rate": 2.5674357128258975e-06, + "loss": 1.1351, + "step": 16819 + }, + { + "epoch": 0.51, + "learning_rate": 2.567191881212778e-06, + "loss": 1.176, + "step": 16820 + }, + { + "epoch": 0.51, + "learning_rate": 2.566948048960023e-06, + "loss": 1.0549, + "step": 16821 + }, + { + "epoch": 0.51, + "learning_rate": 2.566704216069955e-06, + "loss": 1.0185, + "step": 16822 + }, + { + "epoch": 0.51, + "learning_rate": 2.5664603825448946e-06, + "loss": 1.1284, + "step": 16823 + }, + { + "epoch": 0.51, + "learning_rate": 2.566216548387164e-06, + "loss": 1.1334, + "step": 16824 + }, + { + "epoch": 0.51, + "learning_rate": 2.5659727135990836e-06, + "loss": 1.0963, + "step": 16825 + }, + { + "epoch": 0.51, + "learning_rate": 2.565728878182975e-06, + "loss": 1.0482, + "step": 16826 + }, + { + "epoch": 0.51, + "learning_rate": 2.565485042141159e-06, + "loss": 1.0534, + "step": 16827 + }, + { + "epoch": 0.51, + "learning_rate": 2.565241205475956e-06, + "loss": 1.164, + "step": 16828 + }, + { + "epoch": 0.51, + "learning_rate": 2.564997368189689e-06, + "loss": 1.2064, + "step": 16829 + }, + { + "epoch": 0.51, + "learning_rate": 2.5647535302846782e-06, + "loss": 1.2422, + "step": 16830 + }, + { + "epoch": 0.51, + "learning_rate": 2.5645096917632456e-06, + "loss": 1.1141, + "step": 16831 + }, + { + "epoch": 0.51, + "learning_rate": 2.564265852627711e-06, + "loss": 1.1448, + "step": 16832 + }, + { + "epoch": 0.51, + "learning_rate": 2.5640220128803965e-06, + "loss": 1.0131, + "step": 16833 + }, + { + "epoch": 0.51, + "learning_rate": 2.563778172523624e-06, + "loss": 1.0567, + "step": 16834 + }, + { + "epoch": 0.51, + "learning_rate": 2.5635343315597133e-06, + "loss": 1.1666, + "step": 16835 + }, + { + "epoch": 0.51, + "learning_rate": 2.5632904899909864e-06, + "loss": 1.1031, + "step": 16836 + }, + { + "epoch": 0.51, + "learning_rate": 2.5630466478197646e-06, + "loss": 1.0439, + "step": 16837 + }, + { + "epoch": 0.51, + "learning_rate": 2.5628028050483696e-06, + "loss": 1.0814, + "step": 16838 + }, + { + "epoch": 0.51, + "learning_rate": 2.5625589616791213e-06, + "loss": 1.0477, + "step": 16839 + }, + { + "epoch": 0.51, + "learning_rate": 2.5623151177143424e-06, + "loss": 1.1525, + "step": 16840 + }, + { + "epoch": 0.51, + "learning_rate": 2.5620712731563537e-06, + "loss": 1.163, + "step": 16841 + }, + { + "epoch": 0.51, + "learning_rate": 2.5618274280074756e-06, + "loss": 1.1508, + "step": 16842 + }, + { + "epoch": 0.51, + "learning_rate": 2.5615835822700304e-06, + "loss": 1.08, + "step": 16843 + }, + { + "epoch": 0.51, + "learning_rate": 2.5613397359463393e-06, + "loss": 1.1271, + "step": 16844 + }, + { + "epoch": 0.51, + "learning_rate": 2.561095889038724e-06, + "loss": 1.0839, + "step": 16845 + }, + { + "epoch": 0.51, + "learning_rate": 2.560852041549505e-06, + "loss": 1.2415, + "step": 16846 + }, + { + "epoch": 0.51, + "learning_rate": 2.5606081934810034e-06, + "loss": 1.1419, + "step": 16847 + }, + { + "epoch": 0.51, + "learning_rate": 2.5603643448355416e-06, + "loss": 1.009, + "step": 16848 + }, + { + "epoch": 0.51, + "learning_rate": 2.5601204956154395e-06, + "loss": 1.1767, + "step": 16849 + }, + { + "epoch": 0.51, + "learning_rate": 2.5598766458230197e-06, + "loss": 1.2078, + "step": 16850 + }, + { + "epoch": 0.51, + "learning_rate": 2.559632795460603e-06, + "loss": 1.1092, + "step": 16851 + }, + { + "epoch": 0.51, + "learning_rate": 2.559388944530511e-06, + "loss": 1.0172, + "step": 16852 + }, + { + "epoch": 0.51, + "learning_rate": 2.559145093035065e-06, + "loss": 1.0823, + "step": 16853 + }, + { + "epoch": 0.51, + "learning_rate": 2.558901240976586e-06, + "loss": 1.177, + "step": 16854 + }, + { + "epoch": 0.51, + "learning_rate": 2.5586573883573956e-06, + "loss": 1.1772, + "step": 16855 + }, + { + "epoch": 0.51, + "learning_rate": 2.5584135351798145e-06, + "loss": 1.1646, + "step": 16856 + }, + { + "epoch": 0.51, + "learning_rate": 2.5581696814461652e-06, + "loss": 1.1398, + "step": 16857 + }, + { + "epoch": 0.51, + "learning_rate": 2.557925827158768e-06, + "loss": 1.106, + "step": 16858 + }, + { + "epoch": 0.51, + "learning_rate": 2.557681972319946e-06, + "loss": 1.0331, + "step": 16859 + }, + { + "epoch": 0.51, + "learning_rate": 2.5574381169320184e-06, + "loss": 1.1465, + "step": 16860 + }, + { + "epoch": 0.51, + "learning_rate": 2.5571942609973082e-06, + "loss": 1.1821, + "step": 16861 + }, + { + "epoch": 0.51, + "learning_rate": 2.556950404518136e-06, + "loss": 1.1644, + "step": 16862 + }, + { + "epoch": 0.51, + "learning_rate": 2.5567065474968227e-06, + "loss": 1.2087, + "step": 16863 + }, + { + "epoch": 0.51, + "learning_rate": 2.5564626899356915e-06, + "loss": 1.1661, + "step": 16864 + }, + { + "epoch": 0.51, + "learning_rate": 2.5562188318370617e-06, + "loss": 1.1578, + "step": 16865 + }, + { + "epoch": 0.51, + "learning_rate": 2.555974973203257e-06, + "loss": 1.1328, + "step": 16866 + }, + { + "epoch": 0.51, + "learning_rate": 2.5557311140365964e-06, + "loss": 1.1846, + "step": 16867 + }, + { + "epoch": 0.51, + "learning_rate": 2.5554872543394028e-06, + "loss": 1.1182, + "step": 16868 + }, + { + "epoch": 0.51, + "learning_rate": 2.555243394113997e-06, + "loss": 1.2904, + "step": 16869 + }, + { + "epoch": 0.51, + "learning_rate": 2.5549995333627008e-06, + "loss": 1.0657, + "step": 16870 + }, + { + "epoch": 0.51, + "learning_rate": 2.5547556720878354e-06, + "loss": 1.105, + "step": 16871 + }, + { + "epoch": 0.51, + "learning_rate": 2.5545118102917225e-06, + "loss": 1.106, + "step": 16872 + }, + { + "epoch": 0.51, + "learning_rate": 2.5542679479766833e-06, + "loss": 1.1221, + "step": 16873 + }, + { + "epoch": 0.51, + "learning_rate": 2.5540240851450405e-06, + "loss": 1.0092, + "step": 16874 + }, + { + "epoch": 0.51, + "learning_rate": 2.553780221799113e-06, + "loss": 1.2045, + "step": 16875 + }, + { + "epoch": 0.51, + "learning_rate": 2.553536357941224e-06, + "loss": 1.1362, + "step": 16876 + }, + { + "epoch": 0.51, + "learning_rate": 2.5532924935736954e-06, + "loss": 1.17, + "step": 16877 + }, + { + "epoch": 0.51, + "learning_rate": 2.5530486286988472e-06, + "loss": 1.094, + "step": 16878 + }, + { + "epoch": 0.51, + "learning_rate": 2.552804763319002e-06, + "loss": 1.1139, + "step": 16879 + }, + { + "epoch": 0.51, + "learning_rate": 2.55256089743648e-06, + "loss": 1.0737, + "step": 16880 + }, + { + "epoch": 0.51, + "learning_rate": 2.552317031053605e-06, + "loss": 1.0607, + "step": 16881 + }, + { + "epoch": 0.51, + "learning_rate": 2.5520731641726958e-06, + "loss": 1.0477, + "step": 16882 + }, + { + "epoch": 0.51, + "learning_rate": 2.5518292967960757e-06, + "loss": 1.1622, + "step": 16883 + }, + { + "epoch": 0.51, + "learning_rate": 2.551585428926065e-06, + "loss": 1.0882, + "step": 16884 + }, + { + "epoch": 0.51, + "learning_rate": 2.551341560564987e-06, + "loss": 1.1725, + "step": 16885 + }, + { + "epoch": 0.51, + "learning_rate": 2.5510976917151616e-06, + "loss": 1.2616, + "step": 16886 + }, + { + "epoch": 0.51, + "learning_rate": 2.550853822378911e-06, + "loss": 1.0623, + "step": 16887 + }, + { + "epoch": 0.51, + "learning_rate": 2.550609952558556e-06, + "loss": 1.2084, + "step": 16888 + }, + { + "epoch": 0.51, + "learning_rate": 2.550366082256419e-06, + "loss": 1.2184, + "step": 16889 + }, + { + "epoch": 0.51, + "learning_rate": 2.550122211474821e-06, + "loss": 1.0699, + "step": 16890 + }, + { + "epoch": 0.51, + "learning_rate": 2.5498783402160833e-06, + "loss": 1.0677, + "step": 16891 + }, + { + "epoch": 0.51, + "learning_rate": 2.5496344684825286e-06, + "loss": 1.2279, + "step": 16892 + }, + { + "epoch": 0.51, + "learning_rate": 2.549390596276477e-06, + "loss": 1.2598, + "step": 16893 + }, + { + "epoch": 0.51, + "learning_rate": 2.549146723600251e-06, + "loss": 1.1896, + "step": 16894 + }, + { + "epoch": 0.51, + "learning_rate": 2.548902850456172e-06, + "loss": 1.1022, + "step": 16895 + }, + { + "epoch": 0.51, + "learning_rate": 2.5486589768465613e-06, + "loss": 1.0935, + "step": 16896 + }, + { + "epoch": 0.51, + "learning_rate": 2.5484151027737404e-06, + "loss": 1.1633, + "step": 16897 + }, + { + "epoch": 0.51, + "learning_rate": 2.548171228240031e-06, + "loss": 1.1556, + "step": 16898 + }, + { + "epoch": 0.51, + "learning_rate": 2.5479273532477544e-06, + "loss": 1.1531, + "step": 16899 + }, + { + "epoch": 0.51, + "learning_rate": 2.547683477799234e-06, + "loss": 1.1022, + "step": 16900 + }, + { + "epoch": 0.51, + "learning_rate": 2.5474396018967884e-06, + "loss": 1.0534, + "step": 16901 + }, + { + "epoch": 0.51, + "learning_rate": 2.547195725542741e-06, + "loss": 1.2067, + "step": 16902 + }, + { + "epoch": 0.51, + "learning_rate": 2.546951848739413e-06, + "loss": 1.1054, + "step": 16903 + }, + { + "epoch": 0.51, + "learning_rate": 2.546707971489126e-06, + "loss": 1.0269, + "step": 16904 + }, + { + "epoch": 0.51, + "learning_rate": 2.546464093794202e-06, + "loss": 1.3103, + "step": 16905 + }, + { + "epoch": 0.51, + "learning_rate": 2.5462202156569613e-06, + "loss": 1.2315, + "step": 16906 + }, + { + "epoch": 0.51, + "learning_rate": 2.5459763370797273e-06, + "loss": 0.9824, + "step": 16907 + }, + { + "epoch": 0.51, + "learning_rate": 2.5457324580648207e-06, + "loss": 1.0886, + "step": 16908 + }, + { + "epoch": 0.51, + "learning_rate": 2.545488578614563e-06, + "loss": 1.0801, + "step": 16909 + }, + { + "epoch": 0.51, + "learning_rate": 2.5452446987312757e-06, + "loss": 0.9553, + "step": 16910 + }, + { + "epoch": 0.51, + "learning_rate": 2.54500081841728e-06, + "loss": 1.1548, + "step": 16911 + }, + { + "epoch": 0.51, + "learning_rate": 2.5447569376748995e-06, + "loss": 1.1169, + "step": 16912 + }, + { + "epoch": 0.51, + "learning_rate": 2.544513056506454e-06, + "loss": 1.1281, + "step": 16913 + }, + { + "epoch": 0.51, + "learning_rate": 2.544269174914265e-06, + "loss": 1.1248, + "step": 16914 + }, + { + "epoch": 0.51, + "learning_rate": 2.544025292900656e-06, + "loss": 1.1214, + "step": 16915 + }, + { + "epoch": 0.51, + "learning_rate": 2.5437814104679465e-06, + "loss": 1.0798, + "step": 16916 + }, + { + "epoch": 0.51, + "learning_rate": 2.543537527618459e-06, + "loss": 1.1374, + "step": 16917 + }, + { + "epoch": 0.51, + "learning_rate": 2.543293644354516e-06, + "loss": 1.1172, + "step": 16918 + }, + { + "epoch": 0.51, + "learning_rate": 2.5430497606784375e-06, + "loss": 1.1245, + "step": 16919 + }, + { + "epoch": 0.51, + "learning_rate": 2.5428058765925467e-06, + "loss": 1.1091, + "step": 16920 + }, + { + "epoch": 0.51, + "learning_rate": 2.5425619920991645e-06, + "loss": 1.1342, + "step": 16921 + }, + { + "epoch": 0.51, + "learning_rate": 2.5423181072006125e-06, + "loss": 1.1647, + "step": 16922 + }, + { + "epoch": 0.51, + "learning_rate": 2.5420742218992125e-06, + "loss": 1.2114, + "step": 16923 + }, + { + "epoch": 0.51, + "learning_rate": 2.5418303361972857e-06, + "loss": 1.1112, + "step": 16924 + }, + { + "epoch": 0.51, + "learning_rate": 2.5415864500971544e-06, + "loss": 1.1374, + "step": 16925 + }, + { + "epoch": 0.51, + "learning_rate": 2.5413425636011406e-06, + "loss": 1.1655, + "step": 16926 + }, + { + "epoch": 0.51, + "learning_rate": 2.541098676711565e-06, + "loss": 1.1411, + "step": 16927 + }, + { + "epoch": 0.51, + "learning_rate": 2.5408547894307505e-06, + "loss": 1.1069, + "step": 16928 + }, + { + "epoch": 0.51, + "learning_rate": 2.5406109017610175e-06, + "loss": 1.1164, + "step": 16929 + }, + { + "epoch": 0.51, + "learning_rate": 2.540367013704688e-06, + "loss": 1.1074, + "step": 16930 + }, + { + "epoch": 0.51, + "learning_rate": 2.5401231252640845e-06, + "loss": 1.0663, + "step": 16931 + }, + { + "epoch": 0.51, + "learning_rate": 2.5398792364415283e-06, + "loss": 1.1138, + "step": 16932 + }, + { + "epoch": 0.51, + "learning_rate": 2.539635347239341e-06, + "loss": 1.1048, + "step": 16933 + }, + { + "epoch": 0.51, + "learning_rate": 2.5393914576598433e-06, + "loss": 1.0787, + "step": 16934 + }, + { + "epoch": 0.51, + "learning_rate": 2.539147567705359e-06, + "loss": 1.1334, + "step": 16935 + }, + { + "epoch": 0.51, + "learning_rate": 2.5389036773782083e-06, + "loss": 1.046, + "step": 16936 + }, + { + "epoch": 0.51, + "learning_rate": 2.5386597866807138e-06, + "loss": 1.1266, + "step": 16937 + }, + { + "epoch": 0.51, + "learning_rate": 2.538415895615196e-06, + "loss": 1.1152, + "step": 16938 + }, + { + "epoch": 0.51, + "learning_rate": 2.5381720041839774e-06, + "loss": 1.1248, + "step": 16939 + }, + { + "epoch": 0.51, + "learning_rate": 2.5379281123893796e-06, + "loss": 1.1107, + "step": 16940 + }, + { + "epoch": 0.51, + "learning_rate": 2.5376842202337254e-06, + "loss": 1.1199, + "step": 16941 + }, + { + "epoch": 0.51, + "learning_rate": 2.537440327719334e-06, + "loss": 1.1827, + "step": 16942 + }, + { + "epoch": 0.51, + "learning_rate": 2.53719643484853e-06, + "loss": 1.1319, + "step": 16943 + }, + { + "epoch": 0.51, + "learning_rate": 2.536952541623634e-06, + "loss": 1.0375, + "step": 16944 + }, + { + "epoch": 0.51, + "learning_rate": 2.5367086480469665e-06, + "loss": 1.1227, + "step": 16945 + }, + { + "epoch": 0.51, + "learning_rate": 2.5364647541208513e-06, + "loss": 1.0445, + "step": 16946 + }, + { + "epoch": 0.51, + "learning_rate": 2.536220859847609e-06, + "loss": 1.1775, + "step": 16947 + }, + { + "epoch": 0.51, + "learning_rate": 2.5359769652295617e-06, + "loss": 1.2191, + "step": 16948 + }, + { + "epoch": 0.51, + "learning_rate": 2.535733070269031e-06, + "loss": 1.0822, + "step": 16949 + }, + { + "epoch": 0.51, + "learning_rate": 2.5354891749683387e-06, + "loss": 1.0261, + "step": 16950 + }, + { + "epoch": 0.51, + "learning_rate": 2.535245279329806e-06, + "loss": 1.0534, + "step": 16951 + }, + { + "epoch": 0.51, + "learning_rate": 2.535001383355755e-06, + "loss": 1.1407, + "step": 16952 + }, + { + "epoch": 0.51, + "learning_rate": 2.534757487048508e-06, + "loss": 1.0877, + "step": 16953 + }, + { + "epoch": 0.51, + "learning_rate": 2.5345135904103875e-06, + "loss": 1.1016, + "step": 16954 + }, + { + "epoch": 0.51, + "learning_rate": 2.534269693443713e-06, + "loss": 1.1824, + "step": 16955 + }, + { + "epoch": 0.51, + "learning_rate": 2.5340257961508076e-06, + "loss": 1.1486, + "step": 16956 + }, + { + "epoch": 0.51, + "learning_rate": 2.5337818985339937e-06, + "loss": 1.1141, + "step": 16957 + }, + { + "epoch": 0.51, + "learning_rate": 2.533538000595592e-06, + "loss": 1.1543, + "step": 16958 + }, + { + "epoch": 0.51, + "learning_rate": 2.533294102337925e-06, + "loss": 1.1589, + "step": 16959 + }, + { + "epoch": 0.51, + "learning_rate": 2.5330502037633137e-06, + "loss": 1.2712, + "step": 16960 + }, + { + "epoch": 0.51, + "learning_rate": 2.532806304874081e-06, + "loss": 1.1044, + "step": 16961 + }, + { + "epoch": 0.51, + "learning_rate": 2.532562405672547e-06, + "loss": 1.2213, + "step": 16962 + }, + { + "epoch": 0.51, + "learning_rate": 2.5323185061610357e-06, + "loss": 1.1157, + "step": 16963 + }, + { + "epoch": 0.51, + "learning_rate": 2.532074606341867e-06, + "loss": 1.1951, + "step": 16964 + }, + { + "epoch": 0.51, + "learning_rate": 2.5318307062173637e-06, + "loss": 1.0406, + "step": 16965 + }, + { + "epoch": 0.51, + "learning_rate": 2.5315868057898476e-06, + "loss": 1.1169, + "step": 16966 + }, + { + "epoch": 0.51, + "learning_rate": 2.53134290506164e-06, + "loss": 1.114, + "step": 16967 + }, + { + "epoch": 0.51, + "learning_rate": 2.5310990040350638e-06, + "loss": 1.171, + "step": 16968 + }, + { + "epoch": 0.51, + "learning_rate": 2.5308551027124396e-06, + "loss": 1.025, + "step": 16969 + }, + { + "epoch": 0.51, + "learning_rate": 2.5306112010960894e-06, + "loss": 1.168, + "step": 16970 + }, + { + "epoch": 0.51, + "learning_rate": 2.5303672991883352e-06, + "loss": 1.162, + "step": 16971 + }, + { + "epoch": 0.51, + "learning_rate": 2.5301233969914994e-06, + "loss": 1.1099, + "step": 16972 + }, + { + "epoch": 0.51, + "learning_rate": 2.529879494507903e-06, + "loss": 1.1783, + "step": 16973 + }, + { + "epoch": 0.51, + "learning_rate": 2.5296355917398692e-06, + "loss": 1.1968, + "step": 16974 + }, + { + "epoch": 0.51, + "learning_rate": 2.5293916886897175e-06, + "loss": 1.0269, + "step": 16975 + }, + { + "epoch": 0.51, + "learning_rate": 2.5291477853597722e-06, + "loss": 1.1843, + "step": 16976 + }, + { + "epoch": 0.51, + "learning_rate": 2.528903881752353e-06, + "loss": 1.1017, + "step": 16977 + }, + { + "epoch": 0.51, + "learning_rate": 2.528659977869784e-06, + "loss": 1.1778, + "step": 16978 + }, + { + "epoch": 0.51, + "learning_rate": 2.5284160737143846e-06, + "loss": 1.0893, + "step": 16979 + }, + { + "epoch": 0.51, + "learning_rate": 2.528172169288478e-06, + "loss": 1.0547, + "step": 16980 + }, + { + "epoch": 0.51, + "learning_rate": 2.5279282645943863e-06, + "loss": 1.1668, + "step": 16981 + }, + { + "epoch": 0.51, + "learning_rate": 2.5276843596344316e-06, + "loss": 1.0675, + "step": 16982 + }, + { + "epoch": 0.51, + "learning_rate": 2.527440454410934e-06, + "loss": 1.0985, + "step": 16983 + }, + { + "epoch": 0.51, + "learning_rate": 2.5271965489262164e-06, + "loss": 1.1042, + "step": 16984 + }, + { + "epoch": 0.51, + "learning_rate": 2.526952643182602e-06, + "loss": 1.0486, + "step": 16985 + }, + { + "epoch": 0.51, + "learning_rate": 2.52670873718241e-06, + "loss": 1.1743, + "step": 16986 + }, + { + "epoch": 0.51, + "learning_rate": 2.526464830927965e-06, + "loss": 1.2026, + "step": 16987 + }, + { + "epoch": 0.51, + "learning_rate": 2.5262209244215867e-06, + "loss": 1.1415, + "step": 16988 + }, + { + "epoch": 0.51, + "learning_rate": 2.5259770176655985e-06, + "loss": 1.0746, + "step": 16989 + }, + { + "epoch": 0.51, + "learning_rate": 2.5257331106623207e-06, + "loss": 1.0357, + "step": 16990 + }, + { + "epoch": 0.51, + "learning_rate": 2.5254892034140773e-06, + "loss": 1.2034, + "step": 16991 + }, + { + "epoch": 0.51, + "learning_rate": 2.5252452959231876e-06, + "loss": 1.1888, + "step": 16992 + }, + { + "epoch": 0.51, + "learning_rate": 2.5250013881919757e-06, + "loss": 1.153, + "step": 16993 + }, + { + "epoch": 0.51, + "learning_rate": 2.524757480222762e-06, + "loss": 1.1208, + "step": 16994 + }, + { + "epoch": 0.51, + "learning_rate": 2.5245135720178697e-06, + "loss": 1.0938, + "step": 16995 + }, + { + "epoch": 0.51, + "learning_rate": 2.5242696635796194e-06, + "loss": 1.0666, + "step": 16996 + }, + { + "epoch": 0.51, + "learning_rate": 2.5240257549103338e-06, + "loss": 1.082, + "step": 16997 + }, + { + "epoch": 0.51, + "learning_rate": 2.523781846012335e-06, + "loss": 1.1357, + "step": 16998 + }, + { + "epoch": 0.51, + "learning_rate": 2.523537936887944e-06, + "loss": 1.0784, + "step": 16999 + }, + { + "epoch": 0.51, + "learning_rate": 2.5232940275394834e-06, + "loss": 1.2315, + "step": 17000 + }, + { + "epoch": 0.51, + "learning_rate": 2.5230501179692744e-06, + "loss": 1.1, + "step": 17001 + }, + { + "epoch": 0.51, + "learning_rate": 2.5228062081796407e-06, + "loss": 1.0867, + "step": 17002 + }, + { + "epoch": 0.51, + "learning_rate": 2.5225622981729015e-06, + "loss": 1.1824, + "step": 17003 + }, + { + "epoch": 0.51, + "learning_rate": 2.522318387951381e-06, + "loss": 1.1926, + "step": 17004 + }, + { + "epoch": 0.51, + "learning_rate": 2.5220744775173995e-06, + "loss": 1.2289, + "step": 17005 + }, + { + "epoch": 0.51, + "learning_rate": 2.5218305668732794e-06, + "loss": 1.2656, + "step": 17006 + }, + { + "epoch": 0.51, + "learning_rate": 2.521586656021343e-06, + "loss": 1.0867, + "step": 17007 + }, + { + "epoch": 0.51, + "learning_rate": 2.521342744963913e-06, + "loss": 1.1058, + "step": 17008 + }, + { + "epoch": 0.51, + "learning_rate": 2.5210988337033094e-06, + "loss": 1.0232, + "step": 17009 + }, + { + "epoch": 0.51, + "learning_rate": 2.520854922241855e-06, + "loss": 1.1808, + "step": 17010 + }, + { + "epoch": 0.51, + "learning_rate": 2.5206110105818722e-06, + "loss": 1.1791, + "step": 17011 + }, + { + "epoch": 0.51, + "learning_rate": 2.5203670987256823e-06, + "loss": 1.213, + "step": 17012 + }, + { + "epoch": 0.51, + "learning_rate": 2.520123186675608e-06, + "loss": 1.1181, + "step": 17013 + }, + { + "epoch": 0.51, + "learning_rate": 2.51987927443397e-06, + "loss": 0.9908, + "step": 17014 + }, + { + "epoch": 0.51, + "learning_rate": 2.519635362003091e-06, + "loss": 1.1505, + "step": 17015 + }, + { + "epoch": 0.51, + "learning_rate": 2.5193914493852926e-06, + "loss": 0.979, + "step": 17016 + }, + { + "epoch": 0.51, + "learning_rate": 2.519147536582898e-06, + "loss": 1.1735, + "step": 17017 + }, + { + "epoch": 0.51, + "learning_rate": 2.5189036235982266e-06, + "loss": 1.1096, + "step": 17018 + }, + { + "epoch": 0.51, + "learning_rate": 2.518659710433603e-06, + "loss": 1.0631, + "step": 17019 + }, + { + "epoch": 0.51, + "learning_rate": 2.5184157970913473e-06, + "loss": 1.1489, + "step": 17020 + }, + { + "epoch": 0.51, + "learning_rate": 2.5181718835737823e-06, + "loss": 1.1761, + "step": 17021 + }, + { + "epoch": 0.51, + "learning_rate": 2.5179279698832294e-06, + "loss": 1.1949, + "step": 17022 + }, + { + "epoch": 0.51, + "learning_rate": 2.517684056022011e-06, + "loss": 1.094, + "step": 17023 + }, + { + "epoch": 0.51, + "learning_rate": 2.5174401419924495e-06, + "loss": 1.1719, + "step": 17024 + }, + { + "epoch": 0.51, + "learning_rate": 2.5171962277968655e-06, + "loss": 1.1203, + "step": 17025 + }, + { + "epoch": 0.51, + "learning_rate": 2.516952313437582e-06, + "loss": 1.1163, + "step": 17026 + }, + { + "epoch": 0.51, + "learning_rate": 2.5167083989169205e-06, + "loss": 1.1281, + "step": 17027 + }, + { + "epoch": 0.51, + "learning_rate": 2.5164644842372034e-06, + "loss": 0.9786, + "step": 17028 + }, + { + "epoch": 0.51, + "learning_rate": 2.5162205694007517e-06, + "loss": 1.0874, + "step": 17029 + }, + { + "epoch": 0.51, + "learning_rate": 2.515976654409889e-06, + "loss": 1.1829, + "step": 17030 + }, + { + "epoch": 0.51, + "learning_rate": 2.5157327392669354e-06, + "loss": 1.2039, + "step": 17031 + }, + { + "epoch": 0.51, + "learning_rate": 2.515488823974214e-06, + "loss": 1.1813, + "step": 17032 + }, + { + "epoch": 0.51, + "learning_rate": 2.515244908534046e-06, + "loss": 1.0935, + "step": 17033 + }, + { + "epoch": 0.51, + "learning_rate": 2.5150009929487547e-06, + "loss": 1.017, + "step": 17034 + }, + { + "epoch": 0.51, + "learning_rate": 2.5147570772206602e-06, + "loss": 1.1797, + "step": 17035 + }, + { + "epoch": 0.51, + "learning_rate": 2.5145131613520858e-06, + "loss": 1.1468, + "step": 17036 + }, + { + "epoch": 0.51, + "learning_rate": 2.514269245345354e-06, + "loss": 1.0556, + "step": 17037 + }, + { + "epoch": 0.51, + "learning_rate": 2.514025329202784e-06, + "loss": 1.2632, + "step": 17038 + }, + { + "epoch": 0.51, + "learning_rate": 2.5137814129267014e-06, + "loss": 1.1869, + "step": 17039 + }, + { + "epoch": 0.51, + "learning_rate": 2.5135374965194254e-06, + "loss": 1.1, + "step": 17040 + }, + { + "epoch": 0.51, + "learning_rate": 2.5132935799832797e-06, + "loss": 1.1628, + "step": 17041 + }, + { + "epoch": 0.51, + "learning_rate": 2.5130496633205848e-06, + "loss": 1.1387, + "step": 17042 + }, + { + "epoch": 0.51, + "learning_rate": 2.512805746533664e-06, + "loss": 1.0894, + "step": 17043 + }, + { + "epoch": 0.51, + "learning_rate": 2.5125618296248382e-06, + "loss": 1.1796, + "step": 17044 + }, + { + "epoch": 0.51, + "learning_rate": 2.5123179125964305e-06, + "loss": 1.0958, + "step": 17045 + }, + { + "epoch": 0.51, + "learning_rate": 2.512073995450761e-06, + "loss": 1.124, + "step": 17046 + }, + { + "epoch": 0.51, + "learning_rate": 2.5118300781901533e-06, + "loss": 1.1486, + "step": 17047 + }, + { + "epoch": 0.51, + "learning_rate": 2.511586160816929e-06, + "loss": 1.173, + "step": 17048 + }, + { + "epoch": 0.51, + "learning_rate": 2.5113422433334104e-06, + "loss": 1.1555, + "step": 17049 + }, + { + "epoch": 0.51, + "learning_rate": 2.5110983257419193e-06, + "loss": 1.081, + "step": 17050 + }, + { + "epoch": 0.51, + "learning_rate": 2.5108544080447765e-06, + "loss": 1.0911, + "step": 17051 + }, + { + "epoch": 0.51, + "learning_rate": 2.5106104902443058e-06, + "loss": 1.1516, + "step": 17052 + }, + { + "epoch": 0.51, + "learning_rate": 2.5103665723428277e-06, + "loss": 1.0676, + "step": 17053 + }, + { + "epoch": 0.51, + "learning_rate": 2.510122654342666e-06, + "loss": 1.1047, + "step": 17054 + }, + { + "epoch": 0.51, + "learning_rate": 2.5098787362461404e-06, + "loss": 1.2327, + "step": 17055 + }, + { + "epoch": 0.51, + "learning_rate": 2.5096348180555746e-06, + "loss": 1.0649, + "step": 17056 + }, + { + "epoch": 0.51, + "learning_rate": 2.5093908997732896e-06, + "loss": 1.1119, + "step": 17057 + }, + { + "epoch": 0.51, + "learning_rate": 2.5091469814016083e-06, + "loss": 1.207, + "step": 17058 + }, + { + "epoch": 0.51, + "learning_rate": 2.508903062942851e-06, + "loss": 1.1956, + "step": 17059 + }, + { + "epoch": 0.51, + "learning_rate": 2.5086591443993424e-06, + "loss": 1.1059, + "step": 17060 + }, + { + "epoch": 0.51, + "learning_rate": 2.5084152257734017e-06, + "loss": 1.1335, + "step": 17061 + }, + { + "epoch": 0.51, + "learning_rate": 2.508171307067352e-06, + "loss": 1.1281, + "step": 17062 + }, + { + "epoch": 0.51, + "learning_rate": 2.507927388283516e-06, + "loss": 1.1174, + "step": 17063 + }, + { + "epoch": 0.51, + "learning_rate": 2.5076834694242146e-06, + "loss": 1.1299, + "step": 17064 + }, + { + "epoch": 0.51, + "learning_rate": 2.507439550491771e-06, + "loss": 1.1873, + "step": 17065 + }, + { + "epoch": 0.51, + "learning_rate": 2.5071956314885053e-06, + "loss": 1.2175, + "step": 17066 + }, + { + "epoch": 0.51, + "learning_rate": 2.506951712416742e-06, + "loss": 1.1121, + "step": 17067 + }, + { + "epoch": 0.51, + "learning_rate": 2.5067077932788008e-06, + "loss": 1.1132, + "step": 17068 + }, + { + "epoch": 0.51, + "learning_rate": 2.506463874077005e-06, + "loss": 1.1852, + "step": 17069 + }, + { + "epoch": 0.51, + "learning_rate": 2.5062199548136768e-06, + "loss": 1.0906, + "step": 17070 + }, + { + "epoch": 0.51, + "learning_rate": 2.505976035491137e-06, + "loss": 1.0402, + "step": 17071 + }, + { + "epoch": 0.51, + "learning_rate": 2.505732116111708e-06, + "loss": 0.9911, + "step": 17072 + }, + { + "epoch": 0.51, + "learning_rate": 2.5054881966777127e-06, + "loss": 1.0978, + "step": 17073 + }, + { + "epoch": 0.51, + "learning_rate": 2.505244277191472e-06, + "loss": 1.3107, + "step": 17074 + }, + { + "epoch": 0.51, + "learning_rate": 2.505000357655308e-06, + "loss": 1.1939, + "step": 17075 + }, + { + "epoch": 0.51, + "learning_rate": 2.504756438071543e-06, + "loss": 1.1889, + "step": 17076 + }, + { + "epoch": 0.51, + "learning_rate": 2.504512518442499e-06, + "loss": 1.1443, + "step": 17077 + }, + { + "epoch": 0.51, + "learning_rate": 2.504268598770499e-06, + "loss": 1.0928, + "step": 17078 + }, + { + "epoch": 0.51, + "learning_rate": 2.5040246790578624e-06, + "loss": 1.1179, + "step": 17079 + }, + { + "epoch": 0.51, + "learning_rate": 2.5037807593069146e-06, + "loss": 1.1792, + "step": 17080 + }, + { + "epoch": 0.51, + "learning_rate": 2.503536839519974e-06, + "loss": 1.1233, + "step": 17081 + }, + { + "epoch": 0.51, + "learning_rate": 2.503292919699366e-06, + "loss": 1.166, + "step": 17082 + }, + { + "epoch": 0.51, + "learning_rate": 2.50304899984741e-06, + "loss": 1.1432, + "step": 17083 + }, + { + "epoch": 0.51, + "learning_rate": 2.5028050799664298e-06, + "loss": 1.1161, + "step": 17084 + }, + { + "epoch": 0.51, + "learning_rate": 2.5025611600587457e-06, + "loss": 1.0863, + "step": 17085 + }, + { + "epoch": 0.51, + "learning_rate": 2.5023172401266814e-06, + "loss": 1.1523, + "step": 17086 + }, + { + "epoch": 0.51, + "learning_rate": 2.502073320172557e-06, + "loss": 1.1868, + "step": 17087 + }, + { + "epoch": 0.51, + "learning_rate": 2.5018294001986964e-06, + "loss": 1.1208, + "step": 17088 + }, + { + "epoch": 0.51, + "learning_rate": 2.5015854802074203e-06, + "loss": 1.2918, + "step": 17089 + }, + { + "epoch": 0.51, + "learning_rate": 2.5013415602010514e-06, + "loss": 1.0529, + "step": 17090 + }, + { + "epoch": 0.51, + "learning_rate": 2.501097640181912e-06, + "loss": 1.0916, + "step": 17091 + }, + { + "epoch": 0.51, + "learning_rate": 2.500853720152323e-06, + "loss": 1.2014, + "step": 17092 + }, + { + "epoch": 0.51, + "learning_rate": 2.500609800114607e-06, + "loss": 1.1454, + "step": 17093 + }, + { + "epoch": 0.51, + "learning_rate": 2.500365880071086e-06, + "loss": 1.1411, + "step": 17094 + }, + { + "epoch": 0.51, + "learning_rate": 2.500121960024083e-06, + "loss": 1.1296, + "step": 17095 + }, + { + "epoch": 0.52, + "learning_rate": 2.499878039975918e-06, + "loss": 1.067, + "step": 17096 + }, + { + "epoch": 0.52, + "learning_rate": 2.499634119928914e-06, + "loss": 1.023, + "step": 17097 + }, + { + "epoch": 0.52, + "learning_rate": 2.499390199885394e-06, + "loss": 1.1268, + "step": 17098 + }, + { + "epoch": 0.52, + "learning_rate": 2.4991462798476777e-06, + "loss": 1.1094, + "step": 17099 + }, + { + "epoch": 0.52, + "learning_rate": 2.498902359818089e-06, + "loss": 1.1359, + "step": 17100 + }, + { + "epoch": 0.52, + "learning_rate": 2.498658439798949e-06, + "loss": 1.1796, + "step": 17101 + }, + { + "epoch": 0.52, + "learning_rate": 2.49841451979258e-06, + "loss": 1.1571, + "step": 17102 + }, + { + "epoch": 0.52, + "learning_rate": 2.4981705998013044e-06, + "loss": 1.185, + "step": 17103 + }, + { + "epoch": 0.52, + "learning_rate": 2.4979266798274433e-06, + "loss": 1.097, + "step": 17104 + }, + { + "epoch": 0.52, + "learning_rate": 2.4976827598733194e-06, + "loss": 1.243, + "step": 17105 + }, + { + "epoch": 0.52, + "learning_rate": 2.4974388399412543e-06, + "loss": 1.0846, + "step": 17106 + }, + { + "epoch": 0.52, + "learning_rate": 2.4971949200335715e-06, + "loss": 1.0538, + "step": 17107 + }, + { + "epoch": 0.52, + "learning_rate": 2.4969510001525906e-06, + "loss": 1.1873, + "step": 17108 + }, + { + "epoch": 0.52, + "learning_rate": 2.4967070803006345e-06, + "loss": 1.1156, + "step": 17109 + }, + { + "epoch": 0.52, + "learning_rate": 2.4964631604800258e-06, + "loss": 1.1785, + "step": 17110 + }, + { + "epoch": 0.52, + "learning_rate": 2.4962192406930867e-06, + "loss": 1.1476, + "step": 17111 + }, + { + "epoch": 0.52, + "learning_rate": 2.495975320942138e-06, + "loss": 1.2319, + "step": 17112 + }, + { + "epoch": 0.52, + "learning_rate": 2.495731401229502e-06, + "loss": 1.2013, + "step": 17113 + }, + { + "epoch": 0.52, + "learning_rate": 2.4954874815575013e-06, + "loss": 1.1197, + "step": 17114 + }, + { + "epoch": 0.52, + "learning_rate": 2.4952435619284576e-06, + "loss": 1.1794, + "step": 17115 + }, + { + "epoch": 0.52, + "learning_rate": 2.494999642344693e-06, + "loss": 1.0235, + "step": 17116 + }, + { + "epoch": 0.52, + "learning_rate": 2.494755722808529e-06, + "loss": 1.1246, + "step": 17117 + }, + { + "epoch": 0.52, + "learning_rate": 2.4945118033222877e-06, + "loss": 1.06, + "step": 17118 + }, + { + "epoch": 0.52, + "learning_rate": 2.494267883888292e-06, + "loss": 1.1363, + "step": 17119 + }, + { + "epoch": 0.52, + "learning_rate": 2.4940239645088642e-06, + "loss": 1.1454, + "step": 17120 + }, + { + "epoch": 0.52, + "learning_rate": 2.493780045186324e-06, + "loss": 1.1636, + "step": 17121 + }, + { + "epoch": 0.52, + "learning_rate": 2.4935361259229953e-06, + "loss": 1.0588, + "step": 17122 + }, + { + "epoch": 0.52, + "learning_rate": 2.4932922067211992e-06, + "loss": 1.2533, + "step": 17123 + }, + { + "epoch": 0.52, + "learning_rate": 2.4930482875832593e-06, + "loss": 1.285, + "step": 17124 + }, + { + "epoch": 0.52, + "learning_rate": 2.492804368511495e-06, + "loss": 1.1109, + "step": 17125 + }, + { + "epoch": 0.52, + "learning_rate": 2.49256044950823e-06, + "loss": 1.0671, + "step": 17126 + }, + { + "epoch": 0.52, + "learning_rate": 2.4923165305757858e-06, + "loss": 1.1245, + "step": 17127 + }, + { + "epoch": 0.52, + "learning_rate": 2.492072611716485e-06, + "loss": 1.1021, + "step": 17128 + }, + { + "epoch": 0.52, + "learning_rate": 2.4918286929326484e-06, + "loss": 1.0483, + "step": 17129 + }, + { + "epoch": 0.52, + "learning_rate": 2.491584774226599e-06, + "loss": 1.2739, + "step": 17130 + }, + { + "epoch": 0.52, + "learning_rate": 2.4913408556006584e-06, + "loss": 1.095, + "step": 17131 + }, + { + "epoch": 0.52, + "learning_rate": 2.4910969370571493e-06, + "loss": 1.093, + "step": 17132 + }, + { + "epoch": 0.52, + "learning_rate": 2.490853018598393e-06, + "loss": 1.0969, + "step": 17133 + }, + { + "epoch": 0.52, + "learning_rate": 2.4906091002267112e-06, + "loss": 1.1328, + "step": 17134 + }, + { + "epoch": 0.52, + "learning_rate": 2.490365181944426e-06, + "loss": 1.0925, + "step": 17135 + }, + { + "epoch": 0.52, + "learning_rate": 2.4901212637538596e-06, + "loss": 1.1551, + "step": 17136 + }, + { + "epoch": 0.52, + "learning_rate": 2.4898773456573352e-06, + "loss": 1.0383, + "step": 17137 + }, + { + "epoch": 0.52, + "learning_rate": 2.4896334276571727e-06, + "loss": 1.1705, + "step": 17138 + }, + { + "epoch": 0.52, + "learning_rate": 2.4893895097556946e-06, + "loss": 1.1861, + "step": 17139 + }, + { + "epoch": 0.52, + "learning_rate": 2.489145591955224e-06, + "loss": 1.0635, + "step": 17140 + }, + { + "epoch": 0.52, + "learning_rate": 2.488901674258082e-06, + "loss": 1.11, + "step": 17141 + }, + { + "epoch": 0.52, + "learning_rate": 2.48865775666659e-06, + "loss": 1.1197, + "step": 17142 + }, + { + "epoch": 0.52, + "learning_rate": 2.488413839183072e-06, + "loss": 1.2203, + "step": 17143 + }, + { + "epoch": 0.52, + "learning_rate": 2.488169921809847e-06, + "loss": 1.0547, + "step": 17144 + }, + { + "epoch": 0.52, + "learning_rate": 2.4879260045492397e-06, + "loss": 1.1157, + "step": 17145 + }, + { + "epoch": 0.52, + "learning_rate": 2.4876820874035712e-06, + "loss": 1.2139, + "step": 17146 + }, + { + "epoch": 0.52, + "learning_rate": 2.4874381703751626e-06, + "loss": 1.1204, + "step": 17147 + }, + { + "epoch": 0.52, + "learning_rate": 2.487194253466337e-06, + "loss": 1.1906, + "step": 17148 + }, + { + "epoch": 0.52, + "learning_rate": 2.486950336679415e-06, + "loss": 1.2451, + "step": 17149 + }, + { + "epoch": 0.52, + "learning_rate": 2.4867064200167215e-06, + "loss": 1.1364, + "step": 17150 + }, + { + "epoch": 0.52, + "learning_rate": 2.4864625034805754e-06, + "loss": 1.2474, + "step": 17151 + }, + { + "epoch": 0.52, + "learning_rate": 2.4862185870732995e-06, + "loss": 1.1098, + "step": 17152 + }, + { + "epoch": 0.52, + "learning_rate": 2.4859746707972158e-06, + "loss": 1.0969, + "step": 17153 + }, + { + "epoch": 0.52, + "learning_rate": 2.4857307546546478e-06, + "loss": 1.1965, + "step": 17154 + }, + { + "epoch": 0.52, + "learning_rate": 2.485486838647915e-06, + "loss": 1.3315, + "step": 17155 + }, + { + "epoch": 0.52, + "learning_rate": 2.48524292277934e-06, + "loss": 1.0782, + "step": 17156 + }, + { + "epoch": 0.52, + "learning_rate": 2.484999007051246e-06, + "loss": 1.1865, + "step": 17157 + }, + { + "epoch": 0.52, + "learning_rate": 2.4847550914659543e-06, + "loss": 1.0425, + "step": 17158 + }, + { + "epoch": 0.52, + "learning_rate": 2.484511176025787e-06, + "loss": 1.1065, + "step": 17159 + }, + { + "epoch": 0.52, + "learning_rate": 2.4842672607330654e-06, + "loss": 1.1662, + "step": 17160 + }, + { + "epoch": 0.52, + "learning_rate": 2.4840233455901115e-06, + "loss": 1.1406, + "step": 17161 + }, + { + "epoch": 0.52, + "learning_rate": 2.4837794305992482e-06, + "loss": 1.2125, + "step": 17162 + }, + { + "epoch": 0.52, + "learning_rate": 2.483535515762798e-06, + "loss": 1.0969, + "step": 17163 + }, + { + "epoch": 0.52, + "learning_rate": 2.4832916010830803e-06, + "loss": 1.1201, + "step": 17164 + }, + { + "epoch": 0.52, + "learning_rate": 2.4830476865624186e-06, + "loss": 1.2188, + "step": 17165 + }, + { + "epoch": 0.52, + "learning_rate": 2.482803772203135e-06, + "loss": 1.1121, + "step": 17166 + }, + { + "epoch": 0.52, + "learning_rate": 2.482559858007552e-06, + "loss": 1.1667, + "step": 17167 + }, + { + "epoch": 0.52, + "learning_rate": 2.4823159439779896e-06, + "loss": 1.039, + "step": 17168 + }, + { + "epoch": 0.52, + "learning_rate": 2.4820720301167714e-06, + "loss": 1.2355, + "step": 17169 + }, + { + "epoch": 0.52, + "learning_rate": 2.4818281164262185e-06, + "loss": 1.1494, + "step": 17170 + }, + { + "epoch": 0.52, + "learning_rate": 2.481584202908653e-06, + "loss": 1.1169, + "step": 17171 + }, + { + "epoch": 0.52, + "learning_rate": 2.481340289566398e-06, + "loss": 1.0823, + "step": 17172 + }, + { + "epoch": 0.52, + "learning_rate": 2.481096376401774e-06, + "loss": 1.1196, + "step": 17173 + }, + { + "epoch": 0.52, + "learning_rate": 2.4808524634171026e-06, + "loss": 1.1756, + "step": 17174 + }, + { + "epoch": 0.52, + "learning_rate": 2.4806085506147074e-06, + "loss": 1.0296, + "step": 17175 + }, + { + "epoch": 0.52, + "learning_rate": 2.48036463799691e-06, + "loss": 0.9722, + "step": 17176 + }, + { + "epoch": 0.52, + "learning_rate": 2.480120725566031e-06, + "loss": 1.2164, + "step": 17177 + }, + { + "epoch": 0.52, + "learning_rate": 2.4798768133243927e-06, + "loss": 1.1415, + "step": 17178 + }, + { + "epoch": 0.52, + "learning_rate": 2.4796329012743177e-06, + "loss": 1.179, + "step": 17179 + }, + { + "epoch": 0.52, + "learning_rate": 2.479388989418129e-06, + "loss": 1.0905, + "step": 17180 + }, + { + "epoch": 0.52, + "learning_rate": 2.4791450777581458e-06, + "loss": 1.0773, + "step": 17181 + }, + { + "epoch": 0.52, + "learning_rate": 2.478901166296692e-06, + "loss": 1.1782, + "step": 17182 + }, + { + "epoch": 0.52, + "learning_rate": 2.478657255036088e-06, + "loss": 1.1432, + "step": 17183 + }, + { + "epoch": 0.52, + "learning_rate": 2.478413343978657e-06, + "loss": 1.0897, + "step": 17184 + }, + { + "epoch": 0.52, + "learning_rate": 2.478169433126721e-06, + "loss": 1.144, + "step": 17185 + }, + { + "epoch": 0.52, + "learning_rate": 2.4779255224826013e-06, + "loss": 1.201, + "step": 17186 + }, + { + "epoch": 0.52, + "learning_rate": 2.47768161204862e-06, + "loss": 1.0972, + "step": 17187 + }, + { + "epoch": 0.52, + "learning_rate": 2.4774377018270985e-06, + "loss": 1.1005, + "step": 17188 + }, + { + "epoch": 0.52, + "learning_rate": 2.477193791820361e-06, + "loss": 1.1873, + "step": 17189 + }, + { + "epoch": 0.52, + "learning_rate": 2.476949882030726e-06, + "loss": 1.0564, + "step": 17190 + }, + { + "epoch": 0.52, + "learning_rate": 2.476705972460517e-06, + "loss": 1.1544, + "step": 17191 + }, + { + "epoch": 0.52, + "learning_rate": 2.4764620631120566e-06, + "loss": 1.1629, + "step": 17192 + }, + { + "epoch": 0.52, + "learning_rate": 2.4762181539876665e-06, + "loss": 1.1143, + "step": 17193 + }, + { + "epoch": 0.52, + "learning_rate": 2.475974245089667e-06, + "loss": 1.2502, + "step": 17194 + }, + { + "epoch": 0.52, + "learning_rate": 2.4757303364203814e-06, + "loss": 1.1193, + "step": 17195 + }, + { + "epoch": 0.52, + "learning_rate": 2.475486427982131e-06, + "loss": 1.1323, + "step": 17196 + }, + { + "epoch": 0.52, + "learning_rate": 2.4752425197772385e-06, + "loss": 1.195, + "step": 17197 + }, + { + "epoch": 0.52, + "learning_rate": 2.474998611808025e-06, + "loss": 1.2512, + "step": 17198 + }, + { + "epoch": 0.52, + "learning_rate": 2.474754704076813e-06, + "loss": 1.1136, + "step": 17199 + }, + { + "epoch": 0.52, + "learning_rate": 2.4745107965859236e-06, + "loss": 1.0002, + "step": 17200 + }, + { + "epoch": 0.52, + "learning_rate": 2.4742668893376792e-06, + "loss": 1.1336, + "step": 17201 + }, + { + "epoch": 0.52, + "learning_rate": 2.4740229823344028e-06, + "loss": 1.1246, + "step": 17202 + }, + { + "epoch": 0.52, + "learning_rate": 2.473779075578414e-06, + "loss": 1.1024, + "step": 17203 + }, + { + "epoch": 0.52, + "learning_rate": 2.4735351690720356e-06, + "loss": 1.0571, + "step": 17204 + }, + { + "epoch": 0.52, + "learning_rate": 2.4732912628175896e-06, + "loss": 0.9731, + "step": 17205 + }, + { + "epoch": 0.52, + "learning_rate": 2.4730473568173996e-06, + "loss": 1.1721, + "step": 17206 + }, + { + "epoch": 0.52, + "learning_rate": 2.472803451073784e-06, + "loss": 1.0867, + "step": 17207 + }, + { + "epoch": 0.52, + "learning_rate": 2.472559545589067e-06, + "loss": 1.1024, + "step": 17208 + }, + { + "epoch": 0.52, + "learning_rate": 2.4723156403655697e-06, + "loss": 1.0591, + "step": 17209 + }, + { + "epoch": 0.52, + "learning_rate": 2.472071735405614e-06, + "loss": 1.0477, + "step": 17210 + }, + { + "epoch": 0.52, + "learning_rate": 2.4718278307115226e-06, + "loss": 1.1089, + "step": 17211 + }, + { + "epoch": 0.52, + "learning_rate": 2.4715839262856162e-06, + "loss": 1.0873, + "step": 17212 + }, + { + "epoch": 0.52, + "learning_rate": 2.471340022130217e-06, + "loss": 1.205, + "step": 17213 + }, + { + "epoch": 0.52, + "learning_rate": 2.4710961182476475e-06, + "loss": 1.1162, + "step": 17214 + }, + { + "epoch": 0.52, + "learning_rate": 2.470852214640229e-06, + "loss": 1.1107, + "step": 17215 + }, + { + "epoch": 0.52, + "learning_rate": 2.470608311310283e-06, + "loss": 1.136, + "step": 17216 + }, + { + "epoch": 0.52, + "learning_rate": 2.4703644082601316e-06, + "loss": 1.1985, + "step": 17217 + }, + { + "epoch": 0.52, + "learning_rate": 2.470120505492097e-06, + "loss": 1.2045, + "step": 17218 + }, + { + "epoch": 0.52, + "learning_rate": 2.469876603008502e-06, + "loss": 1.1392, + "step": 17219 + }, + { + "epoch": 0.52, + "learning_rate": 2.4696327008116656e-06, + "loss": 1.0344, + "step": 17220 + }, + { + "epoch": 0.52, + "learning_rate": 2.4693887989039115e-06, + "loss": 1.1394, + "step": 17221 + }, + { + "epoch": 0.52, + "learning_rate": 2.4691448972875612e-06, + "loss": 1.1363, + "step": 17222 + }, + { + "epoch": 0.52, + "learning_rate": 2.4689009959649366e-06, + "loss": 1.1039, + "step": 17223 + }, + { + "epoch": 0.52, + "learning_rate": 2.4686570949383602e-06, + "loss": 1.186, + "step": 17224 + }, + { + "epoch": 0.52, + "learning_rate": 2.4684131942101533e-06, + "loss": 1.2017, + "step": 17225 + }, + { + "epoch": 0.52, + "learning_rate": 2.468169293782637e-06, + "loss": 1.1057, + "step": 17226 + }, + { + "epoch": 0.52, + "learning_rate": 2.4679253936581334e-06, + "loss": 1.1792, + "step": 17227 + }, + { + "epoch": 0.52, + "learning_rate": 2.4676814938389656e-06, + "loss": 1.0149, + "step": 17228 + }, + { + "epoch": 0.52, + "learning_rate": 2.4674375943274537e-06, + "loss": 1.131, + "step": 17229 + }, + { + "epoch": 0.52, + "learning_rate": 2.4671936951259203e-06, + "loss": 1.1342, + "step": 17230 + }, + { + "epoch": 0.52, + "learning_rate": 2.4669497962366867e-06, + "loss": 1.0499, + "step": 17231 + }, + { + "epoch": 0.52, + "learning_rate": 2.4667058976620762e-06, + "loss": 1.2874, + "step": 17232 + }, + { + "epoch": 0.52, + "learning_rate": 2.466461999404409e-06, + "loss": 1.0408, + "step": 17233 + }, + { + "epoch": 0.52, + "learning_rate": 2.466218101466007e-06, + "loss": 1.0289, + "step": 17234 + }, + { + "epoch": 0.52, + "learning_rate": 2.4659742038491928e-06, + "loss": 1.1442, + "step": 17235 + }, + { + "epoch": 0.52, + "learning_rate": 2.465730306556287e-06, + "loss": 1.2563, + "step": 17236 + }, + { + "epoch": 0.52, + "learning_rate": 2.4654864095896142e-06, + "loss": 1.168, + "step": 17237 + }, + { + "epoch": 0.52, + "learning_rate": 2.4652425129514926e-06, + "loss": 1.0223, + "step": 17238 + }, + { + "epoch": 0.52, + "learning_rate": 2.4649986166442454e-06, + "loss": 1.1225, + "step": 17239 + }, + { + "epoch": 0.52, + "learning_rate": 2.464754720670195e-06, + "loss": 1.1268, + "step": 17240 + }, + { + "epoch": 0.52, + "learning_rate": 2.4645108250316626e-06, + "loss": 1.139, + "step": 17241 + }, + { + "epoch": 0.52, + "learning_rate": 2.46426692973097e-06, + "loss": 1.1687, + "step": 17242 + }, + { + "epoch": 0.52, + "learning_rate": 2.4640230347704387e-06, + "loss": 1.0828, + "step": 17243 + }, + { + "epoch": 0.52, + "learning_rate": 2.463779140152391e-06, + "loss": 1.1186, + "step": 17244 + }, + { + "epoch": 0.52, + "learning_rate": 2.4635352458791495e-06, + "loss": 1.1313, + "step": 17245 + }, + { + "epoch": 0.52, + "learning_rate": 2.463291351953034e-06, + "loss": 1.0878, + "step": 17246 + }, + { + "epoch": 0.52, + "learning_rate": 2.4630474583763668e-06, + "loss": 1.0933, + "step": 17247 + }, + { + "epoch": 0.52, + "learning_rate": 2.46280356515147e-06, + "loss": 1.2039, + "step": 17248 + }, + { + "epoch": 0.52, + "learning_rate": 2.4625596722806654e-06, + "loss": 1.1826, + "step": 17249 + }, + { + "epoch": 0.52, + "learning_rate": 2.4623157797662763e-06, + "loss": 1.1325, + "step": 17250 + }, + { + "epoch": 0.52, + "learning_rate": 2.462071887610621e-06, + "loss": 1.141, + "step": 17251 + }, + { + "epoch": 0.52, + "learning_rate": 2.4618279958160234e-06, + "loss": 1.0182, + "step": 17252 + }, + { + "epoch": 0.52, + "learning_rate": 2.4615841043848047e-06, + "loss": 1.1373, + "step": 17253 + }, + { + "epoch": 0.52, + "learning_rate": 2.4613402133192875e-06, + "loss": 1.1535, + "step": 17254 + }, + { + "epoch": 0.52, + "learning_rate": 2.4610963226217925e-06, + "loss": 1.1138, + "step": 17255 + }, + { + "epoch": 0.52, + "learning_rate": 2.4608524322946415e-06, + "loss": 1.0546, + "step": 17256 + }, + { + "epoch": 0.52, + "learning_rate": 2.4606085423401566e-06, + "loss": 1.1622, + "step": 17257 + }, + { + "epoch": 0.52, + "learning_rate": 2.4603646527606604e-06, + "loss": 1.105, + "step": 17258 + }, + { + "epoch": 0.52, + "learning_rate": 2.4601207635584725e-06, + "loss": 1.0358, + "step": 17259 + }, + { + "epoch": 0.52, + "learning_rate": 2.4598768747359163e-06, + "loss": 1.1511, + "step": 17260 + }, + { + "epoch": 0.52, + "learning_rate": 2.4596329862953123e-06, + "loss": 1.0805, + "step": 17261 + }, + { + "epoch": 0.52, + "learning_rate": 2.459389098238983e-06, + "loss": 1.1448, + "step": 17262 + }, + { + "epoch": 0.52, + "learning_rate": 2.459145210569251e-06, + "loss": 1.0855, + "step": 17263 + }, + { + "epoch": 0.52, + "learning_rate": 2.4589013232884356e-06, + "loss": 1.07, + "step": 17264 + }, + { + "epoch": 0.52, + "learning_rate": 2.4586574363988602e-06, + "loss": 1.1379, + "step": 17265 + }, + { + "epoch": 0.52, + "learning_rate": 2.4584135499028456e-06, + "loss": 1.2043, + "step": 17266 + }, + { + "epoch": 0.52, + "learning_rate": 2.458169663802715e-06, + "loss": 1.129, + "step": 17267 + }, + { + "epoch": 0.52, + "learning_rate": 2.4579257781007884e-06, + "loss": 1.1539, + "step": 17268 + }, + { + "epoch": 0.52, + "learning_rate": 2.457681892799388e-06, + "loss": 1.2358, + "step": 17269 + }, + { + "epoch": 0.52, + "learning_rate": 2.457438007900836e-06, + "loss": 1.1309, + "step": 17270 + }, + { + "epoch": 0.52, + "learning_rate": 2.457194123407454e-06, + "loss": 1.1017, + "step": 17271 + }, + { + "epoch": 0.52, + "learning_rate": 2.456950239321563e-06, + "loss": 1.0195, + "step": 17272 + }, + { + "epoch": 0.52, + "learning_rate": 2.456706355645485e-06, + "loss": 1.0494, + "step": 17273 + }, + { + "epoch": 0.52, + "learning_rate": 2.4564624723815413e-06, + "loss": 1.1647, + "step": 17274 + }, + { + "epoch": 0.52, + "learning_rate": 2.456218589532054e-06, + "loss": 1.0327, + "step": 17275 + }, + { + "epoch": 0.52, + "learning_rate": 2.4559747070993452e-06, + "loss": 1.1293, + "step": 17276 + }, + { + "epoch": 0.52, + "learning_rate": 2.4557308250857354e-06, + "loss": 1.0715, + "step": 17277 + }, + { + "epoch": 0.52, + "learning_rate": 2.455486943493547e-06, + "loss": 1.1666, + "step": 17278 + }, + { + "epoch": 0.52, + "learning_rate": 2.455243062325101e-06, + "loss": 1.2682, + "step": 17279 + }, + { + "epoch": 0.52, + "learning_rate": 2.4549991815827202e-06, + "loss": 0.981, + "step": 17280 + }, + { + "epoch": 0.52, + "learning_rate": 2.454755301268725e-06, + "loss": 1.215, + "step": 17281 + }, + { + "epoch": 0.52, + "learning_rate": 2.4545114213854375e-06, + "loss": 1.1117, + "step": 17282 + }, + { + "epoch": 0.52, + "learning_rate": 2.4542675419351797e-06, + "loss": 1.1492, + "step": 17283 + }, + { + "epoch": 0.52, + "learning_rate": 2.4540236629202736e-06, + "loss": 1.1343, + "step": 17284 + }, + { + "epoch": 0.52, + "learning_rate": 2.453779784343039e-06, + "loss": 1.1115, + "step": 17285 + }, + { + "epoch": 0.52, + "learning_rate": 2.453535906205799e-06, + "loss": 0.9579, + "step": 17286 + }, + { + "epoch": 0.52, + "learning_rate": 2.4532920285108745e-06, + "loss": 1.1698, + "step": 17287 + }, + { + "epoch": 0.52, + "learning_rate": 2.4530481512605883e-06, + "loss": 1.1707, + "step": 17288 + }, + { + "epoch": 0.52, + "learning_rate": 2.45280427445726e-06, + "loss": 1.0921, + "step": 17289 + }, + { + "epoch": 0.52, + "learning_rate": 2.4525603981032124e-06, + "loss": 1.1096, + "step": 17290 + }, + { + "epoch": 0.52, + "learning_rate": 2.4523165222007674e-06, + "loss": 1.1598, + "step": 17291 + }, + { + "epoch": 0.52, + "learning_rate": 2.4520726467522456e-06, + "loss": 1.0413, + "step": 17292 + }, + { + "epoch": 0.52, + "learning_rate": 2.4518287717599697e-06, + "loss": 1.0361, + "step": 17293 + }, + { + "epoch": 0.52, + "learning_rate": 2.4515848972262604e-06, + "loss": 1.0422, + "step": 17294 + }, + { + "epoch": 0.52, + "learning_rate": 2.451341023153439e-06, + "loss": 1.1021, + "step": 17295 + }, + { + "epoch": 0.52, + "learning_rate": 2.451097149543829e-06, + "loss": 1.1716, + "step": 17296 + }, + { + "epoch": 0.52, + "learning_rate": 2.45085327639975e-06, + "loss": 1.0779, + "step": 17297 + }, + { + "epoch": 0.52, + "learning_rate": 2.450609403723524e-06, + "loss": 1.1238, + "step": 17298 + }, + { + "epoch": 0.52, + "learning_rate": 2.450365531517472e-06, + "loss": 1.0933, + "step": 17299 + }, + { + "epoch": 0.52, + "learning_rate": 2.450121659783917e-06, + "loss": 1.1801, + "step": 17300 + }, + { + "epoch": 0.52, + "learning_rate": 2.4498777885251807e-06, + "loss": 1.0212, + "step": 17301 + }, + { + "epoch": 0.52, + "learning_rate": 2.449633917743582e-06, + "loss": 1.1025, + "step": 17302 + }, + { + "epoch": 0.52, + "learning_rate": 2.449390047441445e-06, + "loss": 1.077, + "step": 17303 + }, + { + "epoch": 0.52, + "learning_rate": 2.44914617762109e-06, + "loss": 1.1026, + "step": 17304 + }, + { + "epoch": 0.52, + "learning_rate": 2.448902308284839e-06, + "loss": 1.1251, + "step": 17305 + }, + { + "epoch": 0.52, + "learning_rate": 2.4486584394350137e-06, + "loss": 1.2401, + "step": 17306 + }, + { + "epoch": 0.52, + "learning_rate": 2.4484145710739356e-06, + "loss": 1.1471, + "step": 17307 + }, + { + "epoch": 0.52, + "learning_rate": 2.4481707032039256e-06, + "loss": 1.0778, + "step": 17308 + }, + { + "epoch": 0.52, + "learning_rate": 2.4479268358273046e-06, + "loss": 1.1616, + "step": 17309 + }, + { + "epoch": 0.52, + "learning_rate": 2.4476829689463966e-06, + "loss": 1.155, + "step": 17310 + }, + { + "epoch": 0.52, + "learning_rate": 2.4474391025635207e-06, + "loss": 1.1069, + "step": 17311 + }, + { + "epoch": 0.52, + "learning_rate": 2.447195236680999e-06, + "loss": 1.0345, + "step": 17312 + }, + { + "epoch": 0.52, + "learning_rate": 2.446951371301153e-06, + "loss": 1.29, + "step": 17313 + }, + { + "epoch": 0.52, + "learning_rate": 2.4467075064263063e-06, + "loss": 1.086, + "step": 17314 + }, + { + "epoch": 0.52, + "learning_rate": 2.4464636420587767e-06, + "loss": 1.0287, + "step": 17315 + }, + { + "epoch": 0.52, + "learning_rate": 2.4462197782008878e-06, + "loss": 1.1522, + "step": 17316 + }, + { + "epoch": 0.52, + "learning_rate": 2.4459759148549604e-06, + "loss": 1.1884, + "step": 17317 + }, + { + "epoch": 0.52, + "learning_rate": 2.4457320520233166e-06, + "loss": 1.2281, + "step": 17318 + }, + { + "epoch": 0.52, + "learning_rate": 2.4454881897082787e-06, + "loss": 1.087, + "step": 17319 + }, + { + "epoch": 0.52, + "learning_rate": 2.4452443279121654e-06, + "loss": 1.066, + "step": 17320 + }, + { + "epoch": 0.52, + "learning_rate": 2.4450004666373e-06, + "loss": 1.161, + "step": 17321 + }, + { + "epoch": 0.52, + "learning_rate": 2.4447566058860036e-06, + "loss": 1.0445, + "step": 17322 + }, + { + "epoch": 0.52, + "learning_rate": 2.444512745660598e-06, + "loss": 1.1464, + "step": 17323 + }, + { + "epoch": 0.52, + "learning_rate": 2.4442688859634044e-06, + "loss": 1.099, + "step": 17324 + }, + { + "epoch": 0.52, + "learning_rate": 2.444025026796744e-06, + "loss": 1.163, + "step": 17325 + }, + { + "epoch": 0.52, + "learning_rate": 2.443781168162938e-06, + "loss": 1.2062, + "step": 17326 + }, + { + "epoch": 0.52, + "learning_rate": 2.4435373100643097e-06, + "loss": 1.2445, + "step": 17327 + }, + { + "epoch": 0.52, + "learning_rate": 2.4432934525031777e-06, + "loss": 1.1158, + "step": 17328 + }, + { + "epoch": 0.52, + "learning_rate": 2.443049595481865e-06, + "loss": 1.1733, + "step": 17329 + }, + { + "epoch": 0.52, + "learning_rate": 2.4428057390026926e-06, + "loss": 1.0903, + "step": 17330 + }, + { + "epoch": 0.52, + "learning_rate": 2.4425618830679816e-06, + "loss": 1.1792, + "step": 17331 + }, + { + "epoch": 0.52, + "learning_rate": 2.4423180276800554e-06, + "loss": 1.0982, + "step": 17332 + }, + { + "epoch": 0.52, + "learning_rate": 2.4420741728412327e-06, + "loss": 1.0741, + "step": 17333 + }, + { + "epoch": 0.52, + "learning_rate": 2.4418303185538356e-06, + "loss": 1.0466, + "step": 17334 + }, + { + "epoch": 0.52, + "learning_rate": 2.441586464820186e-06, + "loss": 1.0801, + "step": 17335 + }, + { + "epoch": 0.52, + "learning_rate": 2.4413426116426057e-06, + "loss": 1.1616, + "step": 17336 + }, + { + "epoch": 0.52, + "learning_rate": 2.441098759023415e-06, + "loss": 1.095, + "step": 17337 + }, + { + "epoch": 0.52, + "learning_rate": 2.4408549069649356e-06, + "loss": 1.111, + "step": 17338 + }, + { + "epoch": 0.52, + "learning_rate": 2.440611055469489e-06, + "loss": 1.1277, + "step": 17339 + }, + { + "epoch": 0.52, + "learning_rate": 2.440367204539398e-06, + "loss": 1.0405, + "step": 17340 + }, + { + "epoch": 0.52, + "learning_rate": 2.440123354176981e-06, + "loss": 1.0635, + "step": 17341 + }, + { + "epoch": 0.52, + "learning_rate": 2.439879504384561e-06, + "loss": 1.1838, + "step": 17342 + }, + { + "epoch": 0.52, + "learning_rate": 2.4396356551644592e-06, + "loss": 1.0938, + "step": 17343 + }, + { + "epoch": 0.52, + "learning_rate": 2.439391806518997e-06, + "loss": 1.1682, + "step": 17344 + }, + { + "epoch": 0.52, + "learning_rate": 2.4391479584504964e-06, + "loss": 1.1335, + "step": 17345 + }, + { + "epoch": 0.52, + "learning_rate": 2.4389041109612773e-06, + "loss": 1.1032, + "step": 17346 + }, + { + "epoch": 0.52, + "learning_rate": 2.438660264053661e-06, + "loss": 1.2231, + "step": 17347 + }, + { + "epoch": 0.52, + "learning_rate": 2.43841641772997e-06, + "loss": 1.0873, + "step": 17348 + }, + { + "epoch": 0.52, + "learning_rate": 2.438172571992525e-06, + "loss": 1.1074, + "step": 17349 + }, + { + "epoch": 0.52, + "learning_rate": 2.4379287268436476e-06, + "loss": 1.1044, + "step": 17350 + }, + { + "epoch": 0.52, + "learning_rate": 2.4376848822856584e-06, + "loss": 1.1715, + "step": 17351 + }, + { + "epoch": 0.52, + "learning_rate": 2.4374410383208787e-06, + "loss": 1.1509, + "step": 17352 + }, + { + "epoch": 0.52, + "learning_rate": 2.4371971949516317e-06, + "loss": 1.0618, + "step": 17353 + }, + { + "epoch": 0.52, + "learning_rate": 2.4369533521802362e-06, + "loss": 1.102, + "step": 17354 + }, + { + "epoch": 0.52, + "learning_rate": 2.4367095100090144e-06, + "loss": 1.1424, + "step": 17355 + }, + { + "epoch": 0.52, + "learning_rate": 2.436465668440287e-06, + "loss": 1.1508, + "step": 17356 + }, + { + "epoch": 0.52, + "learning_rate": 2.4362218274763766e-06, + "loss": 1.1642, + "step": 17357 + }, + { + "epoch": 0.52, + "learning_rate": 2.4359779871196044e-06, + "loss": 1.0804, + "step": 17358 + }, + { + "epoch": 0.52, + "learning_rate": 2.4357341473722897e-06, + "loss": 1.0837, + "step": 17359 + }, + { + "epoch": 0.52, + "learning_rate": 2.4354903082367552e-06, + "loss": 1.1935, + "step": 17360 + }, + { + "epoch": 0.52, + "learning_rate": 2.4352464697153218e-06, + "loss": 1.0364, + "step": 17361 + }, + { + "epoch": 0.52, + "learning_rate": 2.4350026318103114e-06, + "loss": 1.2379, + "step": 17362 + }, + { + "epoch": 0.52, + "learning_rate": 2.4347587945240442e-06, + "loss": 1.0444, + "step": 17363 + }, + { + "epoch": 0.52, + "learning_rate": 2.4345149578588415e-06, + "loss": 1.2028, + "step": 17364 + }, + { + "epoch": 0.52, + "learning_rate": 2.4342711218170254e-06, + "loss": 1.1251, + "step": 17365 + }, + { + "epoch": 0.52, + "learning_rate": 2.434027286400917e-06, + "loss": 1.0898, + "step": 17366 + }, + { + "epoch": 0.52, + "learning_rate": 2.4337834516128365e-06, + "loss": 1.1364, + "step": 17367 + }, + { + "epoch": 0.52, + "learning_rate": 2.433539617455106e-06, + "loss": 1.0677, + "step": 17368 + }, + { + "epoch": 0.52, + "learning_rate": 2.4332957839300457e-06, + "loss": 1.1265, + "step": 17369 + }, + { + "epoch": 0.52, + "learning_rate": 2.4330519510399773e-06, + "loss": 1.1703, + "step": 17370 + }, + { + "epoch": 0.52, + "learning_rate": 2.4328081187872234e-06, + "loss": 1.0226, + "step": 17371 + }, + { + "epoch": 0.52, + "learning_rate": 2.432564287174103e-06, + "loss": 1.0934, + "step": 17372 + }, + { + "epoch": 0.52, + "learning_rate": 2.4323204562029377e-06, + "loss": 1.1418, + "step": 17373 + }, + { + "epoch": 0.52, + "learning_rate": 2.4320766258760495e-06, + "loss": 0.9184, + "step": 17374 + }, + { + "epoch": 0.52, + "learning_rate": 2.4318327961957596e-06, + "loss": 1.0257, + "step": 17375 + }, + { + "epoch": 0.52, + "learning_rate": 2.4315889671643875e-06, + "loss": 1.063, + "step": 17376 + }, + { + "epoch": 0.52, + "learning_rate": 2.431345138784256e-06, + "loss": 1.0997, + "step": 17377 + }, + { + "epoch": 0.52, + "learning_rate": 2.4311013110576856e-06, + "loss": 1.1418, + "step": 17378 + }, + { + "epoch": 0.52, + "learning_rate": 2.4308574839869987e-06, + "loss": 1.1218, + "step": 17379 + }, + { + "epoch": 0.52, + "learning_rate": 2.430613657574514e-06, + "loss": 1.0237, + "step": 17380 + }, + { + "epoch": 0.52, + "learning_rate": 2.430369831822554e-06, + "loss": 1.2993, + "step": 17381 + }, + { + "epoch": 0.52, + "learning_rate": 2.4301260067334394e-06, + "loss": 1.1178, + "step": 17382 + }, + { + "epoch": 0.52, + "learning_rate": 2.429882182309492e-06, + "loss": 1.1428, + "step": 17383 + }, + { + "epoch": 0.52, + "learning_rate": 2.4296383585530333e-06, + "loss": 1.0132, + "step": 17384 + }, + { + "epoch": 0.52, + "learning_rate": 2.4293945354663824e-06, + "loss": 1.2723, + "step": 17385 + }, + { + "epoch": 0.52, + "learning_rate": 2.4291507130518615e-06, + "loss": 1.0999, + "step": 17386 + }, + { + "epoch": 0.52, + "learning_rate": 2.428906891311792e-06, + "loss": 1.1902, + "step": 17387 + }, + { + "epoch": 0.52, + "learning_rate": 2.428663070248495e-06, + "loss": 1.1511, + "step": 17388 + }, + { + "epoch": 0.52, + "learning_rate": 2.4284192498642906e-06, + "loss": 1.0613, + "step": 17389 + }, + { + "epoch": 0.52, + "learning_rate": 2.428175430161501e-06, + "loss": 1.0453, + "step": 17390 + }, + { + "epoch": 0.52, + "learning_rate": 2.4279316111424465e-06, + "loss": 1.0773, + "step": 17391 + }, + { + "epoch": 0.52, + "learning_rate": 2.4276877928094482e-06, + "loss": 1.1039, + "step": 17392 + }, + { + "epoch": 0.52, + "learning_rate": 2.4274439751648273e-06, + "loss": 1.1191, + "step": 17393 + }, + { + "epoch": 0.52, + "learning_rate": 2.4272001582109046e-06, + "loss": 1.1356, + "step": 17394 + }, + { + "epoch": 0.52, + "learning_rate": 2.426956341950002e-06, + "loss": 1.2911, + "step": 17395 + }, + { + "epoch": 0.52, + "learning_rate": 2.426712526384439e-06, + "loss": 1.1956, + "step": 17396 + }, + { + "epoch": 0.52, + "learning_rate": 2.4264687115165386e-06, + "loss": 1.1131, + "step": 17397 + }, + { + "epoch": 0.52, + "learning_rate": 2.42622489734862e-06, + "loss": 1.1111, + "step": 17398 + }, + { + "epoch": 0.52, + "learning_rate": 2.4259810838830046e-06, + "loss": 1.1431, + "step": 17399 + }, + { + "epoch": 0.52, + "learning_rate": 2.4257372711220135e-06, + "loss": 1.0328, + "step": 17400 + }, + { + "epoch": 0.52, + "learning_rate": 2.425493459067969e-06, + "loss": 1.2417, + "step": 17401 + }, + { + "epoch": 0.52, + "learning_rate": 2.42524964772319e-06, + "loss": 1.1766, + "step": 17402 + }, + { + "epoch": 0.52, + "learning_rate": 2.425005837089998e-06, + "loss": 1.1356, + "step": 17403 + }, + { + "epoch": 0.52, + "learning_rate": 2.4247620271707145e-06, + "loss": 1.0797, + "step": 17404 + }, + { + "epoch": 0.52, + "learning_rate": 2.424518217967661e-06, + "loss": 1.16, + "step": 17405 + }, + { + "epoch": 0.52, + "learning_rate": 2.424274409483157e-06, + "loss": 1.1111, + "step": 17406 + }, + { + "epoch": 0.52, + "learning_rate": 2.4240306017195244e-06, + "loss": 1.0643, + "step": 17407 + }, + { + "epoch": 0.52, + "learning_rate": 2.4237867946790834e-06, + "loss": 1.1038, + "step": 17408 + }, + { + "epoch": 0.52, + "learning_rate": 2.423542988364156e-06, + "loss": 1.075, + "step": 17409 + }, + { + "epoch": 0.52, + "learning_rate": 2.423299182777063e-06, + "loss": 1.0884, + "step": 17410 + }, + { + "epoch": 0.52, + "learning_rate": 2.423055377920124e-06, + "loss": 1.1324, + "step": 17411 + }, + { + "epoch": 0.52, + "learning_rate": 2.4228115737956607e-06, + "loss": 1.1776, + "step": 17412 + }, + { + "epoch": 0.52, + "learning_rate": 2.422567770405994e-06, + "loss": 1.1614, + "step": 17413 + }, + { + "epoch": 0.52, + "learning_rate": 2.422323967753446e-06, + "loss": 1.1707, + "step": 17414 + }, + { + "epoch": 0.52, + "learning_rate": 2.4220801658403355e-06, + "loss": 1.0814, + "step": 17415 + }, + { + "epoch": 0.52, + "learning_rate": 2.4218363646689837e-06, + "loss": 1.1228, + "step": 17416 + }, + { + "epoch": 0.52, + "learning_rate": 2.4215925642417127e-06, + "loss": 1.2969, + "step": 17417 + }, + { + "epoch": 0.52, + "learning_rate": 2.421348764560843e-06, + "loss": 1.1642, + "step": 17418 + }, + { + "epoch": 0.52, + "learning_rate": 2.4211049656286946e-06, + "loss": 1.17, + "step": 17419 + }, + { + "epoch": 0.52, + "learning_rate": 2.420861167447589e-06, + "loss": 1.1615, + "step": 17420 + }, + { + "epoch": 0.52, + "learning_rate": 2.420617370019847e-06, + "loss": 1.147, + "step": 17421 + }, + { + "epoch": 0.52, + "learning_rate": 2.4203735733477895e-06, + "loss": 1.0044, + "step": 17422 + }, + { + "epoch": 0.52, + "learning_rate": 2.4201297774337383e-06, + "loss": 1.1688, + "step": 17423 + }, + { + "epoch": 0.52, + "learning_rate": 2.419885982280012e-06, + "loss": 1.1048, + "step": 17424 + }, + { + "epoch": 0.52, + "learning_rate": 2.4196421878889326e-06, + "loss": 1.0852, + "step": 17425 + }, + { + "epoch": 0.52, + "learning_rate": 2.4193983942628207e-06, + "loss": 1.1484, + "step": 17426 + }, + { + "epoch": 0.52, + "learning_rate": 2.4191546014039983e-06, + "loss": 1.0784, + "step": 17427 + }, + { + "epoch": 0.53, + "learning_rate": 2.4189108093147845e-06, + "loss": 1.1846, + "step": 17428 + }, + { + "epoch": 0.53, + "learning_rate": 2.4186670179975006e-06, + "loss": 1.0857, + "step": 17429 + }, + { + "epoch": 0.53, + "learning_rate": 2.418423227454467e-06, + "loss": 1.143, + "step": 17430 + }, + { + "epoch": 0.53, + "learning_rate": 2.418179437688006e-06, + "loss": 1.1942, + "step": 17431 + }, + { + "epoch": 0.53, + "learning_rate": 2.417935648700437e-06, + "loss": 1.0575, + "step": 17432 + }, + { + "epoch": 0.53, + "learning_rate": 2.417691860494081e-06, + "loss": 1.0748, + "step": 17433 + }, + { + "epoch": 0.53, + "learning_rate": 2.4174480730712585e-06, + "loss": 1.1414, + "step": 17434 + }, + { + "epoch": 0.53, + "learning_rate": 2.4172042864342907e-06, + "loss": 1.1329, + "step": 17435 + }, + { + "epoch": 0.53, + "learning_rate": 2.4169605005854994e-06, + "loss": 1.1841, + "step": 17436 + }, + { + "epoch": 0.53, + "learning_rate": 2.4167167155272033e-06, + "loss": 1.1453, + "step": 17437 + }, + { + "epoch": 0.53, + "learning_rate": 2.4164729312617237e-06, + "loss": 1.1033, + "step": 17438 + }, + { + "epoch": 0.53, + "learning_rate": 2.4162291477913814e-06, + "loss": 1.1855, + "step": 17439 + }, + { + "epoch": 0.53, + "learning_rate": 2.415985365118498e-06, + "loss": 1.0881, + "step": 17440 + }, + { + "epoch": 0.53, + "learning_rate": 2.4157415832453933e-06, + "loss": 1.1017, + "step": 17441 + }, + { + "epoch": 0.53, + "learning_rate": 2.415497802174388e-06, + "loss": 1.1093, + "step": 17442 + }, + { + "epoch": 0.53, + "learning_rate": 2.4152540219078024e-06, + "loss": 1.0181, + "step": 17443 + }, + { + "epoch": 0.53, + "learning_rate": 2.4150102424479583e-06, + "loss": 1.0013, + "step": 17444 + }, + { + "epoch": 0.53, + "learning_rate": 2.414766463797176e-06, + "loss": 1.0403, + "step": 17445 + }, + { + "epoch": 0.53, + "learning_rate": 2.414522685957775e-06, + "loss": 1.0927, + "step": 17446 + }, + { + "epoch": 0.53, + "learning_rate": 2.4142789089320772e-06, + "loss": 1.0462, + "step": 17447 + }, + { + "epoch": 0.53, + "learning_rate": 2.414035132722403e-06, + "loss": 1.1883, + "step": 17448 + }, + { + "epoch": 0.53, + "learning_rate": 2.413791357331074e-06, + "loss": 1.1961, + "step": 17449 + }, + { + "epoch": 0.53, + "learning_rate": 2.413547582760408e-06, + "loss": 1.1718, + "step": 17450 + }, + { + "epoch": 0.53, + "learning_rate": 2.4133038090127284e-06, + "loss": 1.0242, + "step": 17451 + }, + { + "epoch": 0.53, + "learning_rate": 2.413060036090354e-06, + "loss": 1.0992, + "step": 17452 + }, + { + "epoch": 0.53, + "learning_rate": 2.412816263995608e-06, + "loss": 1.1988, + "step": 17453 + }, + { + "epoch": 0.53, + "learning_rate": 2.4125724927308075e-06, + "loss": 1.0688, + "step": 17454 + }, + { + "epoch": 0.53, + "learning_rate": 2.412328722298275e-06, + "loss": 1.144, + "step": 17455 + }, + { + "epoch": 0.53, + "learning_rate": 2.412084952700331e-06, + "loss": 1.0884, + "step": 17456 + }, + { + "epoch": 0.53, + "learning_rate": 2.411841183939296e-06, + "loss": 1.046, + "step": 17457 + }, + { + "epoch": 0.53, + "learning_rate": 2.4115974160174902e-06, + "loss": 1.2361, + "step": 17458 + }, + { + "epoch": 0.53, + "learning_rate": 2.4113536489372347e-06, + "loss": 1.0396, + "step": 17459 + }, + { + "epoch": 0.53, + "learning_rate": 2.4111098827008496e-06, + "loss": 1.1365, + "step": 17460 + }, + { + "epoch": 0.53, + "learning_rate": 2.4108661173106556e-06, + "loss": 1.085, + "step": 17461 + }, + { + "epoch": 0.53, + "learning_rate": 2.410622352768974e-06, + "loss": 1.1463, + "step": 17462 + }, + { + "epoch": 0.53, + "learning_rate": 2.4103785890781235e-06, + "loss": 1.1874, + "step": 17463 + }, + { + "epoch": 0.53, + "learning_rate": 2.410134826240426e-06, + "loss": 1.2095, + "step": 17464 + }, + { + "epoch": 0.53, + "learning_rate": 2.4098910642582012e-06, + "loss": 1.1809, + "step": 17465 + }, + { + "epoch": 0.53, + "learning_rate": 2.409647303133772e-06, + "loss": 1.0571, + "step": 17466 + }, + { + "epoch": 0.53, + "learning_rate": 2.4094035428694553e-06, + "loss": 1.3047, + "step": 17467 + }, + { + "epoch": 0.53, + "learning_rate": 2.4091597834675733e-06, + "loss": 1.0571, + "step": 17468 + }, + { + "epoch": 0.53, + "learning_rate": 2.4089160249304462e-06, + "loss": 1.1541, + "step": 17469 + }, + { + "epoch": 0.53, + "learning_rate": 2.4086722672603955e-06, + "loss": 1.1536, + "step": 17470 + }, + { + "epoch": 0.53, + "learning_rate": 2.4084285104597402e-06, + "loss": 1.0436, + "step": 17471 + }, + { + "epoch": 0.53, + "learning_rate": 2.4081847545308017e-06, + "loss": 1.0541, + "step": 17472 + }, + { + "epoch": 0.53, + "learning_rate": 2.4079409994759e-06, + "loss": 1.1071, + "step": 17473 + }, + { + "epoch": 0.53, + "learning_rate": 2.407697245297356e-06, + "loss": 1.098, + "step": 17474 + }, + { + "epoch": 0.53, + "learning_rate": 2.407453491997489e-06, + "loss": 1.1298, + "step": 17475 + }, + { + "epoch": 0.53, + "learning_rate": 2.4072097395786208e-06, + "loss": 1.0653, + "step": 17476 + }, + { + "epoch": 0.53, + "learning_rate": 2.4069659880430702e-06, + "loss": 1.0365, + "step": 17477 + }, + { + "epoch": 0.53, + "learning_rate": 2.4067222373931595e-06, + "loss": 1.1666, + "step": 17478 + }, + { + "epoch": 0.53, + "learning_rate": 2.4064784876312087e-06, + "loss": 1.1037, + "step": 17479 + }, + { + "epoch": 0.53, + "learning_rate": 2.406234738759537e-06, + "loss": 1.2514, + "step": 17480 + }, + { + "epoch": 0.53, + "learning_rate": 2.4059909907804655e-06, + "loss": 1.1107, + "step": 17481 + }, + { + "epoch": 0.53, + "learning_rate": 2.405747243696314e-06, + "loss": 1.1612, + "step": 17482 + }, + { + "epoch": 0.53, + "learning_rate": 2.4055034975094047e-06, + "loss": 1.1406, + "step": 17483 + }, + { + "epoch": 0.53, + "learning_rate": 2.4052597522220554e-06, + "loss": 1.1508, + "step": 17484 + }, + { + "epoch": 0.53, + "learning_rate": 2.4050160078365878e-06, + "loss": 1.03, + "step": 17485 + }, + { + "epoch": 0.53, + "learning_rate": 2.404772264355322e-06, + "loss": 1.3003, + "step": 17486 + }, + { + "epoch": 0.53, + "learning_rate": 2.404528521780579e-06, + "loss": 1.2161, + "step": 17487 + }, + { + "epoch": 0.53, + "learning_rate": 2.4042847801146775e-06, + "loss": 1.1579, + "step": 17488 + }, + { + "epoch": 0.53, + "learning_rate": 2.404041039359939e-06, + "loss": 1.1448, + "step": 17489 + }, + { + "epoch": 0.53, + "learning_rate": 2.403797299518684e-06, + "loss": 1.137, + "step": 17490 + }, + { + "epoch": 0.53, + "learning_rate": 2.403553560593232e-06, + "loss": 1.1056, + "step": 17491 + }, + { + "epoch": 0.53, + "learning_rate": 2.403309822585905e-06, + "loss": 1.149, + "step": 17492 + }, + { + "epoch": 0.53, + "learning_rate": 2.4030660854990206e-06, + "loss": 1.185, + "step": 17493 + }, + { + "epoch": 0.53, + "learning_rate": 2.4028223493349005e-06, + "loss": 1.1241, + "step": 17494 + }, + { + "epoch": 0.53, + "learning_rate": 2.402578614095865e-06, + "loss": 1.1036, + "step": 17495 + }, + { + "epoch": 0.53, + "learning_rate": 2.402334879784235e-06, + "loss": 1.1577, + "step": 17496 + }, + { + "epoch": 0.53, + "learning_rate": 2.4020911464023285e-06, + "loss": 1.1218, + "step": 17497 + }, + { + "epoch": 0.53, + "learning_rate": 2.4018474139524678e-06, + "loss": 1.1126, + "step": 17498 + }, + { + "epoch": 0.53, + "learning_rate": 2.401603682436972e-06, + "loss": 1.1157, + "step": 17499 + }, + { + "epoch": 0.53, + "learning_rate": 2.4013599518581626e-06, + "loss": 1.1514, + "step": 17500 + }, + { + "epoch": 0.53, + "learning_rate": 2.4011162222183583e-06, + "loss": 1.0945, + "step": 17501 + }, + { + "epoch": 0.53, + "learning_rate": 2.4008724935198794e-06, + "loss": 1.0563, + "step": 17502 + }, + { + "epoch": 0.53, + "learning_rate": 2.4006287657650473e-06, + "loss": 1.1799, + "step": 17503 + }, + { + "epoch": 0.53, + "learning_rate": 2.4003850389561813e-06, + "loss": 1.1461, + "step": 17504 + }, + { + "epoch": 0.53, + "learning_rate": 2.400141313095603e-06, + "loss": 1.2092, + "step": 17505 + }, + { + "epoch": 0.53, + "learning_rate": 2.39989758818563e-06, + "loss": 1.0872, + "step": 17506 + }, + { + "epoch": 0.53, + "learning_rate": 2.3996538642285837e-06, + "loss": 1.136, + "step": 17507 + }, + { + "epoch": 0.53, + "learning_rate": 2.3994101412267847e-06, + "loss": 1.097, + "step": 17508 + }, + { + "epoch": 0.53, + "learning_rate": 2.3991664191825535e-06, + "loss": 1.1231, + "step": 17509 + }, + { + "epoch": 0.53, + "learning_rate": 2.398922698098208e-06, + "loss": 1.187, + "step": 17510 + }, + { + "epoch": 0.53, + "learning_rate": 2.3986789779760702e-06, + "loss": 1.1123, + "step": 17511 + }, + { + "epoch": 0.53, + "learning_rate": 2.3984352588184595e-06, + "loss": 1.1597, + "step": 17512 + }, + { + "epoch": 0.53, + "learning_rate": 2.398191540627697e-06, + "loss": 1.0622, + "step": 17513 + }, + { + "epoch": 0.53, + "learning_rate": 2.3979478234061014e-06, + "loss": 1.0998, + "step": 17514 + }, + { + "epoch": 0.53, + "learning_rate": 2.397704107155993e-06, + "loss": 1.1529, + "step": 17515 + }, + { + "epoch": 0.53, + "learning_rate": 2.3974603918796928e-06, + "loss": 1.0825, + "step": 17516 + }, + { + "epoch": 0.53, + "learning_rate": 2.39721667757952e-06, + "loss": 1.2434, + "step": 17517 + }, + { + "epoch": 0.53, + "learning_rate": 2.396972964257796e-06, + "loss": 1.1719, + "step": 17518 + }, + { + "epoch": 0.53, + "learning_rate": 2.396729251916839e-06, + "loss": 1.3412, + "step": 17519 + }, + { + "epoch": 0.53, + "learning_rate": 2.3964855405589692e-06, + "loss": 1.101, + "step": 17520 + }, + { + "epoch": 0.53, + "learning_rate": 2.3962418301865073e-06, + "loss": 1.0184, + "step": 17521 + }, + { + "epoch": 0.53, + "learning_rate": 2.3959981208017747e-06, + "loss": 1.1516, + "step": 17522 + }, + { + "epoch": 0.53, + "learning_rate": 2.3957544124070885e-06, + "loss": 1.2139, + "step": 17523 + }, + { + "epoch": 0.53, + "learning_rate": 2.39551070500477e-06, + "loss": 1.0786, + "step": 17524 + }, + { + "epoch": 0.53, + "learning_rate": 2.3952669985971393e-06, + "loss": 1.2545, + "step": 17525 + }, + { + "epoch": 0.53, + "learning_rate": 2.395023293186517e-06, + "loss": 1.1326, + "step": 17526 + }, + { + "epoch": 0.53, + "learning_rate": 2.394779588775222e-06, + "loss": 1.0791, + "step": 17527 + }, + { + "epoch": 0.53, + "learning_rate": 2.3945358853655745e-06, + "loss": 1.117, + "step": 17528 + }, + { + "epoch": 0.53, + "learning_rate": 2.394292182959895e-06, + "loss": 1.194, + "step": 17529 + }, + { + "epoch": 0.53, + "learning_rate": 2.3940484815605023e-06, + "loss": 1.2418, + "step": 17530 + }, + { + "epoch": 0.53, + "learning_rate": 2.3938047811697184e-06, + "loss": 1.0992, + "step": 17531 + }, + { + "epoch": 0.53, + "learning_rate": 2.3935610817898608e-06, + "loss": 1.2571, + "step": 17532 + }, + { + "epoch": 0.53, + "learning_rate": 2.39331738342325e-06, + "loss": 1.1228, + "step": 17533 + }, + { + "epoch": 0.53, + "learning_rate": 2.393073686072207e-06, + "loss": 1.1677, + "step": 17534 + }, + { + "epoch": 0.53, + "learning_rate": 2.392829989739052e-06, + "loss": 1.1212, + "step": 17535 + }, + { + "epoch": 0.53, + "learning_rate": 2.3925862944261023e-06, + "loss": 1.1574, + "step": 17536 + }, + { + "epoch": 0.53, + "learning_rate": 2.3923426001356798e-06, + "loss": 1.1441, + "step": 17537 + }, + { + "epoch": 0.53, + "learning_rate": 2.3920989068701036e-06, + "loss": 1.1611, + "step": 17538 + }, + { + "epoch": 0.53, + "learning_rate": 2.3918552146316946e-06, + "loss": 1.1274, + "step": 17539 + }, + { + "epoch": 0.53, + "learning_rate": 2.391611523422771e-06, + "loss": 1.008, + "step": 17540 + }, + { + "epoch": 0.53, + "learning_rate": 2.391367833245654e-06, + "loss": 1.0817, + "step": 17541 + }, + { + "epoch": 0.53, + "learning_rate": 2.3911241441026627e-06, + "loss": 1.194, + "step": 17542 + }, + { + "epoch": 0.53, + "learning_rate": 2.3908804559961177e-06, + "loss": 1.1248, + "step": 17543 + }, + { + "epoch": 0.53, + "learning_rate": 2.390636768928338e-06, + "loss": 1.1419, + "step": 17544 + }, + { + "epoch": 0.53, + "learning_rate": 2.3903930829016434e-06, + "loss": 1.1488, + "step": 17545 + }, + { + "epoch": 0.53, + "learning_rate": 2.3901493979183537e-06, + "loss": 1.0516, + "step": 17546 + }, + { + "epoch": 0.53, + "learning_rate": 2.3899057139807884e-06, + "loss": 1.1107, + "step": 17547 + }, + { + "epoch": 0.53, + "learning_rate": 2.3896620310912693e-06, + "loss": 1.0805, + "step": 17548 + }, + { + "epoch": 0.53, + "learning_rate": 2.3894183492521133e-06, + "loss": 1.1737, + "step": 17549 + }, + { + "epoch": 0.53, + "learning_rate": 2.3891746684656415e-06, + "loss": 1.0006, + "step": 17550 + }, + { + "epoch": 0.53, + "learning_rate": 2.388930988734173e-06, + "loss": 1.2317, + "step": 17551 + }, + { + "epoch": 0.53, + "learning_rate": 2.388687310060029e-06, + "loss": 1.019, + "step": 17552 + }, + { + "epoch": 0.53, + "learning_rate": 2.3884436324455272e-06, + "loss": 1.2075, + "step": 17553 + }, + { + "epoch": 0.53, + "learning_rate": 2.3881999558929894e-06, + "loss": 1.0847, + "step": 17554 + }, + { + "epoch": 0.53, + "learning_rate": 2.387956280404733e-06, + "loss": 1.2036, + "step": 17555 + }, + { + "epoch": 0.53, + "learning_rate": 2.3877126059830795e-06, + "loss": 0.9817, + "step": 17556 + }, + { + "epoch": 0.53, + "learning_rate": 2.3874689326303483e-06, + "loss": 1.1559, + "step": 17557 + }, + { + "epoch": 0.53, + "learning_rate": 2.387225260348858e-06, + "loss": 1.0738, + "step": 17558 + }, + { + "epoch": 0.53, + "learning_rate": 2.3869815891409287e-06, + "loss": 1.0724, + "step": 17559 + }, + { + "epoch": 0.53, + "learning_rate": 2.3867379190088803e-06, + "loss": 1.1315, + "step": 17560 + }, + { + "epoch": 0.53, + "learning_rate": 2.386494249955034e-06, + "loss": 1.1295, + "step": 17561 + }, + { + "epoch": 0.53, + "learning_rate": 2.3862505819817062e-06, + "loss": 1.203, + "step": 17562 + }, + { + "epoch": 0.53, + "learning_rate": 2.386006915091218e-06, + "loss": 1.1284, + "step": 17563 + }, + { + "epoch": 0.53, + "learning_rate": 2.3857632492858894e-06, + "loss": 1.0862, + "step": 17564 + }, + { + "epoch": 0.53, + "learning_rate": 2.3855195845680404e-06, + "loss": 1.1348, + "step": 17565 + }, + { + "epoch": 0.53, + "learning_rate": 2.385275920939989e-06, + "loss": 1.0286, + "step": 17566 + }, + { + "epoch": 0.53, + "learning_rate": 2.3850322584040554e-06, + "loss": 1.029, + "step": 17567 + }, + { + "epoch": 0.53, + "learning_rate": 2.384788596962559e-06, + "loss": 1.2325, + "step": 17568 + }, + { + "epoch": 0.53, + "learning_rate": 2.38454493661782e-06, + "loss": 1.0407, + "step": 17569 + }, + { + "epoch": 0.53, + "learning_rate": 2.3843012773721584e-06, + "loss": 1.1835, + "step": 17570 + }, + { + "epoch": 0.53, + "learning_rate": 2.3840576192278924e-06, + "loss": 1.0495, + "step": 17571 + }, + { + "epoch": 0.53, + "learning_rate": 2.3838139621873416e-06, + "loss": 1.0914, + "step": 17572 + }, + { + "epoch": 0.53, + "learning_rate": 2.383570306252826e-06, + "loss": 1.1352, + "step": 17573 + }, + { + "epoch": 0.53, + "learning_rate": 2.3833266514266665e-06, + "loss": 1.0275, + "step": 17574 + }, + { + "epoch": 0.53, + "learning_rate": 2.3830829977111796e-06, + "loss": 1.2062, + "step": 17575 + }, + { + "epoch": 0.53, + "learning_rate": 2.3828393451086864e-06, + "loss": 1.1512, + "step": 17576 + }, + { + "epoch": 0.53, + "learning_rate": 2.3825956936215064e-06, + "loss": 1.1555, + "step": 17577 + }, + { + "epoch": 0.53, + "learning_rate": 2.3823520432519593e-06, + "loss": 1.1034, + "step": 17578 + }, + { + "epoch": 0.53, + "learning_rate": 2.382108394002364e-06, + "loss": 0.9765, + "step": 17579 + }, + { + "epoch": 0.53, + "learning_rate": 2.381864745875039e-06, + "loss": 1.2057, + "step": 17580 + }, + { + "epoch": 0.53, + "learning_rate": 2.3816210988723053e-06, + "loss": 1.0067, + "step": 17581 + }, + { + "epoch": 0.53, + "learning_rate": 2.381377452996482e-06, + "loss": 1.0598, + "step": 17582 + }, + { + "epoch": 0.53, + "learning_rate": 2.381133808249888e-06, + "loss": 1.1963, + "step": 17583 + }, + { + "epoch": 0.53, + "learning_rate": 2.3808901646348426e-06, + "loss": 1.1419, + "step": 17584 + }, + { + "epoch": 0.53, + "learning_rate": 2.3806465221536654e-06, + "loss": 1.1872, + "step": 17585 + }, + { + "epoch": 0.53, + "learning_rate": 2.3804028808086763e-06, + "loss": 1.175, + "step": 17586 + }, + { + "epoch": 0.53, + "learning_rate": 2.3801592406021947e-06, + "loss": 1.252, + "step": 17587 + }, + { + "epoch": 0.53, + "learning_rate": 2.3799156015365386e-06, + "loss": 1.1218, + "step": 17588 + }, + { + "epoch": 0.53, + "learning_rate": 2.379671963614028e-06, + "loss": 0.9729, + "step": 17589 + }, + { + "epoch": 0.53, + "learning_rate": 2.3794283268369826e-06, + "loss": 1.1866, + "step": 17590 + }, + { + "epoch": 0.53, + "learning_rate": 2.379184691207722e-06, + "loss": 1.1141, + "step": 17591 + }, + { + "epoch": 0.53, + "learning_rate": 2.378941056728565e-06, + "loss": 1.0474, + "step": 17592 + }, + { + "epoch": 0.53, + "learning_rate": 2.3786974234018297e-06, + "loss": 1.1773, + "step": 17593 + }, + { + "epoch": 0.53, + "learning_rate": 2.3784537912298373e-06, + "loss": 1.0433, + "step": 17594 + }, + { + "epoch": 0.53, + "learning_rate": 2.3782101602149058e-06, + "loss": 1.0385, + "step": 17595 + }, + { + "epoch": 0.53, + "learning_rate": 2.3779665303593553e-06, + "loss": 1.1609, + "step": 17596 + }, + { + "epoch": 0.53, + "learning_rate": 2.3777229016655045e-06, + "loss": 1.1738, + "step": 17597 + }, + { + "epoch": 0.53, + "learning_rate": 2.3774792741356728e-06, + "loss": 1.0848, + "step": 17598 + }, + { + "epoch": 0.53, + "learning_rate": 2.377235647772179e-06, + "loss": 1.1689, + "step": 17599 + }, + { + "epoch": 0.53, + "learning_rate": 2.376992022577344e-06, + "loss": 1.0599, + "step": 17600 + }, + { + "epoch": 0.53, + "learning_rate": 2.376748398553485e-06, + "loss": 1.1754, + "step": 17601 + }, + { + "epoch": 0.53, + "learning_rate": 2.3765047757029214e-06, + "loss": 1.1278, + "step": 17602 + }, + { + "epoch": 0.53, + "learning_rate": 2.376261154027973e-06, + "loss": 1.144, + "step": 17603 + }, + { + "epoch": 0.53, + "learning_rate": 2.37601753353096e-06, + "loss": 1.2076, + "step": 17604 + }, + { + "epoch": 0.53, + "learning_rate": 2.375773914214199e-06, + "loss": 1.1058, + "step": 17605 + }, + { + "epoch": 0.53, + "learning_rate": 2.375530296080011e-06, + "loss": 1.0732, + "step": 17606 + }, + { + "epoch": 0.53, + "learning_rate": 2.375286679130714e-06, + "loss": 1.1516, + "step": 17607 + }, + { + "epoch": 0.53, + "learning_rate": 2.3750430633686285e-06, + "loss": 1.0702, + "step": 17608 + }, + { + "epoch": 0.53, + "learning_rate": 2.3747994487960727e-06, + "loss": 1.0953, + "step": 17609 + }, + { + "epoch": 0.53, + "learning_rate": 2.3745558354153656e-06, + "loss": 1.2019, + "step": 17610 + }, + { + "epoch": 0.53, + "learning_rate": 2.3743122232288266e-06, + "loss": 1.1728, + "step": 17611 + }, + { + "epoch": 0.53, + "learning_rate": 2.3740686122387747e-06, + "loss": 1.2184, + "step": 17612 + }, + { + "epoch": 0.53, + "learning_rate": 2.3738250024475297e-06, + "loss": 1.1418, + "step": 17613 + }, + { + "epoch": 0.53, + "learning_rate": 2.3735813938574093e-06, + "loss": 1.1509, + "step": 17614 + }, + { + "epoch": 0.53, + "learning_rate": 2.373337786470733e-06, + "loss": 1.0472, + "step": 17615 + }, + { + "epoch": 0.53, + "learning_rate": 2.3730941802898198e-06, + "loss": 1.1208, + "step": 17616 + }, + { + "epoch": 0.53, + "learning_rate": 2.37285057531699e-06, + "loss": 1.0867, + "step": 17617 + }, + { + "epoch": 0.53, + "learning_rate": 2.372606971554561e-06, + "loss": 1.1816, + "step": 17618 + }, + { + "epoch": 0.53, + "learning_rate": 2.3723633690048513e-06, + "loss": 1.1145, + "step": 17619 + }, + { + "epoch": 0.53, + "learning_rate": 2.3721197676701817e-06, + "loss": 1.1307, + "step": 17620 + }, + { + "epoch": 0.53, + "learning_rate": 2.3718761675528696e-06, + "loss": 1.0723, + "step": 17621 + }, + { + "epoch": 0.53, + "learning_rate": 2.3716325686552353e-06, + "loss": 1.0707, + "step": 17622 + }, + { + "epoch": 0.53, + "learning_rate": 2.371388970979597e-06, + "loss": 1.1075, + "step": 17623 + }, + { + "epoch": 0.53, + "learning_rate": 2.371145374528274e-06, + "loss": 1.1747, + "step": 17624 + }, + { + "epoch": 0.53, + "learning_rate": 2.3709017793035845e-06, + "loss": 1.0797, + "step": 17625 + }, + { + "epoch": 0.53, + "learning_rate": 2.370658185307849e-06, + "loss": 1.1582, + "step": 17626 + }, + { + "epoch": 0.53, + "learning_rate": 2.370414592543384e-06, + "loss": 1.0795, + "step": 17627 + }, + { + "epoch": 0.53, + "learning_rate": 2.37017100101251e-06, + "loss": 1.1127, + "step": 17628 + }, + { + "epoch": 0.53, + "learning_rate": 2.3699274107175454e-06, + "loss": 1.0408, + "step": 17629 + }, + { + "epoch": 0.53, + "learning_rate": 2.3696838216608102e-06, + "loss": 1.2205, + "step": 17630 + }, + { + "epoch": 0.53, + "learning_rate": 2.3694402338446217e-06, + "loss": 1.2086, + "step": 17631 + }, + { + "epoch": 0.53, + "learning_rate": 2.3691966472712986e-06, + "loss": 1.1552, + "step": 17632 + }, + { + "epoch": 0.53, + "learning_rate": 2.368953061943161e-06, + "loss": 1.1519, + "step": 17633 + }, + { + "epoch": 0.53, + "learning_rate": 2.3687094778625267e-06, + "loss": 1.0887, + "step": 17634 + }, + { + "epoch": 0.53, + "learning_rate": 2.368465895031716e-06, + "loss": 1.033, + "step": 17635 + }, + { + "epoch": 0.53, + "learning_rate": 2.3682223134530457e-06, + "loss": 1.022, + "step": 17636 + }, + { + "epoch": 0.53, + "learning_rate": 2.3679787331288357e-06, + "loss": 1.1217, + "step": 17637 + }, + { + "epoch": 0.53, + "learning_rate": 2.3677351540614044e-06, + "loss": 1.142, + "step": 17638 + }, + { + "epoch": 0.53, + "learning_rate": 2.3674915762530716e-06, + "loss": 1.0801, + "step": 17639 + }, + { + "epoch": 0.53, + "learning_rate": 2.367247999706154e-06, + "loss": 1.1133, + "step": 17640 + }, + { + "epoch": 0.53, + "learning_rate": 2.3670044244229717e-06, + "loss": 1.0511, + "step": 17641 + }, + { + "epoch": 0.53, + "learning_rate": 2.3667608504058436e-06, + "loss": 1.1578, + "step": 17642 + }, + { + "epoch": 0.53, + "learning_rate": 2.3665172776570888e-06, + "loss": 1.2176, + "step": 17643 + }, + { + "epoch": 0.53, + "learning_rate": 2.366273706179024e-06, + "loss": 1.0876, + "step": 17644 + }, + { + "epoch": 0.53, + "learning_rate": 2.3660301359739698e-06, + "loss": 1.0469, + "step": 17645 + }, + { + "epoch": 0.53, + "learning_rate": 2.3657865670442434e-06, + "loss": 0.992, + "step": 17646 + }, + { + "epoch": 0.53, + "learning_rate": 2.3655429993921647e-06, + "loss": 1.1516, + "step": 17647 + }, + { + "epoch": 0.53, + "learning_rate": 2.365299433020053e-06, + "loss": 1.1237, + "step": 17648 + }, + { + "epoch": 0.53, + "learning_rate": 2.3650558679302244e-06, + "loss": 1.1763, + "step": 17649 + }, + { + "epoch": 0.53, + "learning_rate": 2.364812304124999e-06, + "loss": 1.0018, + "step": 17650 + }, + { + "epoch": 0.53, + "learning_rate": 2.3645687416066956e-06, + "loss": 1.0552, + "step": 17651 + }, + { + "epoch": 0.53, + "learning_rate": 2.364325180377633e-06, + "loss": 1.1616, + "step": 17652 + }, + { + "epoch": 0.53, + "learning_rate": 2.3640816204401287e-06, + "loss": 1.2418, + "step": 17653 + }, + { + "epoch": 0.53, + "learning_rate": 2.363838061796502e-06, + "loss": 1.2067, + "step": 17654 + }, + { + "epoch": 0.53, + "learning_rate": 2.363594504449071e-06, + "loss": 1.2664, + "step": 17655 + }, + { + "epoch": 0.53, + "learning_rate": 2.363350948400156e-06, + "loss": 1.209, + "step": 17656 + }, + { + "epoch": 0.53, + "learning_rate": 2.3631073936520734e-06, + "loss": 1.144, + "step": 17657 + }, + { + "epoch": 0.53, + "learning_rate": 2.3628638402071423e-06, + "loss": 1.1783, + "step": 17658 + }, + { + "epoch": 0.53, + "learning_rate": 2.3626202880676813e-06, + "loss": 1.1355, + "step": 17659 + }, + { + "epoch": 0.53, + "learning_rate": 2.3623767372360103e-06, + "loss": 1.2216, + "step": 17660 + }, + { + "epoch": 0.53, + "learning_rate": 2.3621331877144448e-06, + "loss": 1.1909, + "step": 17661 + }, + { + "epoch": 0.53, + "learning_rate": 2.3618896395053055e-06, + "loss": 1.1938, + "step": 17662 + }, + { + "epoch": 0.53, + "learning_rate": 2.36164609261091e-06, + "loss": 1.0986, + "step": 17663 + }, + { + "epoch": 0.53, + "learning_rate": 2.3614025470335776e-06, + "loss": 1.1959, + "step": 17664 + }, + { + "epoch": 0.53, + "learning_rate": 2.361159002775626e-06, + "loss": 1.0764, + "step": 17665 + }, + { + "epoch": 0.53, + "learning_rate": 2.3609154598393736e-06, + "loss": 1.0317, + "step": 17666 + }, + { + "epoch": 0.53, + "learning_rate": 2.360671918227139e-06, + "loss": 1.174, + "step": 17667 + }, + { + "epoch": 0.53, + "learning_rate": 2.360428377941241e-06, + "loss": 1.1969, + "step": 17668 + }, + { + "epoch": 0.53, + "learning_rate": 2.3601848389839983e-06, + "loss": 1.1725, + "step": 17669 + }, + { + "epoch": 0.53, + "learning_rate": 2.3599413013577277e-06, + "loss": 1.0941, + "step": 17670 + }, + { + "epoch": 0.53, + "learning_rate": 2.3596977650647483e-06, + "loss": 1.0359, + "step": 17671 + }, + { + "epoch": 0.53, + "learning_rate": 2.359454230107379e-06, + "loss": 1.1547, + "step": 17672 + }, + { + "epoch": 0.53, + "learning_rate": 2.3592106964879385e-06, + "loss": 1.2212, + "step": 17673 + }, + { + "epoch": 0.53, + "learning_rate": 2.3589671642087433e-06, + "loss": 1.0464, + "step": 17674 + }, + { + "epoch": 0.53, + "learning_rate": 2.3587236332721128e-06, + "loss": 1.1272, + "step": 17675 + }, + { + "epoch": 0.53, + "learning_rate": 2.358480103680365e-06, + "loss": 1.1438, + "step": 17676 + }, + { + "epoch": 0.53, + "learning_rate": 2.3582365754358187e-06, + "loss": 1.0723, + "step": 17677 + }, + { + "epoch": 0.53, + "learning_rate": 2.3579930485407927e-06, + "loss": 1.081, + "step": 17678 + }, + { + "epoch": 0.53, + "learning_rate": 2.3577495229976034e-06, + "loss": 1.0726, + "step": 17679 + }, + { + "epoch": 0.53, + "learning_rate": 2.3575059988085707e-06, + "loss": 1.132, + "step": 17680 + }, + { + "epoch": 0.53, + "learning_rate": 2.357262475976012e-06, + "loss": 1.2581, + "step": 17681 + }, + { + "epoch": 0.53, + "learning_rate": 2.357018954502247e-06, + "loss": 1.0742, + "step": 17682 + }, + { + "epoch": 0.53, + "learning_rate": 2.356775434389591e-06, + "loss": 1.1098, + "step": 17683 + }, + { + "epoch": 0.53, + "learning_rate": 2.3565319156403646e-06, + "loss": 1.0981, + "step": 17684 + }, + { + "epoch": 0.53, + "learning_rate": 2.356288398256885e-06, + "loss": 1.1154, + "step": 17685 + }, + { + "epoch": 0.53, + "learning_rate": 2.356044882241472e-06, + "loss": 1.0662, + "step": 17686 + }, + { + "epoch": 0.53, + "learning_rate": 2.3558013675964407e-06, + "loss": 1.1622, + "step": 17687 + }, + { + "epoch": 0.53, + "learning_rate": 2.3555578543241114e-06, + "loss": 1.0373, + "step": 17688 + }, + { + "epoch": 0.53, + "learning_rate": 2.355314342426802e-06, + "loss": 1.1486, + "step": 17689 + }, + { + "epoch": 0.53, + "learning_rate": 2.3550708319068295e-06, + "loss": 1.1667, + "step": 17690 + }, + { + "epoch": 0.53, + "learning_rate": 2.354827322766514e-06, + "loss": 1.0435, + "step": 17691 + }, + { + "epoch": 0.53, + "learning_rate": 2.354583815008172e-06, + "loss": 1.1771, + "step": 17692 + }, + { + "epoch": 0.53, + "learning_rate": 2.354340308634122e-06, + "loss": 1.2823, + "step": 17693 + }, + { + "epoch": 0.53, + "learning_rate": 2.354096803646682e-06, + "loss": 1.2742, + "step": 17694 + }, + { + "epoch": 0.53, + "learning_rate": 2.3538533000481712e-06, + "loss": 1.0568, + "step": 17695 + }, + { + "epoch": 0.53, + "learning_rate": 2.353609797840906e-06, + "loss": 1.0914, + "step": 17696 + }, + { + "epoch": 0.53, + "learning_rate": 2.3533662970272044e-06, + "loss": 1.1129, + "step": 17697 + }, + { + "epoch": 0.53, + "learning_rate": 2.353122797609385e-06, + "loss": 1.0983, + "step": 17698 + }, + { + "epoch": 0.53, + "learning_rate": 2.3528792995897674e-06, + "loss": 1.0754, + "step": 17699 + }, + { + "epoch": 0.53, + "learning_rate": 2.3526358029706665e-06, + "loss": 1.1229, + "step": 17700 + }, + { + "epoch": 0.53, + "learning_rate": 2.352392307754402e-06, + "loss": 1.0343, + "step": 17701 + }, + { + "epoch": 0.53, + "learning_rate": 2.3521488139432917e-06, + "loss": 1.0056, + "step": 17702 + }, + { + "epoch": 0.53, + "learning_rate": 2.3519053215396536e-06, + "loss": 1.0602, + "step": 17703 + }, + { + "epoch": 0.53, + "learning_rate": 2.3516618305458057e-06, + "loss": 1.0366, + "step": 17704 + }, + { + "epoch": 0.53, + "learning_rate": 2.3514183409640655e-06, + "loss": 1.1312, + "step": 17705 + }, + { + "epoch": 0.53, + "learning_rate": 2.351174852796751e-06, + "loss": 1.2712, + "step": 17706 + }, + { + "epoch": 0.53, + "learning_rate": 2.35093136604618e-06, + "loss": 1.1349, + "step": 17707 + }, + { + "epoch": 0.53, + "learning_rate": 2.350687880714672e-06, + "loss": 1.1036, + "step": 17708 + }, + { + "epoch": 0.53, + "learning_rate": 2.350444396804542e-06, + "loss": 1.0292, + "step": 17709 + }, + { + "epoch": 0.53, + "learning_rate": 2.3502009143181097e-06, + "loss": 1.0749, + "step": 17710 + }, + { + "epoch": 0.53, + "learning_rate": 2.3499574332576924e-06, + "loss": 1.0879, + "step": 17711 + }, + { + "epoch": 0.53, + "learning_rate": 2.349713953625609e-06, + "loss": 1.1512, + "step": 17712 + }, + { + "epoch": 0.53, + "learning_rate": 2.3494704754241757e-06, + "loss": 1.0901, + "step": 17713 + }, + { + "epoch": 0.53, + "learning_rate": 2.3492269986557104e-06, + "loss": 1.1611, + "step": 17714 + }, + { + "epoch": 0.53, + "learning_rate": 2.3489835233225323e-06, + "loss": 1.1308, + "step": 17715 + }, + { + "epoch": 0.53, + "learning_rate": 2.3487400494269575e-06, + "loss": 1.1646, + "step": 17716 + }, + { + "epoch": 0.53, + "learning_rate": 2.3484965769713057e-06, + "loss": 1.2386, + "step": 17717 + }, + { + "epoch": 0.53, + "learning_rate": 2.3482531059578927e-06, + "loss": 1.1967, + "step": 17718 + }, + { + "epoch": 0.53, + "learning_rate": 2.3480096363890376e-06, + "loss": 1.1808, + "step": 17719 + }, + { + "epoch": 0.53, + "learning_rate": 2.347766168267057e-06, + "loss": 1.1082, + "step": 17720 + }, + { + "epoch": 0.53, + "learning_rate": 2.34752270159427e-06, + "loss": 1.0819, + "step": 17721 + }, + { + "epoch": 0.53, + "learning_rate": 2.3472792363729922e-06, + "loss": 1.0786, + "step": 17722 + }, + { + "epoch": 0.53, + "learning_rate": 2.3470357726055433e-06, + "loss": 1.0447, + "step": 17723 + }, + { + "epoch": 0.53, + "learning_rate": 2.3467923102942397e-06, + "loss": 1.0661, + "step": 17724 + }, + { + "epoch": 0.53, + "learning_rate": 2.3465488494414007e-06, + "loss": 1.1066, + "step": 17725 + }, + { + "epoch": 0.53, + "learning_rate": 2.346305390049342e-06, + "loss": 1.1354, + "step": 17726 + }, + { + "epoch": 0.53, + "learning_rate": 2.3460619321203814e-06, + "loss": 1.1445, + "step": 17727 + }, + { + "epoch": 0.53, + "learning_rate": 2.345818475656837e-06, + "loss": 1.124, + "step": 17728 + }, + { + "epoch": 0.53, + "learning_rate": 2.345575020661027e-06, + "loss": 1.0741, + "step": 17729 + }, + { + "epoch": 0.53, + "learning_rate": 2.3453315671352695e-06, + "loss": 1.157, + "step": 17730 + }, + { + "epoch": 0.53, + "learning_rate": 2.3450881150818797e-06, + "loss": 1.1747, + "step": 17731 + }, + { + "epoch": 0.53, + "learning_rate": 2.3448446645031763e-06, + "loss": 1.0806, + "step": 17732 + }, + { + "epoch": 0.53, + "learning_rate": 2.3446012154014773e-06, + "loss": 1.1905, + "step": 17733 + }, + { + "epoch": 0.53, + "learning_rate": 2.3443577677791002e-06, + "loss": 1.0507, + "step": 17734 + }, + { + "epoch": 0.53, + "learning_rate": 2.3441143216383616e-06, + "loss": 1.0651, + "step": 17735 + }, + { + "epoch": 0.53, + "learning_rate": 2.34387087698158e-06, + "loss": 1.2676, + "step": 17736 + }, + { + "epoch": 0.53, + "learning_rate": 2.343627433811072e-06, + "loss": 1.2244, + "step": 17737 + }, + { + "epoch": 0.53, + "learning_rate": 2.3433839921291567e-06, + "loss": 1.0086, + "step": 17738 + }, + { + "epoch": 0.53, + "learning_rate": 2.343140551938149e-06, + "loss": 1.0541, + "step": 17739 + }, + { + "epoch": 0.53, + "learning_rate": 2.342897113240368e-06, + "loss": 1.0024, + "step": 17740 + }, + { + "epoch": 0.53, + "learning_rate": 2.342653676038131e-06, + "loss": 1.0677, + "step": 17741 + }, + { + "epoch": 0.53, + "learning_rate": 2.3424102403337552e-06, + "loss": 1.2397, + "step": 17742 + }, + { + "epoch": 0.53, + "learning_rate": 2.3421668061295586e-06, + "loss": 1.3438, + "step": 17743 + }, + { + "epoch": 0.53, + "learning_rate": 2.3419233734278575e-06, + "loss": 1.2859, + "step": 17744 + }, + { + "epoch": 0.53, + "learning_rate": 2.3416799422309696e-06, + "loss": 1.2361, + "step": 17745 + }, + { + "epoch": 0.53, + "learning_rate": 2.341436512541212e-06, + "loss": 1.0815, + "step": 17746 + }, + { + "epoch": 0.53, + "learning_rate": 2.341193084360904e-06, + "loss": 1.0182, + "step": 17747 + }, + { + "epoch": 0.53, + "learning_rate": 2.34094965769236e-06, + "loss": 1.1594, + "step": 17748 + }, + { + "epoch": 0.53, + "learning_rate": 2.3407062325378986e-06, + "loss": 1.139, + "step": 17749 + }, + { + "epoch": 0.53, + "learning_rate": 2.340462808899837e-06, + "loss": 1.1591, + "step": 17750 + }, + { + "epoch": 0.53, + "learning_rate": 2.340219386780494e-06, + "loss": 1.1192, + "step": 17751 + }, + { + "epoch": 0.53, + "learning_rate": 2.339975966182185e-06, + "loss": 1.1324, + "step": 17752 + }, + { + "epoch": 0.53, + "learning_rate": 2.339732547107227e-06, + "loss": 1.0408, + "step": 17753 + }, + { + "epoch": 0.53, + "learning_rate": 2.339489129557938e-06, + "loss": 1.1288, + "step": 17754 + }, + { + "epoch": 0.53, + "learning_rate": 2.3392457135366353e-06, + "loss": 1.217, + "step": 17755 + }, + { + "epoch": 0.53, + "learning_rate": 2.3390022990456372e-06, + "loss": 1.1371, + "step": 17756 + }, + { + "epoch": 0.53, + "learning_rate": 2.338758886087258e-06, + "loss": 1.0761, + "step": 17757 + }, + { + "epoch": 0.53, + "learning_rate": 2.3385154746638173e-06, + "loss": 1.0597, + "step": 17758 + }, + { + "epoch": 0.53, + "learning_rate": 2.338272064777631e-06, + "loss": 0.9728, + "step": 17759 + }, + { + "epoch": 0.54, + "learning_rate": 2.338028656431018e-06, + "loss": 1.0994, + "step": 17760 + }, + { + "epoch": 0.54, + "learning_rate": 2.337785249626293e-06, + "loss": 1.175, + "step": 17761 + }, + { + "epoch": 0.54, + "learning_rate": 2.3375418443657745e-06, + "loss": 1.1479, + "step": 17762 + }, + { + "epoch": 0.54, + "learning_rate": 2.337298440651779e-06, + "loss": 1.1619, + "step": 17763 + }, + { + "epoch": 0.54, + "learning_rate": 2.3370550384866257e-06, + "loss": 1.1138, + "step": 17764 + }, + { + "epoch": 0.54, + "learning_rate": 2.3368116378726286e-06, + "loss": 1.1061, + "step": 17765 + }, + { + "epoch": 0.54, + "learning_rate": 2.336568238812106e-06, + "loss": 1.0891, + "step": 17766 + }, + { + "epoch": 0.54, + "learning_rate": 2.336324841307375e-06, + "loss": 1.1018, + "step": 17767 + }, + { + "epoch": 0.54, + "learning_rate": 2.336081445360753e-06, + "loss": 1.2016, + "step": 17768 + }, + { + "epoch": 0.54, + "learning_rate": 2.3358380509745575e-06, + "loss": 1.0721, + "step": 17769 + }, + { + "epoch": 0.54, + "learning_rate": 2.335594658151104e-06, + "loss": 1.1385, + "step": 17770 + }, + { + "epoch": 0.54, + "learning_rate": 2.3353512668927098e-06, + "loss": 1.1917, + "step": 17771 + }, + { + "epoch": 0.54, + "learning_rate": 2.335107877201692e-06, + "loss": 1.1124, + "step": 17772 + }, + { + "epoch": 0.54, + "learning_rate": 2.334864489080369e-06, + "loss": 1.1806, + "step": 17773 + }, + { + "epoch": 0.54, + "learning_rate": 2.3346211025310555e-06, + "loss": 1.1123, + "step": 17774 + }, + { + "epoch": 0.54, + "learning_rate": 2.33437771755607e-06, + "loss": 1.0895, + "step": 17775 + }, + { + "epoch": 0.54, + "learning_rate": 2.334134334157728e-06, + "loss": 1.1229, + "step": 17776 + }, + { + "epoch": 0.54, + "learning_rate": 2.333890952338349e-06, + "loss": 1.1307, + "step": 17777 + }, + { + "epoch": 0.54, + "learning_rate": 2.333647572100247e-06, + "loss": 1.1388, + "step": 17778 + }, + { + "epoch": 0.54, + "learning_rate": 2.3334041934457395e-06, + "loss": 1.1141, + "step": 17779 + }, + { + "epoch": 0.54, + "learning_rate": 2.3331608163771445e-06, + "loss": 1.2004, + "step": 17780 + }, + { + "epoch": 0.54, + "learning_rate": 2.332917440896778e-06, + "loss": 1.0439, + "step": 17781 + }, + { + "epoch": 0.54, + "learning_rate": 2.3326740670069577e-06, + "loss": 1.0172, + "step": 17782 + }, + { + "epoch": 0.54, + "learning_rate": 2.3324306947099988e-06, + "loss": 1.0563, + "step": 17783 + }, + { + "epoch": 0.54, + "learning_rate": 2.3321873240082192e-06, + "loss": 1.1443, + "step": 17784 + }, + { + "epoch": 0.54, + "learning_rate": 2.3319439549039354e-06, + "loss": 1.1152, + "step": 17785 + }, + { + "epoch": 0.54, + "learning_rate": 2.3317005873994647e-06, + "loss": 1.2224, + "step": 17786 + }, + { + "epoch": 0.54, + "learning_rate": 2.3314572214971225e-06, + "loss": 1.1412, + "step": 17787 + }, + { + "epoch": 0.54, + "learning_rate": 2.331213857199227e-06, + "loss": 1.1866, + "step": 17788 + }, + { + "epoch": 0.54, + "learning_rate": 2.3309704945080937e-06, + "loss": 1.155, + "step": 17789 + }, + { + "epoch": 0.54, + "learning_rate": 2.330727133426041e-06, + "loss": 1.0405, + "step": 17790 + }, + { + "epoch": 0.54, + "learning_rate": 2.3304837739553836e-06, + "loss": 1.1354, + "step": 17791 + }, + { + "epoch": 0.54, + "learning_rate": 2.3302404160984394e-06, + "loss": 1.018, + "step": 17792 + }, + { + "epoch": 0.54, + "learning_rate": 2.329997059857524e-06, + "loss": 1.3019, + "step": 17793 + }, + { + "epoch": 0.54, + "learning_rate": 2.329753705234955e-06, + "loss": 1.1886, + "step": 17794 + }, + { + "epoch": 0.54, + "learning_rate": 2.32951035223305e-06, + "loss": 1.0532, + "step": 17795 + }, + { + "epoch": 0.54, + "learning_rate": 2.329267000854123e-06, + "loss": 1.0341, + "step": 17796 + }, + { + "epoch": 0.54, + "learning_rate": 2.329023651100492e-06, + "loss": 1.2063, + "step": 17797 + }, + { + "epoch": 0.54, + "learning_rate": 2.3287803029744737e-06, + "loss": 1.2145, + "step": 17798 + }, + { + "epoch": 0.54, + "learning_rate": 2.3285369564783848e-06, + "loss": 1.0399, + "step": 17799 + }, + { + "epoch": 0.54, + "learning_rate": 2.3282936116145406e-06, + "loss": 1.1962, + "step": 17800 + }, + { + "epoch": 0.54, + "learning_rate": 2.3280502683852596e-06, + "loss": 1.1145, + "step": 17801 + }, + { + "epoch": 0.54, + "learning_rate": 2.3278069267928566e-06, + "loss": 1.1523, + "step": 17802 + }, + { + "epoch": 0.54, + "learning_rate": 2.327563586839649e-06, + "loss": 1.0355, + "step": 17803 + }, + { + "epoch": 0.54, + "learning_rate": 2.327320248527953e-06, + "loss": 1.2, + "step": 17804 + }, + { + "epoch": 0.54, + "learning_rate": 2.3270769118600844e-06, + "loss": 1.1721, + "step": 17805 + }, + { + "epoch": 0.54, + "learning_rate": 2.3268335768383607e-06, + "loss": 1.0687, + "step": 17806 + }, + { + "epoch": 0.54, + "learning_rate": 2.326590243465098e-06, + "loss": 1.0189, + "step": 17807 + }, + { + "epoch": 0.54, + "learning_rate": 2.3263469117426134e-06, + "loss": 1.1005, + "step": 17808 + }, + { + "epoch": 0.54, + "learning_rate": 2.3261035816732216e-06, + "loss": 1.0297, + "step": 17809 + }, + { + "epoch": 0.54, + "learning_rate": 2.32586025325924e-06, + "loss": 1.1333, + "step": 17810 + }, + { + "epoch": 0.54, + "learning_rate": 2.325616926502985e-06, + "loss": 1.1912, + "step": 17811 + }, + { + "epoch": 0.54, + "learning_rate": 2.325373601406774e-06, + "loss": 1.1102, + "step": 17812 + }, + { + "epoch": 0.54, + "learning_rate": 2.325130277972921e-06, + "loss": 1.1113, + "step": 17813 + }, + { + "epoch": 0.54, + "learning_rate": 2.3248869562037437e-06, + "loss": 1.1414, + "step": 17814 + }, + { + "epoch": 0.54, + "learning_rate": 2.324643636101558e-06, + "loss": 0.976, + "step": 17815 + }, + { + "epoch": 0.54, + "learning_rate": 2.324400317668681e-06, + "loss": 1.0696, + "step": 17816 + }, + { + "epoch": 0.54, + "learning_rate": 2.324157000907428e-06, + "loss": 1.1455, + "step": 17817 + }, + { + "epoch": 0.54, + "learning_rate": 2.323913685820116e-06, + "loss": 1.0747, + "step": 17818 + }, + { + "epoch": 0.54, + "learning_rate": 2.3236703724090606e-06, + "loss": 1.1501, + "step": 17819 + }, + { + "epoch": 0.54, + "learning_rate": 2.323427060676578e-06, + "loss": 1.0789, + "step": 17820 + }, + { + "epoch": 0.54, + "learning_rate": 2.323183750624986e-06, + "loss": 1.1251, + "step": 17821 + }, + { + "epoch": 0.54, + "learning_rate": 2.3229404422565987e-06, + "loss": 1.2043, + "step": 17822 + }, + { + "epoch": 0.54, + "learning_rate": 2.3226971355737328e-06, + "loss": 1.1062, + "step": 17823 + }, + { + "epoch": 0.54, + "learning_rate": 2.322453830578705e-06, + "loss": 1.2261, + "step": 17824 + }, + { + "epoch": 0.54, + "learning_rate": 2.3222105272738324e-06, + "loss": 1.0837, + "step": 17825 + }, + { + "epoch": 0.54, + "learning_rate": 2.3219672256614285e-06, + "loss": 1.0432, + "step": 17826 + }, + { + "epoch": 0.54, + "learning_rate": 2.3217239257438114e-06, + "loss": 1.1446, + "step": 17827 + }, + { + "epoch": 0.54, + "learning_rate": 2.3214806275232964e-06, + "loss": 1.1395, + "step": 17828 + }, + { + "epoch": 0.54, + "learning_rate": 2.3212373310022e-06, + "loss": 1.1439, + "step": 17829 + }, + { + "epoch": 0.54, + "learning_rate": 2.3209940361828383e-06, + "loss": 1.055, + "step": 17830 + }, + { + "epoch": 0.54, + "learning_rate": 2.3207507430675263e-06, + "loss": 1.127, + "step": 17831 + }, + { + "epoch": 0.54, + "learning_rate": 2.3205074516585813e-06, + "loss": 1.049, + "step": 17832 + }, + { + "epoch": 0.54, + "learning_rate": 2.3202641619583203e-06, + "loss": 1.0928, + "step": 17833 + }, + { + "epoch": 0.54, + "learning_rate": 2.3200208739690565e-06, + "loss": 1.1497, + "step": 17834 + }, + { + "epoch": 0.54, + "learning_rate": 2.3197775876931075e-06, + "loss": 1.1057, + "step": 17835 + }, + { + "epoch": 0.54, + "learning_rate": 2.319534303132789e-06, + "loss": 1.0604, + "step": 17836 + }, + { + "epoch": 0.54, + "learning_rate": 2.319291020290417e-06, + "loss": 1.2037, + "step": 17837 + }, + { + "epoch": 0.54, + "learning_rate": 2.3190477391683086e-06, + "loss": 1.0722, + "step": 17838 + }, + { + "epoch": 0.54, + "learning_rate": 2.318804459768777e-06, + "loss": 1.1259, + "step": 17839 + }, + { + "epoch": 0.54, + "learning_rate": 2.3185611820941402e-06, + "loss": 1.1669, + "step": 17840 + }, + { + "epoch": 0.54, + "learning_rate": 2.3183179061467136e-06, + "loss": 1.0861, + "step": 17841 + }, + { + "epoch": 0.54, + "learning_rate": 2.3180746319288134e-06, + "loss": 1.1639, + "step": 17842 + }, + { + "epoch": 0.54, + "learning_rate": 2.3178313594427547e-06, + "loss": 1.3781, + "step": 17843 + }, + { + "epoch": 0.54, + "learning_rate": 2.3175880886908532e-06, + "loss": 1.1547, + "step": 17844 + }, + { + "epoch": 0.54, + "learning_rate": 2.3173448196754256e-06, + "loss": 1.1589, + "step": 17845 + }, + { + "epoch": 0.54, + "learning_rate": 2.317101552398789e-06, + "loss": 1.1058, + "step": 17846 + }, + { + "epoch": 0.54, + "learning_rate": 2.3168582868632556e-06, + "loss": 1.0426, + "step": 17847 + }, + { + "epoch": 0.54, + "learning_rate": 2.3166150230711435e-06, + "loss": 1.061, + "step": 17848 + }, + { + "epoch": 0.54, + "learning_rate": 2.316371761024768e-06, + "loss": 1.0771, + "step": 17849 + }, + { + "epoch": 0.54, + "learning_rate": 2.316128500726445e-06, + "loss": 1.1023, + "step": 17850 + }, + { + "epoch": 0.54, + "learning_rate": 2.3158852421784908e-06, + "loss": 1.1943, + "step": 17851 + }, + { + "epoch": 0.54, + "learning_rate": 2.3156419853832198e-06, + "loss": 1.0563, + "step": 17852 + }, + { + "epoch": 0.54, + "learning_rate": 2.315398730342948e-06, + "loss": 1.0422, + "step": 17853 + }, + { + "epoch": 0.54, + "learning_rate": 2.3151554770599916e-06, + "loss": 1.1459, + "step": 17854 + }, + { + "epoch": 0.54, + "learning_rate": 2.3149122255366664e-06, + "loss": 1.1348, + "step": 17855 + }, + { + "epoch": 0.54, + "learning_rate": 2.314668975775287e-06, + "loss": 1.1788, + "step": 17856 + }, + { + "epoch": 0.54, + "learning_rate": 2.31442572777817e-06, + "loss": 1.0595, + "step": 17857 + }, + { + "epoch": 0.54, + "learning_rate": 2.3141824815476306e-06, + "loss": 1.0934, + "step": 17858 + }, + { + "epoch": 0.54, + "learning_rate": 2.3139392370859856e-06, + "loss": 1.1241, + "step": 17859 + }, + { + "epoch": 0.54, + "learning_rate": 2.3136959943955483e-06, + "loss": 1.1174, + "step": 17860 + }, + { + "epoch": 0.54, + "learning_rate": 2.3134527534786354e-06, + "loss": 1.0275, + "step": 17861 + }, + { + "epoch": 0.54, + "learning_rate": 2.3132095143375627e-06, + "loss": 1.1516, + "step": 17862 + }, + { + "epoch": 0.54, + "learning_rate": 2.3129662769746454e-06, + "loss": 1.0613, + "step": 17863 + }, + { + "epoch": 0.54, + "learning_rate": 2.3127230413922e-06, + "loss": 1.1399, + "step": 17864 + }, + { + "epoch": 0.54, + "learning_rate": 2.3124798075925398e-06, + "loss": 1.0717, + "step": 17865 + }, + { + "epoch": 0.54, + "learning_rate": 2.3122365755779817e-06, + "loss": 1.1523, + "step": 17866 + }, + { + "epoch": 0.54, + "learning_rate": 2.311993345350841e-06, + "loss": 1.0884, + "step": 17867 + }, + { + "epoch": 0.54, + "learning_rate": 2.3117501169134335e-06, + "loss": 1.1827, + "step": 17868 + }, + { + "epoch": 0.54, + "learning_rate": 2.3115068902680737e-06, + "loss": 1.1401, + "step": 17869 + }, + { + "epoch": 0.54, + "learning_rate": 2.3112636654170773e-06, + "loss": 1.1526, + "step": 17870 + }, + { + "epoch": 0.54, + "learning_rate": 2.3110204423627607e-06, + "loss": 1.1631, + "step": 17871 + }, + { + "epoch": 0.54, + "learning_rate": 2.3107772211074387e-06, + "loss": 1.0922, + "step": 17872 + }, + { + "epoch": 0.54, + "learning_rate": 2.310534001653426e-06, + "loss": 1.1733, + "step": 17873 + }, + { + "epoch": 0.54, + "learning_rate": 2.3102907840030376e-06, + "loss": 1.1143, + "step": 17874 + }, + { + "epoch": 0.54, + "learning_rate": 2.3100475681585905e-06, + "loss": 0.9677, + "step": 17875 + }, + { + "epoch": 0.54, + "learning_rate": 2.3098043541223986e-06, + "loss": 1.087, + "step": 17876 + }, + { + "epoch": 0.54, + "learning_rate": 2.3095611418967786e-06, + "loss": 1.1443, + "step": 17877 + }, + { + "epoch": 0.54, + "learning_rate": 2.3093179314840437e-06, + "loss": 1.108, + "step": 17878 + }, + { + "epoch": 0.54, + "learning_rate": 2.3090747228865102e-06, + "loss": 1.244, + "step": 17879 + }, + { + "epoch": 0.54, + "learning_rate": 2.308831516106494e-06, + "loss": 1.0193, + "step": 17880 + }, + { + "epoch": 0.54, + "learning_rate": 2.30858831114631e-06, + "loss": 1.0667, + "step": 17881 + }, + { + "epoch": 0.54, + "learning_rate": 2.308345108008272e-06, + "loss": 1.0972, + "step": 17882 + }, + { + "epoch": 0.54, + "learning_rate": 2.3081019066946974e-06, + "loss": 1.1454, + "step": 17883 + }, + { + "epoch": 0.54, + "learning_rate": 2.3078587072078994e-06, + "loss": 0.9938, + "step": 17884 + }, + { + "epoch": 0.54, + "learning_rate": 2.3076155095501945e-06, + "loss": 1.1201, + "step": 17885 + }, + { + "epoch": 0.54, + "learning_rate": 2.3073723137238968e-06, + "loss": 1.1588, + "step": 17886 + }, + { + "epoch": 0.54, + "learning_rate": 2.307129119731322e-06, + "loss": 1.0956, + "step": 17887 + }, + { + "epoch": 0.54, + "learning_rate": 2.3068859275747853e-06, + "loss": 1.1949, + "step": 17888 + }, + { + "epoch": 0.54, + "learning_rate": 2.306642737256601e-06, + "loss": 1.1558, + "step": 17889 + }, + { + "epoch": 0.54, + "learning_rate": 2.306399548779086e-06, + "loss": 1.0258, + "step": 17890 + }, + { + "epoch": 0.54, + "learning_rate": 2.3061563621445533e-06, + "loss": 1.0752, + "step": 17891 + }, + { + "epoch": 0.54, + "learning_rate": 2.3059131773553185e-06, + "loss": 1.1754, + "step": 17892 + }, + { + "epoch": 0.54, + "learning_rate": 2.3056699944136964e-06, + "loss": 1.2034, + "step": 17893 + }, + { + "epoch": 0.54, + "learning_rate": 2.305426813322004e-06, + "loss": 1.116, + "step": 17894 + }, + { + "epoch": 0.54, + "learning_rate": 2.305183634082553e-06, + "loss": 1.0852, + "step": 17895 + }, + { + "epoch": 0.54, + "learning_rate": 2.3049404566976603e-06, + "loss": 1.0648, + "step": 17896 + }, + { + "epoch": 0.54, + "learning_rate": 2.3046972811696407e-06, + "loss": 1.1026, + "step": 17897 + }, + { + "epoch": 0.54, + "learning_rate": 2.3044541075008093e-06, + "loss": 1.0375, + "step": 17898 + }, + { + "epoch": 0.54, + "learning_rate": 2.30421093569348e-06, + "loss": 1.0334, + "step": 17899 + }, + { + "epoch": 0.54, + "learning_rate": 2.303967765749968e-06, + "loss": 1.1661, + "step": 17900 + }, + { + "epoch": 0.54, + "learning_rate": 2.303724597672589e-06, + "loss": 1.0857, + "step": 17901 + }, + { + "epoch": 0.54, + "learning_rate": 2.303481431463657e-06, + "loss": 1.0761, + "step": 17902 + }, + { + "epoch": 0.54, + "learning_rate": 2.303238267125488e-06, + "loss": 1.1642, + "step": 17903 + }, + { + "epoch": 0.54, + "learning_rate": 2.3029951046603954e-06, + "loss": 1.1219, + "step": 17904 + }, + { + "epoch": 0.54, + "learning_rate": 2.3027519440706946e-06, + "loss": 1.1416, + "step": 17905 + }, + { + "epoch": 0.54, + "learning_rate": 2.3025087853587e-06, + "loss": 1.1442, + "step": 17906 + }, + { + "epoch": 0.54, + "learning_rate": 2.3022656285267277e-06, + "loss": 1.1573, + "step": 17907 + }, + { + "epoch": 0.54, + "learning_rate": 2.3020224735770897e-06, + "loss": 1.145, + "step": 17908 + }, + { + "epoch": 0.54, + "learning_rate": 2.3017793205121035e-06, + "loss": 1.1876, + "step": 17909 + }, + { + "epoch": 0.54, + "learning_rate": 2.301536169334082e-06, + "loss": 1.0182, + "step": 17910 + }, + { + "epoch": 0.54, + "learning_rate": 2.3012930200453412e-06, + "loss": 1.0781, + "step": 17911 + }, + { + "epoch": 0.54, + "learning_rate": 2.3010498726481946e-06, + "loss": 1.1653, + "step": 17912 + }, + { + "epoch": 0.54, + "learning_rate": 2.300806727144958e-06, + "loss": 1.1747, + "step": 17913 + }, + { + "epoch": 0.54, + "learning_rate": 2.300563583537945e-06, + "loss": 1.1688, + "step": 17914 + }, + { + "epoch": 0.54, + "learning_rate": 2.3003204418294703e-06, + "loss": 1.0754, + "step": 17915 + }, + { + "epoch": 0.54, + "learning_rate": 2.30007730202185e-06, + "loss": 1.1868, + "step": 17916 + }, + { + "epoch": 0.54, + "learning_rate": 2.299834164117397e-06, + "loss": 1.1396, + "step": 17917 + }, + { + "epoch": 0.54, + "learning_rate": 2.299591028118426e-06, + "loss": 1.0947, + "step": 17918 + }, + { + "epoch": 0.54, + "learning_rate": 2.2993478940272516e-06, + "loss": 1.2048, + "step": 17919 + }, + { + "epoch": 0.54, + "learning_rate": 2.2991047618461897e-06, + "loss": 1.1492, + "step": 17920 + }, + { + "epoch": 0.54, + "learning_rate": 2.298861631577553e-06, + "loss": 1.1761, + "step": 17921 + }, + { + "epoch": 0.54, + "learning_rate": 2.2986185032236567e-06, + "loss": 1.0856, + "step": 17922 + }, + { + "epoch": 0.54, + "learning_rate": 2.298375376786815e-06, + "loss": 1.1476, + "step": 17923 + }, + { + "epoch": 0.54, + "learning_rate": 2.2981322522693435e-06, + "loss": 1.285, + "step": 17924 + }, + { + "epoch": 0.54, + "learning_rate": 2.2978891296735546e-06, + "loss": 1.1172, + "step": 17925 + }, + { + "epoch": 0.54, + "learning_rate": 2.2976460090017645e-06, + "loss": 1.1146, + "step": 17926 + }, + { + "epoch": 0.54, + "learning_rate": 2.2974028902562862e-06, + "loss": 1.0789, + "step": 17927 + }, + { + "epoch": 0.54, + "learning_rate": 2.297159773439436e-06, + "loss": 1.0423, + "step": 17928 + }, + { + "epoch": 0.54, + "learning_rate": 2.296916658553527e-06, + "loss": 1.1729, + "step": 17929 + }, + { + "epoch": 0.54, + "learning_rate": 2.296673545600873e-06, + "loss": 1.0632, + "step": 17930 + }, + { + "epoch": 0.54, + "learning_rate": 2.296430434583789e-06, + "loss": 1.114, + "step": 17931 + }, + { + "epoch": 0.54, + "learning_rate": 2.2961873255045888e-06, + "loss": 1.0713, + "step": 17932 + }, + { + "epoch": 0.54, + "learning_rate": 2.2959442183655887e-06, + "loss": 1.1425, + "step": 17933 + }, + { + "epoch": 0.54, + "learning_rate": 2.2957011131691e-06, + "loss": 1.1416, + "step": 17934 + }, + { + "epoch": 0.54, + "learning_rate": 2.2954580099174382e-06, + "loss": 1.264, + "step": 17935 + }, + { + "epoch": 0.54, + "learning_rate": 2.2952149086129176e-06, + "loss": 1.246, + "step": 17936 + }, + { + "epoch": 0.54, + "learning_rate": 2.294971809257853e-06, + "loss": 1.1634, + "step": 17937 + }, + { + "epoch": 0.54, + "learning_rate": 2.294728711854558e-06, + "loss": 1.0889, + "step": 17938 + }, + { + "epoch": 0.54, + "learning_rate": 2.2944856164053465e-06, + "loss": 1.1234, + "step": 17939 + }, + { + "epoch": 0.54, + "learning_rate": 2.294242522912533e-06, + "loss": 1.0488, + "step": 17940 + }, + { + "epoch": 0.54, + "learning_rate": 2.2939994313784316e-06, + "loss": 1.0948, + "step": 17941 + }, + { + "epoch": 0.54, + "learning_rate": 2.293756341805357e-06, + "loss": 1.0878, + "step": 17942 + }, + { + "epoch": 0.54, + "learning_rate": 2.293513254195622e-06, + "loss": 1.1338, + "step": 17943 + }, + { + "epoch": 0.54, + "learning_rate": 2.2932701685515416e-06, + "loss": 1.1278, + "step": 17944 + }, + { + "epoch": 0.54, + "learning_rate": 2.293027084875429e-06, + "loss": 1.1636, + "step": 17945 + }, + { + "epoch": 0.54, + "learning_rate": 2.292784003169601e-06, + "loss": 1.1552, + "step": 17946 + }, + { + "epoch": 0.54, + "learning_rate": 2.292540923436367e-06, + "loss": 1.0325, + "step": 17947 + }, + { + "epoch": 0.54, + "learning_rate": 2.292297845678045e-06, + "loss": 1.1451, + "step": 17948 + }, + { + "epoch": 0.54, + "learning_rate": 2.2920547698969462e-06, + "loss": 1.1627, + "step": 17949 + }, + { + "epoch": 0.54, + "learning_rate": 2.2918116960953872e-06, + "loss": 1.0489, + "step": 17950 + }, + { + "epoch": 0.54, + "learning_rate": 2.2915686242756795e-06, + "loss": 1.1661, + "step": 17951 + }, + { + "epoch": 0.54, + "learning_rate": 2.291325554440139e-06, + "loss": 1.1182, + "step": 17952 + }, + { + "epoch": 0.54, + "learning_rate": 2.2910824865910776e-06, + "loss": 1.1021, + "step": 17953 + }, + { + "epoch": 0.54, + "learning_rate": 2.2908394207308107e-06, + "loss": 1.0729, + "step": 17954 + }, + { + "epoch": 0.54, + "learning_rate": 2.290596356861653e-06, + "loss": 1.1447, + "step": 17955 + }, + { + "epoch": 0.54, + "learning_rate": 2.290353294985916e-06, + "loss": 1.1754, + "step": 17956 + }, + { + "epoch": 0.54, + "learning_rate": 2.2901102351059146e-06, + "loss": 1.0977, + "step": 17957 + }, + { + "epoch": 0.54, + "learning_rate": 2.289867177223963e-06, + "loss": 1.1412, + "step": 17958 + }, + { + "epoch": 0.54, + "learning_rate": 2.289624121342375e-06, + "loss": 1.1151, + "step": 17959 + }, + { + "epoch": 0.54, + "learning_rate": 2.2893810674634635e-06, + "loss": 1.0294, + "step": 17960 + }, + { + "epoch": 0.54, + "learning_rate": 2.289138015589543e-06, + "loss": 1.1173, + "step": 17961 + }, + { + "epoch": 0.54, + "learning_rate": 2.2888949657229266e-06, + "loss": 1.1387, + "step": 17962 + }, + { + "epoch": 0.54, + "learning_rate": 2.2886519178659296e-06, + "loss": 1.0193, + "step": 17963 + }, + { + "epoch": 0.54, + "learning_rate": 2.2884088720208637e-06, + "loss": 1.1984, + "step": 17964 + }, + { + "epoch": 0.54, + "learning_rate": 2.2881658281900434e-06, + "loss": 1.0898, + "step": 17965 + }, + { + "epoch": 0.54, + "learning_rate": 2.2879227863757824e-06, + "loss": 1.0623, + "step": 17966 + }, + { + "epoch": 0.54, + "learning_rate": 2.2876797465803943e-06, + "loss": 1.1184, + "step": 17967 + }, + { + "epoch": 0.54, + "learning_rate": 2.2874367088061933e-06, + "loss": 1.2573, + "step": 17968 + }, + { + "epoch": 0.54, + "learning_rate": 2.287193673055492e-06, + "loss": 1.1638, + "step": 17969 + }, + { + "epoch": 0.54, + "learning_rate": 2.2869506393306042e-06, + "loss": 1.096, + "step": 17970 + }, + { + "epoch": 0.54, + "learning_rate": 2.286707607633844e-06, + "loss": 1.0582, + "step": 17971 + }, + { + "epoch": 0.54, + "learning_rate": 2.2864645779675253e-06, + "loss": 1.1683, + "step": 17972 + }, + { + "epoch": 0.54, + "learning_rate": 2.2862215503339604e-06, + "loss": 1.06, + "step": 17973 + }, + { + "epoch": 0.54, + "learning_rate": 2.285978524735463e-06, + "loss": 1.1022, + "step": 17974 + }, + { + "epoch": 0.54, + "learning_rate": 2.2857355011743472e-06, + "loss": 1.1902, + "step": 17975 + }, + { + "epoch": 0.54, + "learning_rate": 2.2854924796529264e-06, + "loss": 1.0507, + "step": 17976 + }, + { + "epoch": 0.54, + "learning_rate": 2.2852494601735143e-06, + "loss": 1.0672, + "step": 17977 + }, + { + "epoch": 0.54, + "learning_rate": 2.2850064427384234e-06, + "loss": 1.1664, + "step": 17978 + }, + { + "epoch": 0.54, + "learning_rate": 2.284763427349967e-06, + "loss": 1.11, + "step": 17979 + }, + { + "epoch": 0.54, + "learning_rate": 2.28452041401046e-06, + "loss": 1.1002, + "step": 17980 + }, + { + "epoch": 0.54, + "learning_rate": 2.284277402722215e-06, + "loss": 1.0376, + "step": 17981 + }, + { + "epoch": 0.54, + "learning_rate": 2.2840343934875443e-06, + "loss": 1.1178, + "step": 17982 + }, + { + "epoch": 0.54, + "learning_rate": 2.2837913863087625e-06, + "loss": 1.0887, + "step": 17983 + }, + { + "epoch": 0.54, + "learning_rate": 2.2835483811881826e-06, + "loss": 1.1103, + "step": 17984 + }, + { + "epoch": 0.54, + "learning_rate": 2.2833053781281193e-06, + "loss": 1.0372, + "step": 17985 + }, + { + "epoch": 0.54, + "learning_rate": 2.283062377130883e-06, + "loss": 1.1641, + "step": 17986 + }, + { + "epoch": 0.54, + "learning_rate": 2.2828193781987882e-06, + "loss": 1.2638, + "step": 17987 + }, + { + "epoch": 0.54, + "learning_rate": 2.2825763813341487e-06, + "loss": 1.1404, + "step": 17988 + }, + { + "epoch": 0.54, + "learning_rate": 2.2823333865392783e-06, + "loss": 1.0997, + "step": 17989 + }, + { + "epoch": 0.54, + "learning_rate": 2.282090393816488e-06, + "loss": 0.9881, + "step": 17990 + }, + { + "epoch": 0.54, + "learning_rate": 2.281847403168092e-06, + "loss": 1.0866, + "step": 17991 + }, + { + "epoch": 0.54, + "learning_rate": 2.2816044145964044e-06, + "loss": 1.0726, + "step": 17992 + }, + { + "epoch": 0.54, + "learning_rate": 2.2813614281037367e-06, + "loss": 1.1799, + "step": 17993 + }, + { + "epoch": 0.54, + "learning_rate": 2.2811184436924043e-06, + "loss": 1.1099, + "step": 17994 + }, + { + "epoch": 0.54, + "learning_rate": 2.280875461364718e-06, + "loss": 1.1019, + "step": 17995 + }, + { + "epoch": 0.54, + "learning_rate": 2.280632481122991e-06, + "loss": 1.1669, + "step": 17996 + }, + { + "epoch": 0.54, + "learning_rate": 2.2803895029695385e-06, + "loss": 1.0225, + "step": 17997 + }, + { + "epoch": 0.54, + "learning_rate": 2.280146526906672e-06, + "loss": 1.0673, + "step": 17998 + }, + { + "epoch": 0.54, + "learning_rate": 2.2799035529367047e-06, + "loss": 1.1801, + "step": 17999 + }, + { + "epoch": 0.54, + "learning_rate": 2.2796605810619486e-06, + "loss": 1.213, + "step": 18000 + }, + { + "epoch": 0.54, + "learning_rate": 2.2794176112847185e-06, + "loss": 1.1671, + "step": 18001 + }, + { + "epoch": 0.54, + "learning_rate": 2.279174643607327e-06, + "loss": 1.2006, + "step": 18002 + }, + { + "epoch": 0.54, + "learning_rate": 2.2789316780320854e-06, + "loss": 1.1066, + "step": 18003 + }, + { + "epoch": 0.54, + "learning_rate": 2.2786887145613082e-06, + "loss": 1.1656, + "step": 18004 + }, + { + "epoch": 0.54, + "learning_rate": 2.2784457531973073e-06, + "loss": 1.1382, + "step": 18005 + }, + { + "epoch": 0.54, + "learning_rate": 2.278202793942397e-06, + "loss": 1.2499, + "step": 18006 + }, + { + "epoch": 0.54, + "learning_rate": 2.2779598367988893e-06, + "loss": 1.0899, + "step": 18007 + }, + { + "epoch": 0.54, + "learning_rate": 2.2777168817690966e-06, + "loss": 1.1957, + "step": 18008 + }, + { + "epoch": 0.54, + "learning_rate": 2.2774739288553314e-06, + "loss": 1.1103, + "step": 18009 + }, + { + "epoch": 0.54, + "learning_rate": 2.277230978059908e-06, + "loss": 1.0168, + "step": 18010 + }, + { + "epoch": 0.54, + "learning_rate": 2.276988029385139e-06, + "loss": 1.1492, + "step": 18011 + }, + { + "epoch": 0.54, + "learning_rate": 2.2767450828333364e-06, + "loss": 1.0789, + "step": 18012 + }, + { + "epoch": 0.54, + "learning_rate": 2.276502138406812e-06, + "loss": 1.105, + "step": 18013 + }, + { + "epoch": 0.54, + "learning_rate": 2.27625919610788e-06, + "loss": 1.113, + "step": 18014 + }, + { + "epoch": 0.54, + "learning_rate": 2.2760162559388544e-06, + "loss": 1.1089, + "step": 18015 + }, + { + "epoch": 0.54, + "learning_rate": 2.2757733179020443e-06, + "loss": 1.0838, + "step": 18016 + }, + { + "epoch": 0.54, + "learning_rate": 2.2755303819997645e-06, + "loss": 1.1396, + "step": 18017 + }, + { + "epoch": 0.54, + "learning_rate": 2.2752874482343273e-06, + "loss": 1.1951, + "step": 18018 + }, + { + "epoch": 0.54, + "learning_rate": 2.275044516608046e-06, + "loss": 0.9342, + "step": 18019 + }, + { + "epoch": 0.54, + "learning_rate": 2.2748015871232316e-06, + "loss": 1.1271, + "step": 18020 + }, + { + "epoch": 0.54, + "learning_rate": 2.274558659782198e-06, + "loss": 1.1769, + "step": 18021 + }, + { + "epoch": 0.54, + "learning_rate": 2.2743157345872573e-06, + "loss": 1.1077, + "step": 18022 + }, + { + "epoch": 0.54, + "learning_rate": 2.2740728115407222e-06, + "loss": 1.1451, + "step": 18023 + }, + { + "epoch": 0.54, + "learning_rate": 2.2738298906449063e-06, + "loss": 1.1132, + "step": 18024 + }, + { + "epoch": 0.54, + "learning_rate": 2.2735869719021197e-06, + "loss": 1.1983, + "step": 18025 + }, + { + "epoch": 0.54, + "learning_rate": 2.2733440553146763e-06, + "loss": 1.0949, + "step": 18026 + }, + { + "epoch": 0.54, + "learning_rate": 2.273101140884888e-06, + "loss": 0.9958, + "step": 18027 + }, + { + "epoch": 0.54, + "learning_rate": 2.2728582286150687e-06, + "loss": 1.0139, + "step": 18028 + }, + { + "epoch": 0.54, + "learning_rate": 2.2726153185075285e-06, + "loss": 1.1438, + "step": 18029 + }, + { + "epoch": 0.54, + "learning_rate": 2.2723724105645815e-06, + "loss": 1.2711, + "step": 18030 + }, + { + "epoch": 0.54, + "learning_rate": 2.272129504788539e-06, + "loss": 1.0338, + "step": 18031 + }, + { + "epoch": 0.54, + "learning_rate": 2.2718866011817146e-06, + "loss": 1.0909, + "step": 18032 + }, + { + "epoch": 0.54, + "learning_rate": 2.271643699746419e-06, + "loss": 1.1151, + "step": 18033 + }, + { + "epoch": 0.54, + "learning_rate": 2.2714008004849657e-06, + "loss": 1.2095, + "step": 18034 + }, + { + "epoch": 0.54, + "learning_rate": 2.271157903399667e-06, + "loss": 1.0557, + "step": 18035 + }, + { + "epoch": 0.54, + "learning_rate": 2.2709150084928342e-06, + "loss": 1.105, + "step": 18036 + }, + { + "epoch": 0.54, + "learning_rate": 2.2706721157667815e-06, + "loss": 1.3624, + "step": 18037 + }, + { + "epoch": 0.54, + "learning_rate": 2.270429225223819e-06, + "loss": 1.1249, + "step": 18038 + }, + { + "epoch": 0.54, + "learning_rate": 2.2701863368662596e-06, + "loss": 1.033, + "step": 18039 + }, + { + "epoch": 0.54, + "learning_rate": 2.2699434506964156e-06, + "loss": 0.9906, + "step": 18040 + }, + { + "epoch": 0.54, + "learning_rate": 2.2697005667166e-06, + "loss": 1.1824, + "step": 18041 + }, + { + "epoch": 0.54, + "learning_rate": 2.269457684929123e-06, + "loss": 1.1722, + "step": 18042 + }, + { + "epoch": 0.54, + "learning_rate": 2.269214805336298e-06, + "loss": 1.1271, + "step": 18043 + }, + { + "epoch": 0.54, + "learning_rate": 2.268971927940437e-06, + "loss": 1.1633, + "step": 18044 + }, + { + "epoch": 0.54, + "learning_rate": 2.2687290527438524e-06, + "loss": 1.0611, + "step": 18045 + }, + { + "epoch": 0.54, + "learning_rate": 2.2684861797488554e-06, + "loss": 1.022, + "step": 18046 + }, + { + "epoch": 0.54, + "learning_rate": 2.268243308957758e-06, + "loss": 1.2524, + "step": 18047 + }, + { + "epoch": 0.54, + "learning_rate": 2.2680004403728737e-06, + "loss": 1.0893, + "step": 18048 + }, + { + "epoch": 0.54, + "learning_rate": 2.2677575739965125e-06, + "loss": 1.1204, + "step": 18049 + }, + { + "epoch": 0.54, + "learning_rate": 2.2675147098309886e-06, + "loss": 1.1778, + "step": 18050 + }, + { + "epoch": 0.54, + "learning_rate": 2.2672718478786115e-06, + "loss": 1.2583, + "step": 18051 + }, + { + "epoch": 0.54, + "learning_rate": 2.2670289881416944e-06, + "loss": 1.1497, + "step": 18052 + }, + { + "epoch": 0.54, + "learning_rate": 2.2667861306225492e-06, + "loss": 1.2189, + "step": 18053 + }, + { + "epoch": 0.54, + "learning_rate": 2.2665432753234893e-06, + "loss": 1.1579, + "step": 18054 + }, + { + "epoch": 0.54, + "learning_rate": 2.2663004222468236e-06, + "loss": 1.1885, + "step": 18055 + }, + { + "epoch": 0.54, + "learning_rate": 2.2660575713948653e-06, + "loss": 1.2435, + "step": 18056 + }, + { + "epoch": 0.54, + "learning_rate": 2.265814722769926e-06, + "loss": 1.0852, + "step": 18057 + }, + { + "epoch": 0.54, + "learning_rate": 2.2655718763743183e-06, + "loss": 1.2139, + "step": 18058 + }, + { + "epoch": 0.54, + "learning_rate": 2.2653290322103534e-06, + "loss": 1.0938, + "step": 18059 + }, + { + "epoch": 0.54, + "learning_rate": 2.2650861902803427e-06, + "loss": 1.093, + "step": 18060 + }, + { + "epoch": 0.54, + "learning_rate": 2.2648433505865985e-06, + "loss": 1.0687, + "step": 18061 + }, + { + "epoch": 0.54, + "learning_rate": 2.2646005131314324e-06, + "loss": 1.179, + "step": 18062 + }, + { + "epoch": 0.54, + "learning_rate": 2.2643576779171562e-06, + "loss": 1.0114, + "step": 18063 + }, + { + "epoch": 0.54, + "learning_rate": 2.2641148449460813e-06, + "loss": 1.1006, + "step": 18064 + }, + { + "epoch": 0.54, + "learning_rate": 2.263872014220519e-06, + "loss": 1.0641, + "step": 18065 + }, + { + "epoch": 0.54, + "learning_rate": 2.2636291857427815e-06, + "loss": 1.0594, + "step": 18066 + }, + { + "epoch": 0.54, + "learning_rate": 2.2633863595151815e-06, + "loss": 1.0418, + "step": 18067 + }, + { + "epoch": 0.54, + "learning_rate": 2.263143535540029e-06, + "loss": 1.1778, + "step": 18068 + }, + { + "epoch": 0.54, + "learning_rate": 2.262900713819635e-06, + "loss": 1.1264, + "step": 18069 + }, + { + "epoch": 0.54, + "learning_rate": 2.2626578943563123e-06, + "loss": 1.1305, + "step": 18070 + }, + { + "epoch": 0.54, + "learning_rate": 2.2624150771523733e-06, + "loss": 1.0362, + "step": 18071 + }, + { + "epoch": 0.54, + "learning_rate": 2.2621722622101274e-06, + "loss": 1.1409, + "step": 18072 + }, + { + "epoch": 0.54, + "learning_rate": 2.2619294495318866e-06, + "loss": 1.0719, + "step": 18073 + }, + { + "epoch": 0.54, + "learning_rate": 2.2616866391199634e-06, + "loss": 1.0665, + "step": 18074 + }, + { + "epoch": 0.54, + "learning_rate": 2.261443830976668e-06, + "loss": 1.2274, + "step": 18075 + }, + { + "epoch": 0.54, + "learning_rate": 2.2612010251043132e-06, + "loss": 1.0765, + "step": 18076 + }, + { + "epoch": 0.54, + "learning_rate": 2.260958221505209e-06, + "loss": 1.1395, + "step": 18077 + }, + { + "epoch": 0.54, + "learning_rate": 2.2607154201816676e-06, + "loss": 1.0714, + "step": 18078 + }, + { + "epoch": 0.54, + "learning_rate": 2.260472621136e-06, + "loss": 1.149, + "step": 18079 + }, + { + "epoch": 0.54, + "learning_rate": 2.260229824370519e-06, + "loss": 1.1862, + "step": 18080 + }, + { + "epoch": 0.54, + "learning_rate": 2.2599870298875332e-06, + "loss": 1.1392, + "step": 18081 + }, + { + "epoch": 0.54, + "learning_rate": 2.2597442376893556e-06, + "loss": 1.2115, + "step": 18082 + }, + { + "epoch": 0.54, + "learning_rate": 2.2595014477782966e-06, + "loss": 1.0696, + "step": 18083 + }, + { + "epoch": 0.54, + "learning_rate": 2.2592586601566694e-06, + "loss": 1.0773, + "step": 18084 + }, + { + "epoch": 0.54, + "learning_rate": 2.259015874826783e-06, + "loss": 1.1665, + "step": 18085 + }, + { + "epoch": 0.54, + "learning_rate": 2.2587730917909494e-06, + "loss": 1.0889, + "step": 18086 + }, + { + "epoch": 0.54, + "learning_rate": 2.2585303110514793e-06, + "loss": 1.3147, + "step": 18087 + }, + { + "epoch": 0.54, + "learning_rate": 2.2582875326106846e-06, + "loss": 1.2256, + "step": 18088 + }, + { + "epoch": 0.54, + "learning_rate": 2.258044756470877e-06, + "loss": 1.1449, + "step": 18089 + }, + { + "epoch": 0.54, + "learning_rate": 2.257801982634366e-06, + "loss": 1.1347, + "step": 18090 + }, + { + "epoch": 0.54, + "learning_rate": 2.257559211103463e-06, + "loss": 1.0779, + "step": 18091 + }, + { + "epoch": 0.55, + "learning_rate": 2.2573164418804804e-06, + "loss": 1.0465, + "step": 18092 + }, + { + "epoch": 0.55, + "learning_rate": 2.257073674967729e-06, + "loss": 1.136, + "step": 18093 + }, + { + "epoch": 0.55, + "learning_rate": 2.256830910367518e-06, + "loss": 1.0714, + "step": 18094 + }, + { + "epoch": 0.55, + "learning_rate": 2.25658814808216e-06, + "loss": 1.167, + "step": 18095 + }, + { + "epoch": 0.55, + "learning_rate": 2.2563453881139655e-06, + "loss": 1.0149, + "step": 18096 + }, + { + "epoch": 0.55, + "learning_rate": 2.2561026304652467e-06, + "loss": 1.2555, + "step": 18097 + }, + { + "epoch": 0.55, + "learning_rate": 2.255859875138312e-06, + "loss": 1.1705, + "step": 18098 + }, + { + "epoch": 0.55, + "learning_rate": 2.2556171221354737e-06, + "loss": 1.1713, + "step": 18099 + }, + { + "epoch": 0.55, + "learning_rate": 2.255374371459043e-06, + "loss": 1.1959, + "step": 18100 + }, + { + "epoch": 0.55, + "learning_rate": 2.2551316231113305e-06, + "loss": 1.1097, + "step": 18101 + }, + { + "epoch": 0.55, + "learning_rate": 2.2548888770946475e-06, + "loss": 1.0309, + "step": 18102 + }, + { + "epoch": 0.55, + "learning_rate": 2.254646133411304e-06, + "loss": 1.0237, + "step": 18103 + }, + { + "epoch": 0.55, + "learning_rate": 2.2544033920636105e-06, + "loss": 1.177, + "step": 18104 + }, + { + "epoch": 0.55, + "learning_rate": 2.2541606530538788e-06, + "loss": 1.158, + "step": 18105 + }, + { + "epoch": 0.55, + "learning_rate": 2.2539179163844203e-06, + "loss": 1.2885, + "step": 18106 + }, + { + "epoch": 0.55, + "learning_rate": 2.2536751820575437e-06, + "loss": 1.2416, + "step": 18107 + }, + { + "epoch": 0.55, + "learning_rate": 2.253432450075561e-06, + "loss": 1.103, + "step": 18108 + }, + { + "epoch": 0.55, + "learning_rate": 2.2531897204407822e-06, + "loss": 1.1451, + "step": 18109 + }, + { + "epoch": 0.55, + "learning_rate": 2.2529469931555197e-06, + "loss": 1.1119, + "step": 18110 + }, + { + "epoch": 0.55, + "learning_rate": 2.2527042682220813e-06, + "loss": 1.0897, + "step": 18111 + }, + { + "epoch": 0.55, + "learning_rate": 2.2524615456427796e-06, + "loss": 1.1478, + "step": 18112 + }, + { + "epoch": 0.55, + "learning_rate": 2.252218825419925e-06, + "loss": 0.9619, + "step": 18113 + }, + { + "epoch": 0.55, + "learning_rate": 2.2519761075558273e-06, + "loss": 1.1378, + "step": 18114 + }, + { + "epoch": 0.55, + "learning_rate": 2.2517333920527985e-06, + "loss": 1.0628, + "step": 18115 + }, + { + "epoch": 0.55, + "learning_rate": 2.251490678913148e-06, + "loss": 1.2644, + "step": 18116 + }, + { + "epoch": 0.55, + "learning_rate": 2.251247968139186e-06, + "loss": 1.1713, + "step": 18117 + }, + { + "epoch": 0.55, + "learning_rate": 2.2510052597332237e-06, + "loss": 1.1979, + "step": 18118 + }, + { + "epoch": 0.55, + "learning_rate": 2.250762553697572e-06, + "loss": 1.0833, + "step": 18119 + }, + { + "epoch": 0.55, + "learning_rate": 2.2505198500345404e-06, + "loss": 1.1165, + "step": 18120 + }, + { + "epoch": 0.55, + "learning_rate": 2.2502771487464393e-06, + "loss": 1.1527, + "step": 18121 + }, + { + "epoch": 0.55, + "learning_rate": 2.2500344498355798e-06, + "loss": 1.1602, + "step": 18122 + }, + { + "epoch": 0.55, + "learning_rate": 2.2497917533042725e-06, + "loss": 1.2247, + "step": 18123 + }, + { + "epoch": 0.55, + "learning_rate": 2.2495490591548266e-06, + "loss": 1.1793, + "step": 18124 + }, + { + "epoch": 0.55, + "learning_rate": 2.249306367389553e-06, + "loss": 1.0504, + "step": 18125 + }, + { + "epoch": 0.55, + "learning_rate": 2.249063678010762e-06, + "loss": 1.0657, + "step": 18126 + }, + { + "epoch": 0.55, + "learning_rate": 2.2488209910207637e-06, + "loss": 1.1174, + "step": 18127 + }, + { + "epoch": 0.55, + "learning_rate": 2.2485783064218692e-06, + "loss": 1.1944, + "step": 18128 + }, + { + "epoch": 0.55, + "learning_rate": 2.248335624216388e-06, + "loss": 1.1447, + "step": 18129 + }, + { + "epoch": 0.55, + "learning_rate": 2.2480929444066304e-06, + "loss": 1.1688, + "step": 18130 + }, + { + "epoch": 0.55, + "learning_rate": 2.2478502669949066e-06, + "loss": 1.2103, + "step": 18131 + }, + { + "epoch": 0.55, + "learning_rate": 2.247607591983527e-06, + "loss": 1.0257, + "step": 18132 + }, + { + "epoch": 0.55, + "learning_rate": 2.2473649193748013e-06, + "loss": 1.0659, + "step": 18133 + }, + { + "epoch": 0.55, + "learning_rate": 2.2471222491710394e-06, + "loss": 1.075, + "step": 18134 + }, + { + "epoch": 0.55, + "learning_rate": 2.2468795813745524e-06, + "loss": 1.1161, + "step": 18135 + }, + { + "epoch": 0.55, + "learning_rate": 2.246636915987651e-06, + "loss": 1.2588, + "step": 18136 + }, + { + "epoch": 0.55, + "learning_rate": 2.246394253012643e-06, + "loss": 1.224, + "step": 18137 + }, + { + "epoch": 0.55, + "learning_rate": 2.246151592451839e-06, + "loss": 1.1235, + "step": 18138 + }, + { + "epoch": 0.55, + "learning_rate": 2.24590893430755e-06, + "loss": 1.1529, + "step": 18139 + }, + { + "epoch": 0.55, + "learning_rate": 2.245666278582086e-06, + "loss": 1.1209, + "step": 18140 + }, + { + "epoch": 0.55, + "learning_rate": 2.245423625277757e-06, + "loss": 1.1331, + "step": 18141 + }, + { + "epoch": 0.55, + "learning_rate": 2.2451809743968717e-06, + "loss": 1.1258, + "step": 18142 + }, + { + "epoch": 0.55, + "learning_rate": 2.244938325941741e-06, + "loss": 1.177, + "step": 18143 + }, + { + "epoch": 0.55, + "learning_rate": 2.244695679914674e-06, + "loss": 1.0956, + "step": 18144 + }, + { + "epoch": 0.55, + "learning_rate": 2.244453036317982e-06, + "loss": 1.0844, + "step": 18145 + }, + { + "epoch": 0.55, + "learning_rate": 2.2442103951539734e-06, + "loss": 1.0637, + "step": 18146 + }, + { + "epoch": 0.55, + "learning_rate": 2.243967756424959e-06, + "loss": 1.1022, + "step": 18147 + }, + { + "epoch": 0.55, + "learning_rate": 2.243725120133248e-06, + "loss": 1.1523, + "step": 18148 + }, + { + "epoch": 0.55, + "learning_rate": 2.2434824862811514e-06, + "loss": 1.1696, + "step": 18149 + }, + { + "epoch": 0.55, + "learning_rate": 2.2432398548709768e-06, + "loss": 1.3004, + "step": 18150 + }, + { + "epoch": 0.55, + "learning_rate": 2.2429972259050356e-06, + "loss": 1.2695, + "step": 18151 + }, + { + "epoch": 0.55, + "learning_rate": 2.242754599385637e-06, + "loss": 1.142, + "step": 18152 + }, + { + "epoch": 0.55, + "learning_rate": 2.24251197531509e-06, + "loss": 1.1802, + "step": 18153 + }, + { + "epoch": 0.55, + "learning_rate": 2.242269353695707e-06, + "loss": 1.214, + "step": 18154 + }, + { + "epoch": 0.55, + "learning_rate": 2.2420267345297938e-06, + "loss": 1.1429, + "step": 18155 + }, + { + "epoch": 0.55, + "learning_rate": 2.241784117819662e-06, + "loss": 1.1921, + "step": 18156 + }, + { + "epoch": 0.55, + "learning_rate": 2.2415415035676213e-06, + "loss": 1.0579, + "step": 18157 + }, + { + "epoch": 0.55, + "learning_rate": 2.2412988917759816e-06, + "loss": 1.1044, + "step": 18158 + }, + { + "epoch": 0.55, + "learning_rate": 2.241056282447051e-06, + "loss": 1.1172, + "step": 18159 + }, + { + "epoch": 0.55, + "learning_rate": 2.24081367558314e-06, + "loss": 1.1254, + "step": 18160 + }, + { + "epoch": 0.55, + "learning_rate": 2.240571071186558e-06, + "loss": 1.1398, + "step": 18161 + }, + { + "epoch": 0.55, + "learning_rate": 2.2403284692596154e-06, + "loss": 1.3174, + "step": 18162 + }, + { + "epoch": 0.55, + "learning_rate": 2.2400858698046197e-06, + "loss": 1.0944, + "step": 18163 + }, + { + "epoch": 0.55, + "learning_rate": 2.239843272823882e-06, + "loss": 1.0549, + "step": 18164 + }, + { + "epoch": 0.55, + "learning_rate": 2.23960067831971e-06, + "loss": 1.1512, + "step": 18165 + }, + { + "epoch": 0.55, + "learning_rate": 2.2393580862944146e-06, + "loss": 1.2327, + "step": 18166 + }, + { + "epoch": 0.55, + "learning_rate": 2.2391154967503058e-06, + "loss": 1.1483, + "step": 18167 + }, + { + "epoch": 0.55, + "learning_rate": 2.238872909689691e-06, + "loss": 1.0481, + "step": 18168 + }, + { + "epoch": 0.55, + "learning_rate": 2.2386303251148795e-06, + "loss": 1.1304, + "step": 18169 + }, + { + "epoch": 0.55, + "learning_rate": 2.238387743028182e-06, + "loss": 1.1703, + "step": 18170 + }, + { + "epoch": 0.55, + "learning_rate": 2.238145163431908e-06, + "loss": 1.1714, + "step": 18171 + }, + { + "epoch": 0.55, + "learning_rate": 2.237902586328365e-06, + "loss": 1.0381, + "step": 18172 + }, + { + "epoch": 0.55, + "learning_rate": 2.2376600117198633e-06, + "loss": 1.1143, + "step": 18173 + }, + { + "epoch": 0.55, + "learning_rate": 2.2374174396087116e-06, + "loss": 1.0318, + "step": 18174 + }, + { + "epoch": 0.55, + "learning_rate": 2.237174869997221e-06, + "loss": 1.1017, + "step": 18175 + }, + { + "epoch": 0.55, + "learning_rate": 2.2369323028876975e-06, + "loss": 1.0161, + "step": 18176 + }, + { + "epoch": 0.55, + "learning_rate": 2.236689738282452e-06, + "loss": 1.0616, + "step": 18177 + }, + { + "epoch": 0.55, + "learning_rate": 2.2364471761837938e-06, + "loss": 1.0883, + "step": 18178 + }, + { + "epoch": 0.55, + "learning_rate": 2.236204616594031e-06, + "loss": 1.0753, + "step": 18179 + }, + { + "epoch": 0.55, + "learning_rate": 2.235962059515474e-06, + "loss": 1.1227, + "step": 18180 + }, + { + "epoch": 0.55, + "learning_rate": 2.2357195049504307e-06, + "loss": 1.0605, + "step": 18181 + }, + { + "epoch": 0.55, + "learning_rate": 2.2354769529012103e-06, + "loss": 1.1638, + "step": 18182 + }, + { + "epoch": 0.55, + "learning_rate": 2.2352344033701214e-06, + "loss": 1.1682, + "step": 18183 + }, + { + "epoch": 0.55, + "learning_rate": 2.2349918563594743e-06, + "loss": 1.1962, + "step": 18184 + }, + { + "epoch": 0.55, + "learning_rate": 2.2347493118715764e-06, + "loss": 1.1326, + "step": 18185 + }, + { + "epoch": 0.55, + "learning_rate": 2.234506769908738e-06, + "loss": 1.1771, + "step": 18186 + }, + { + "epoch": 0.55, + "learning_rate": 2.2342642304732665e-06, + "loss": 1.2105, + "step": 18187 + }, + { + "epoch": 0.55, + "learning_rate": 2.234021693567473e-06, + "loss": 1.159, + "step": 18188 + }, + { + "epoch": 0.55, + "learning_rate": 2.2337791591936635e-06, + "loss": 1.0989, + "step": 18189 + }, + { + "epoch": 0.55, + "learning_rate": 2.2335366273541486e-06, + "loss": 1.1007, + "step": 18190 + }, + { + "epoch": 0.55, + "learning_rate": 2.2332940980512364e-06, + "loss": 1.0942, + "step": 18191 + }, + { + "epoch": 0.55, + "learning_rate": 2.2330515712872357e-06, + "loss": 1.2333, + "step": 18192 + }, + { + "epoch": 0.55, + "learning_rate": 2.232809047064457e-06, + "loss": 1.1214, + "step": 18193 + }, + { + "epoch": 0.55, + "learning_rate": 2.2325665253852065e-06, + "loss": 1.0551, + "step": 18194 + }, + { + "epoch": 0.55, + "learning_rate": 2.2323240062517935e-06, + "loss": 1.124, + "step": 18195 + }, + { + "epoch": 0.55, + "learning_rate": 2.232081489666527e-06, + "loss": 1.147, + "step": 18196 + }, + { + "epoch": 0.55, + "learning_rate": 2.2318389756317163e-06, + "loss": 1.0103, + "step": 18197 + }, + { + "epoch": 0.55, + "learning_rate": 2.231596464149669e-06, + "loss": 1.05, + "step": 18198 + }, + { + "epoch": 0.55, + "learning_rate": 2.231353955222694e-06, + "loss": 1.1548, + "step": 18199 + }, + { + "epoch": 0.55, + "learning_rate": 2.2311114488531e-06, + "loss": 1.1702, + "step": 18200 + }, + { + "epoch": 0.55, + "learning_rate": 2.2308689450431966e-06, + "loss": 1.207, + "step": 18201 + }, + { + "epoch": 0.55, + "learning_rate": 2.23062644379529e-06, + "loss": 1.0757, + "step": 18202 + }, + { + "epoch": 0.55, + "learning_rate": 2.2303839451116906e-06, + "loss": 1.0292, + "step": 18203 + }, + { + "epoch": 0.55, + "learning_rate": 2.2301414489947056e-06, + "loss": 1.0344, + "step": 18204 + }, + { + "epoch": 0.55, + "learning_rate": 2.229898955446645e-06, + "loss": 1.1364, + "step": 18205 + }, + { + "epoch": 0.55, + "learning_rate": 2.2296564644698154e-06, + "loss": 1.164, + "step": 18206 + }, + { + "epoch": 0.55, + "learning_rate": 2.229413976066526e-06, + "loss": 1.1914, + "step": 18207 + }, + { + "epoch": 0.55, + "learning_rate": 2.229171490239085e-06, + "loss": 1.1476, + "step": 18208 + }, + { + "epoch": 0.55, + "learning_rate": 2.228929006989801e-06, + "loss": 1.1157, + "step": 18209 + }, + { + "epoch": 0.55, + "learning_rate": 2.2286865263209835e-06, + "loss": 1.2153, + "step": 18210 + }, + { + "epoch": 0.55, + "learning_rate": 2.2284440482349384e-06, + "loss": 1.162, + "step": 18211 + }, + { + "epoch": 0.55, + "learning_rate": 2.2282015727339755e-06, + "loss": 1.129, + "step": 18212 + }, + { + "epoch": 0.55, + "learning_rate": 2.227959099820403e-06, + "loss": 1.1063, + "step": 18213 + }, + { + "epoch": 0.55, + "learning_rate": 2.227716629496529e-06, + "loss": 1.1014, + "step": 18214 + }, + { + "epoch": 0.55, + "learning_rate": 2.227474161764661e-06, + "loss": 1.1428, + "step": 18215 + }, + { + "epoch": 0.55, + "learning_rate": 2.227231696627108e-06, + "loss": 0.9728, + "step": 18216 + }, + { + "epoch": 0.55, + "learning_rate": 2.2269892340861773e-06, + "loss": 1.1572, + "step": 18217 + }, + { + "epoch": 0.55, + "learning_rate": 2.2267467741441793e-06, + "loss": 1.1149, + "step": 18218 + }, + { + "epoch": 0.55, + "learning_rate": 2.226504316803419e-06, + "loss": 1.0927, + "step": 18219 + }, + { + "epoch": 0.55, + "learning_rate": 2.226261862066206e-06, + "loss": 1.1023, + "step": 18220 + }, + { + "epoch": 0.55, + "learning_rate": 2.2260194099348478e-06, + "loss": 1.16, + "step": 18221 + }, + { + "epoch": 0.55, + "learning_rate": 2.225776960411653e-06, + "loss": 1.0045, + "step": 18222 + }, + { + "epoch": 0.55, + "learning_rate": 2.2255345134989306e-06, + "loss": 1.1438, + "step": 18223 + }, + { + "epoch": 0.55, + "learning_rate": 2.225292069198987e-06, + "loss": 1.0531, + "step": 18224 + }, + { + "epoch": 0.55, + "learning_rate": 2.22504962751413e-06, + "loss": 1.2114, + "step": 18225 + }, + { + "epoch": 0.55, + "learning_rate": 2.224807188446668e-06, + "loss": 1.1076, + "step": 18226 + }, + { + "epoch": 0.55, + "learning_rate": 2.22456475199891e-06, + "loss": 1.071, + "step": 18227 + }, + { + "epoch": 0.55, + "learning_rate": 2.2243223181731622e-06, + "loss": 1.1083, + "step": 18228 + }, + { + "epoch": 0.55, + "learning_rate": 2.2240798869717332e-06, + "loss": 1.2521, + "step": 18229 + }, + { + "epoch": 0.55, + "learning_rate": 2.2238374583969306e-06, + "loss": 1.1646, + "step": 18230 + }, + { + "epoch": 0.55, + "learning_rate": 2.2235950324510636e-06, + "loss": 1.0702, + "step": 18231 + }, + { + "epoch": 0.55, + "learning_rate": 2.223352609136438e-06, + "loss": 1.1398, + "step": 18232 + }, + { + "epoch": 0.55, + "learning_rate": 2.223110188455362e-06, + "loss": 0.9959, + "step": 18233 + }, + { + "epoch": 0.55, + "learning_rate": 2.2228677704101436e-06, + "loss": 0.9294, + "step": 18234 + }, + { + "epoch": 0.55, + "learning_rate": 2.2226253550030903e-06, + "loss": 1.1379, + "step": 18235 + }, + { + "epoch": 0.55, + "learning_rate": 2.2223829422365118e-06, + "loss": 1.104, + "step": 18236 + }, + { + "epoch": 0.55, + "learning_rate": 2.2221405321127125e-06, + "loss": 1.1053, + "step": 18237 + }, + { + "epoch": 0.55, + "learning_rate": 2.2218981246340014e-06, + "loss": 1.1263, + "step": 18238 + }, + { + "epoch": 0.55, + "learning_rate": 2.2216557198026864e-06, + "loss": 1.097, + "step": 18239 + }, + { + "epoch": 0.55, + "learning_rate": 2.2214133176210754e-06, + "loss": 1.0999, + "step": 18240 + }, + { + "epoch": 0.55, + "learning_rate": 2.221170918091475e-06, + "loss": 1.1637, + "step": 18241 + }, + { + "epoch": 0.55, + "learning_rate": 2.220928521216193e-06, + "loss": 1.222, + "step": 18242 + }, + { + "epoch": 0.55, + "learning_rate": 2.220686126997537e-06, + "loss": 1.098, + "step": 18243 + }, + { + "epoch": 0.55, + "learning_rate": 2.220443735437816e-06, + "loss": 1.194, + "step": 18244 + }, + { + "epoch": 0.55, + "learning_rate": 2.2202013465393346e-06, + "loss": 1.1191, + "step": 18245 + }, + { + "epoch": 0.55, + "learning_rate": 2.2199589603044017e-06, + "loss": 1.066, + "step": 18246 + }, + { + "epoch": 0.55, + "learning_rate": 2.2197165767353246e-06, + "loss": 1.1578, + "step": 18247 + }, + { + "epoch": 0.55, + "learning_rate": 2.2194741958344107e-06, + "loss": 1.1705, + "step": 18248 + }, + { + "epoch": 0.55, + "learning_rate": 2.2192318176039683e-06, + "loss": 1.1783, + "step": 18249 + }, + { + "epoch": 0.55, + "learning_rate": 2.2189894420463034e-06, + "loss": 1.1198, + "step": 18250 + }, + { + "epoch": 0.55, + "learning_rate": 2.218747069163723e-06, + "loss": 1.1694, + "step": 18251 + }, + { + "epoch": 0.55, + "learning_rate": 2.218504698958535e-06, + "loss": 1.0232, + "step": 18252 + }, + { + "epoch": 0.55, + "learning_rate": 2.2182623314330476e-06, + "loss": 1.1432, + "step": 18253 + }, + { + "epoch": 0.55, + "learning_rate": 2.2180199665895663e-06, + "loss": 1.2308, + "step": 18254 + }, + { + "epoch": 0.55, + "learning_rate": 2.2177776044303993e-06, + "loss": 1.1415, + "step": 18255 + }, + { + "epoch": 0.55, + "learning_rate": 2.217535244957853e-06, + "loss": 1.1255, + "step": 18256 + }, + { + "epoch": 0.55, + "learning_rate": 2.217292888174237e-06, + "loss": 1.085, + "step": 18257 + }, + { + "epoch": 0.55, + "learning_rate": 2.217050534081855e-06, + "loss": 1.1688, + "step": 18258 + }, + { + "epoch": 0.55, + "learning_rate": 2.216808182683016e-06, + "loss": 1.1497, + "step": 18259 + }, + { + "epoch": 0.55, + "learning_rate": 2.2165658339800266e-06, + "loss": 1.019, + "step": 18260 + }, + { + "epoch": 0.55, + "learning_rate": 2.2163234879751937e-06, + "loss": 1.1619, + "step": 18261 + }, + { + "epoch": 0.55, + "learning_rate": 2.216081144670826e-06, + "loss": 1.1232, + "step": 18262 + }, + { + "epoch": 0.55, + "learning_rate": 2.2158388040692278e-06, + "loss": 1.0987, + "step": 18263 + }, + { + "epoch": 0.55, + "learning_rate": 2.215596466172707e-06, + "loss": 1.058, + "step": 18264 + }, + { + "epoch": 0.55, + "learning_rate": 2.2153541309835715e-06, + "loss": 1.0863, + "step": 18265 + }, + { + "epoch": 0.55, + "learning_rate": 2.2151117985041278e-06, + "loss": 1.2466, + "step": 18266 + }, + { + "epoch": 0.55, + "learning_rate": 2.214869468736682e-06, + "loss": 1.0848, + "step": 18267 + }, + { + "epoch": 0.55, + "learning_rate": 2.2146271416835416e-06, + "loss": 1.1898, + "step": 18268 + }, + { + "epoch": 0.55, + "learning_rate": 2.2143848173470135e-06, + "loss": 1.0918, + "step": 18269 + }, + { + "epoch": 0.55, + "learning_rate": 2.2141424957294053e-06, + "loss": 1.0848, + "step": 18270 + }, + { + "epoch": 0.55, + "learning_rate": 2.2139001768330216e-06, + "loss": 1.1344, + "step": 18271 + }, + { + "epoch": 0.55, + "learning_rate": 2.213657860660171e-06, + "loss": 1.15, + "step": 18272 + }, + { + "epoch": 0.55, + "learning_rate": 2.2134155472131593e-06, + "loss": 1.069, + "step": 18273 + }, + { + "epoch": 0.55, + "learning_rate": 2.2131732364942934e-06, + "loss": 1.2167, + "step": 18274 + }, + { + "epoch": 0.55, + "learning_rate": 2.2129309285058815e-06, + "loss": 1.1119, + "step": 18275 + }, + { + "epoch": 0.55, + "learning_rate": 2.2126886232502274e-06, + "loss": 1.1187, + "step": 18276 + }, + { + "epoch": 0.55, + "learning_rate": 2.2124463207296398e-06, + "loss": 1.0283, + "step": 18277 + }, + { + "epoch": 0.55, + "learning_rate": 2.212204020946424e-06, + "loss": 1.0771, + "step": 18278 + }, + { + "epoch": 0.55, + "learning_rate": 2.2119617239028888e-06, + "loss": 1.2192, + "step": 18279 + }, + { + "epoch": 0.55, + "learning_rate": 2.211719429601338e-06, + "loss": 1.0573, + "step": 18280 + }, + { + "epoch": 0.55, + "learning_rate": 2.21147713804408e-06, + "loss": 1.251, + "step": 18281 + }, + { + "epoch": 0.55, + "learning_rate": 2.21123484923342e-06, + "loss": 1.0673, + "step": 18282 + }, + { + "epoch": 0.55, + "learning_rate": 2.210992563171667e-06, + "loss": 1.11, + "step": 18283 + }, + { + "epoch": 0.55, + "learning_rate": 2.210750279861124e-06, + "loss": 1.2083, + "step": 18284 + }, + { + "epoch": 0.55, + "learning_rate": 2.210507999304099e-06, + "loss": 1.0718, + "step": 18285 + }, + { + "epoch": 0.55, + "learning_rate": 2.2102657215028986e-06, + "loss": 1.1376, + "step": 18286 + }, + { + "epoch": 0.55, + "learning_rate": 2.210023446459829e-06, + "loss": 1.1777, + "step": 18287 + }, + { + "epoch": 0.55, + "learning_rate": 2.2097811741771973e-06, + "loss": 1.1807, + "step": 18288 + }, + { + "epoch": 0.55, + "learning_rate": 2.2095389046573084e-06, + "loss": 1.1161, + "step": 18289 + }, + { + "epoch": 0.55, + "learning_rate": 2.2092966379024693e-06, + "loss": 1.0558, + "step": 18290 + }, + { + "epoch": 0.55, + "learning_rate": 2.2090543739149855e-06, + "loss": 0.9648, + "step": 18291 + }, + { + "epoch": 0.55, + "learning_rate": 2.208812112697165e-06, + "loss": 1.234, + "step": 18292 + }, + { + "epoch": 0.55, + "learning_rate": 2.2085698542513126e-06, + "loss": 1.1889, + "step": 18293 + }, + { + "epoch": 0.55, + "learning_rate": 2.2083275985797344e-06, + "loss": 1.1946, + "step": 18294 + }, + { + "epoch": 0.55, + "learning_rate": 2.208085345684738e-06, + "loss": 1.0875, + "step": 18295 + }, + { + "epoch": 0.55, + "learning_rate": 2.207843095568628e-06, + "loss": 1.1379, + "step": 18296 + }, + { + "epoch": 0.55, + "learning_rate": 2.2076008482337107e-06, + "loss": 1.0914, + "step": 18297 + }, + { + "epoch": 0.55, + "learning_rate": 2.2073586036822923e-06, + "loss": 1.1741, + "step": 18298 + }, + { + "epoch": 0.55, + "learning_rate": 2.2071163619166793e-06, + "loss": 1.2987, + "step": 18299 + }, + { + "epoch": 0.55, + "learning_rate": 2.2068741229391778e-06, + "loss": 1.1165, + "step": 18300 + }, + { + "epoch": 0.55, + "learning_rate": 2.2066318867520937e-06, + "loss": 1.0848, + "step": 18301 + }, + { + "epoch": 0.55, + "learning_rate": 2.2063896533577327e-06, + "loss": 1.1055, + "step": 18302 + }, + { + "epoch": 0.55, + "learning_rate": 2.2061474227584e-06, + "loss": 1.0702, + "step": 18303 + }, + { + "epoch": 0.55, + "learning_rate": 2.2059051949564026e-06, + "loss": 1.0439, + "step": 18304 + }, + { + "epoch": 0.55, + "learning_rate": 2.205662969954047e-06, + "loss": 1.1869, + "step": 18305 + }, + { + "epoch": 0.55, + "learning_rate": 2.2054207477536375e-06, + "loss": 1.2639, + "step": 18306 + }, + { + "epoch": 0.55, + "learning_rate": 2.20517852835748e-06, + "loss": 1.1332, + "step": 18307 + }, + { + "epoch": 0.55, + "learning_rate": 2.204936311767881e-06, + "loss": 1.0931, + "step": 18308 + }, + { + "epoch": 0.55, + "learning_rate": 2.2046940979871474e-06, + "loss": 1.1065, + "step": 18309 + }, + { + "epoch": 0.55, + "learning_rate": 2.204451887017583e-06, + "loss": 1.0738, + "step": 18310 + }, + { + "epoch": 0.55, + "learning_rate": 2.204209678861494e-06, + "loss": 1.129, + "step": 18311 + }, + { + "epoch": 0.55, + "learning_rate": 2.203967473521186e-06, + "loss": 1.1277, + "step": 18312 + }, + { + "epoch": 0.55, + "learning_rate": 2.203725270998966e-06, + "loss": 0.9816, + "step": 18313 + }, + { + "epoch": 0.55, + "learning_rate": 2.2034830712971394e-06, + "loss": 1.0471, + "step": 18314 + }, + { + "epoch": 0.55, + "learning_rate": 2.20324087441801e-06, + "loss": 1.1368, + "step": 18315 + }, + { + "epoch": 0.55, + "learning_rate": 2.2029986803638847e-06, + "loss": 0.9945, + "step": 18316 + }, + { + "epoch": 0.55, + "learning_rate": 2.202756489137069e-06, + "loss": 1.2177, + "step": 18317 + }, + { + "epoch": 0.55, + "learning_rate": 2.202514300739869e-06, + "loss": 1.1082, + "step": 18318 + }, + { + "epoch": 0.55, + "learning_rate": 2.202272115174589e-06, + "loss": 1.1437, + "step": 18319 + }, + { + "epoch": 0.55, + "learning_rate": 2.202029932443535e-06, + "loss": 1.0894, + "step": 18320 + }, + { + "epoch": 0.55, + "learning_rate": 2.2017877525490123e-06, + "loss": 1.2367, + "step": 18321 + }, + { + "epoch": 0.55, + "learning_rate": 2.2015455754933275e-06, + "loss": 1.1111, + "step": 18322 + }, + { + "epoch": 0.55, + "learning_rate": 2.201303401278784e-06, + "loss": 1.1359, + "step": 18323 + }, + { + "epoch": 0.55, + "learning_rate": 2.201061229907689e-06, + "loss": 1.2392, + "step": 18324 + }, + { + "epoch": 0.55, + "learning_rate": 2.200819061382346e-06, + "loss": 1.0987, + "step": 18325 + }, + { + "epoch": 0.55, + "learning_rate": 2.200576895705062e-06, + "loss": 1.046, + "step": 18326 + }, + { + "epoch": 0.55, + "learning_rate": 2.2003347328781433e-06, + "loss": 1.1072, + "step": 18327 + }, + { + "epoch": 0.55, + "learning_rate": 2.2000925729038922e-06, + "loss": 1.1032, + "step": 18328 + }, + { + "epoch": 0.55, + "learning_rate": 2.1998504157846152e-06, + "loss": 1.108, + "step": 18329 + }, + { + "epoch": 0.55, + "learning_rate": 2.199608261522618e-06, + "loss": 1.0274, + "step": 18330 + }, + { + "epoch": 0.55, + "learning_rate": 2.1993661101202064e-06, + "loss": 1.1189, + "step": 18331 + }, + { + "epoch": 0.55, + "learning_rate": 2.1991239615796833e-06, + "loss": 1.0402, + "step": 18332 + }, + { + "epoch": 0.55, + "learning_rate": 2.198881815903355e-06, + "loss": 1.1306, + "step": 18333 + }, + { + "epoch": 0.55, + "learning_rate": 2.1986396730935275e-06, + "loss": 0.9943, + "step": 18334 + }, + { + "epoch": 0.55, + "learning_rate": 2.1983975331525056e-06, + "loss": 1.1342, + "step": 18335 + }, + { + "epoch": 0.55, + "learning_rate": 2.198155396082593e-06, + "loss": 1.2175, + "step": 18336 + }, + { + "epoch": 0.55, + "learning_rate": 2.197913261886096e-06, + "loss": 1.1702, + "step": 18337 + }, + { + "epoch": 0.55, + "learning_rate": 2.197671130565319e-06, + "loss": 1.1566, + "step": 18338 + }, + { + "epoch": 0.55, + "learning_rate": 2.1974290021225672e-06, + "loss": 1.2028, + "step": 18339 + }, + { + "epoch": 0.55, + "learning_rate": 2.197186876560147e-06, + "loss": 1.0823, + "step": 18340 + }, + { + "epoch": 0.55, + "learning_rate": 2.196944753880361e-06, + "loss": 1.0901, + "step": 18341 + }, + { + "epoch": 0.55, + "learning_rate": 2.196702634085514e-06, + "loss": 1.0924, + "step": 18342 + }, + { + "epoch": 0.55, + "learning_rate": 2.1964605171779124e-06, + "loss": 1.22, + "step": 18343 + }, + { + "epoch": 0.55, + "learning_rate": 2.196218403159862e-06, + "loss": 1.04, + "step": 18344 + }, + { + "epoch": 0.55, + "learning_rate": 2.1959762920336643e-06, + "loss": 1.1479, + "step": 18345 + }, + { + "epoch": 0.55, + "learning_rate": 2.1957341838016265e-06, + "loss": 1.0876, + "step": 18346 + }, + { + "epoch": 0.55, + "learning_rate": 2.195492078466052e-06, + "loss": 1.0892, + "step": 18347 + }, + { + "epoch": 0.55, + "learning_rate": 2.1952499760292474e-06, + "loss": 1.178, + "step": 18348 + }, + { + "epoch": 0.55, + "learning_rate": 2.1950078764935156e-06, + "loss": 1.1271, + "step": 18349 + }, + { + "epoch": 0.55, + "learning_rate": 2.1947657798611617e-06, + "loss": 1.2216, + "step": 18350 + }, + { + "epoch": 0.55, + "learning_rate": 2.194523686134491e-06, + "loss": 1.0249, + "step": 18351 + }, + { + "epoch": 0.55, + "learning_rate": 2.194281595315807e-06, + "loss": 1.0363, + "step": 18352 + }, + { + "epoch": 0.55, + "learning_rate": 2.194039507407417e-06, + "loss": 1.1021, + "step": 18353 + }, + { + "epoch": 0.55, + "learning_rate": 2.193797422411622e-06, + "loss": 1.138, + "step": 18354 + }, + { + "epoch": 0.55, + "learning_rate": 2.1935553403307277e-06, + "loss": 1.0732, + "step": 18355 + }, + { + "epoch": 0.55, + "learning_rate": 2.1933132611670395e-06, + "loss": 1.0559, + "step": 18356 + }, + { + "epoch": 0.55, + "learning_rate": 2.1930711849228618e-06, + "loss": 1.1052, + "step": 18357 + }, + { + "epoch": 0.55, + "learning_rate": 2.1928291116004983e-06, + "loss": 1.0383, + "step": 18358 + }, + { + "epoch": 0.55, + "learning_rate": 2.192587041202253e-06, + "loss": 1.0784, + "step": 18359 + }, + { + "epoch": 0.55, + "learning_rate": 2.1923449737304314e-06, + "loss": 1.0482, + "step": 18360 + }, + { + "epoch": 0.55, + "learning_rate": 2.192102909187338e-06, + "loss": 1.2664, + "step": 18361 + }, + { + "epoch": 0.55, + "learning_rate": 2.191860847575276e-06, + "loss": 1.1669, + "step": 18362 + }, + { + "epoch": 0.55, + "learning_rate": 2.191618788896551e-06, + "loss": 1.1469, + "step": 18363 + }, + { + "epoch": 0.55, + "learning_rate": 2.1913767331534655e-06, + "loss": 1.1003, + "step": 18364 + }, + { + "epoch": 0.55, + "learning_rate": 2.191134680348325e-06, + "loss": 0.9663, + "step": 18365 + }, + { + "epoch": 0.55, + "learning_rate": 2.1908926304834354e-06, + "loss": 1.1909, + "step": 18366 + }, + { + "epoch": 0.55, + "learning_rate": 2.1906505835610975e-06, + "loss": 1.1372, + "step": 18367 + }, + { + "epoch": 0.55, + "learning_rate": 2.190408539583617e-06, + "loss": 1.1501, + "step": 18368 + }, + { + "epoch": 0.55, + "learning_rate": 2.1901664985532985e-06, + "loss": 1.1472, + "step": 18369 + }, + { + "epoch": 0.55, + "learning_rate": 2.189924460472447e-06, + "loss": 1.1133, + "step": 18370 + }, + { + "epoch": 0.55, + "learning_rate": 2.1896824253433635e-06, + "loss": 1.112, + "step": 18371 + }, + { + "epoch": 0.55, + "learning_rate": 2.189440393168354e-06, + "loss": 1.1477, + "step": 18372 + }, + { + "epoch": 0.55, + "learning_rate": 2.1891983639497224e-06, + "loss": 1.0427, + "step": 18373 + }, + { + "epoch": 0.55, + "learning_rate": 2.1889563376897737e-06, + "loss": 1.1997, + "step": 18374 + }, + { + "epoch": 0.55, + "learning_rate": 2.18871431439081e-06, + "loss": 1.2051, + "step": 18375 + }, + { + "epoch": 0.55, + "learning_rate": 2.188472294055136e-06, + "loss": 1.0682, + "step": 18376 + }, + { + "epoch": 0.55, + "learning_rate": 2.1882302766850563e-06, + "loss": 1.0164, + "step": 18377 + }, + { + "epoch": 0.55, + "learning_rate": 2.1879882622828735e-06, + "loss": 1.0808, + "step": 18378 + }, + { + "epoch": 0.55, + "learning_rate": 2.187746250850893e-06, + "loss": 1.1317, + "step": 18379 + }, + { + "epoch": 0.55, + "learning_rate": 2.187504242391417e-06, + "loss": 1.0598, + "step": 18380 + }, + { + "epoch": 0.55, + "learning_rate": 2.1872622369067505e-06, + "loss": 1.0648, + "step": 18381 + }, + { + "epoch": 0.55, + "learning_rate": 2.187020234399197e-06, + "loss": 1.1319, + "step": 18382 + }, + { + "epoch": 0.55, + "learning_rate": 2.1867782348710607e-06, + "loss": 1.0491, + "step": 18383 + }, + { + "epoch": 0.55, + "learning_rate": 2.1865362383246437e-06, + "loss": 1.0847, + "step": 18384 + }, + { + "epoch": 0.55, + "learning_rate": 2.186294244762251e-06, + "loss": 1.1276, + "step": 18385 + }, + { + "epoch": 0.55, + "learning_rate": 2.1860522541861862e-06, + "loss": 1.1456, + "step": 18386 + }, + { + "epoch": 0.55, + "learning_rate": 2.185810266598753e-06, + "loss": 1.0123, + "step": 18387 + }, + { + "epoch": 0.55, + "learning_rate": 2.1855682820022546e-06, + "loss": 1.0899, + "step": 18388 + }, + { + "epoch": 0.55, + "learning_rate": 2.185326300398994e-06, + "loss": 1.1667, + "step": 18389 + }, + { + "epoch": 0.55, + "learning_rate": 2.185084321791276e-06, + "loss": 1.2034, + "step": 18390 + }, + { + "epoch": 0.55, + "learning_rate": 2.184842346181404e-06, + "loss": 1.1876, + "step": 18391 + }, + { + "epoch": 0.55, + "learning_rate": 2.18460037357168e-06, + "loss": 1.0785, + "step": 18392 + }, + { + "epoch": 0.55, + "learning_rate": 2.1843584039644095e-06, + "loss": 1.1306, + "step": 18393 + }, + { + "epoch": 0.55, + "learning_rate": 2.1841164373618946e-06, + "loss": 1.2191, + "step": 18394 + }, + { + "epoch": 0.55, + "learning_rate": 2.183874473766439e-06, + "loss": 1.187, + "step": 18395 + }, + { + "epoch": 0.55, + "learning_rate": 2.183632513180347e-06, + "loss": 1.0518, + "step": 18396 + }, + { + "epoch": 0.55, + "learning_rate": 2.1833905556059202e-06, + "loss": 1.1575, + "step": 18397 + }, + { + "epoch": 0.55, + "learning_rate": 2.1831486010454627e-06, + "loss": 1.2056, + "step": 18398 + }, + { + "epoch": 0.55, + "learning_rate": 2.182906649501278e-06, + "loss": 1.1064, + "step": 18399 + }, + { + "epoch": 0.55, + "learning_rate": 2.1826647009756707e-06, + "loss": 1.2324, + "step": 18400 + }, + { + "epoch": 0.55, + "learning_rate": 2.182422755470941e-06, + "loss": 1.0498, + "step": 18401 + }, + { + "epoch": 0.55, + "learning_rate": 2.182180812989394e-06, + "loss": 1.1915, + "step": 18402 + }, + { + "epoch": 0.55, + "learning_rate": 2.1819388735333327e-06, + "loss": 1.0871, + "step": 18403 + }, + { + "epoch": 0.55, + "learning_rate": 2.1816969371050605e-06, + "loss": 1.1342, + "step": 18404 + }, + { + "epoch": 0.55, + "learning_rate": 2.18145500370688e-06, + "loss": 1.1516, + "step": 18405 + }, + { + "epoch": 0.55, + "learning_rate": 2.1812130733410937e-06, + "loss": 1.2537, + "step": 18406 + }, + { + "epoch": 0.55, + "learning_rate": 2.1809711460100057e-06, + "loss": 1.1302, + "step": 18407 + }, + { + "epoch": 0.55, + "learning_rate": 2.180729221715919e-06, + "loss": 1.1207, + "step": 18408 + }, + { + "epoch": 0.55, + "learning_rate": 2.1804873004611372e-06, + "loss": 1.1923, + "step": 18409 + }, + { + "epoch": 0.55, + "learning_rate": 2.1802453822479617e-06, + "loss": 1.0773, + "step": 18410 + }, + { + "epoch": 0.55, + "learning_rate": 2.1800034670786956e-06, + "loss": 1.0449, + "step": 18411 + }, + { + "epoch": 0.55, + "learning_rate": 2.179761554955643e-06, + "loss": 1.1783, + "step": 18412 + }, + { + "epoch": 0.55, + "learning_rate": 2.179519645881107e-06, + "loss": 1.1348, + "step": 18413 + }, + { + "epoch": 0.55, + "learning_rate": 2.179277739857388e-06, + "loss": 1.024, + "step": 18414 + }, + { + "epoch": 0.55, + "learning_rate": 2.179035836886791e-06, + "loss": 1.0501, + "step": 18415 + }, + { + "epoch": 0.55, + "learning_rate": 2.178793936971618e-06, + "loss": 1.1273, + "step": 18416 + }, + { + "epoch": 0.55, + "learning_rate": 2.178552040114173e-06, + "loss": 1.0458, + "step": 18417 + }, + { + "epoch": 0.55, + "learning_rate": 2.178310146316757e-06, + "loss": 1.3142, + "step": 18418 + }, + { + "epoch": 0.55, + "learning_rate": 2.1780682555816733e-06, + "loss": 1.1232, + "step": 18419 + }, + { + "epoch": 0.55, + "learning_rate": 2.177826367911225e-06, + "loss": 1.093, + "step": 18420 + }, + { + "epoch": 0.55, + "learning_rate": 2.177584483307714e-06, + "loss": 1.2118, + "step": 18421 + }, + { + "epoch": 0.55, + "learning_rate": 2.1773426017734454e-06, + "loss": 1.0427, + "step": 18422 + }, + { + "epoch": 0.55, + "learning_rate": 2.177100723310718e-06, + "loss": 1.2719, + "step": 18423 + }, + { + "epoch": 0.56, + "learning_rate": 2.1768588479218367e-06, + "loss": 1.0515, + "step": 18424 + }, + { + "epoch": 0.56, + "learning_rate": 2.1766169756091034e-06, + "loss": 1.1258, + "step": 18425 + }, + { + "epoch": 0.56, + "learning_rate": 2.1763751063748215e-06, + "loss": 1.1393, + "step": 18426 + }, + { + "epoch": 0.56, + "learning_rate": 2.176133240221292e-06, + "loss": 1.1303, + "step": 18427 + }, + { + "epoch": 0.56, + "learning_rate": 2.1758913771508178e-06, + "loss": 1.0704, + "step": 18428 + }, + { + "epoch": 0.56, + "learning_rate": 2.1756495171657016e-06, + "loss": 1.1299, + "step": 18429 + }, + { + "epoch": 0.56, + "learning_rate": 2.1754076602682467e-06, + "loss": 1.0614, + "step": 18430 + }, + { + "epoch": 0.56, + "learning_rate": 2.1751658064607535e-06, + "loss": 1.1577, + "step": 18431 + }, + { + "epoch": 0.56, + "learning_rate": 2.174923955745526e-06, + "loss": 1.0952, + "step": 18432 + }, + { + "epoch": 0.56, + "learning_rate": 2.1746821081248654e-06, + "loss": 1.0942, + "step": 18433 + }, + { + "epoch": 0.56, + "learning_rate": 2.1744402636010744e-06, + "loss": 1.0072, + "step": 18434 + }, + { + "epoch": 0.56, + "learning_rate": 2.1741984221764567e-06, + "loss": 1.1451, + "step": 18435 + }, + { + "epoch": 0.56, + "learning_rate": 2.173956583853312e-06, + "loss": 1.1776, + "step": 18436 + }, + { + "epoch": 0.56, + "learning_rate": 2.1737147486339434e-06, + "loss": 1.2236, + "step": 18437 + }, + { + "epoch": 0.56, + "learning_rate": 2.173472916520653e-06, + "loss": 0.9957, + "step": 18438 + }, + { + "epoch": 0.56, + "learning_rate": 2.173231087515745e-06, + "loss": 1.1697, + "step": 18439 + }, + { + "epoch": 0.56, + "learning_rate": 2.172989261621518e-06, + "loss": 0.9693, + "step": 18440 + }, + { + "epoch": 0.56, + "learning_rate": 2.1727474388402756e-06, + "loss": 1.0538, + "step": 18441 + }, + { + "epoch": 0.56, + "learning_rate": 2.1725056191743203e-06, + "loss": 1.1697, + "step": 18442 + }, + { + "epoch": 0.56, + "learning_rate": 2.1722638026259545e-06, + "loss": 1.1837, + "step": 18443 + }, + { + "epoch": 0.56, + "learning_rate": 2.1720219891974787e-06, + "loss": 1.0073, + "step": 18444 + }, + { + "epoch": 0.56, + "learning_rate": 2.1717801788911955e-06, + "loss": 1.1773, + "step": 18445 + }, + { + "epoch": 0.56, + "learning_rate": 2.1715383717094073e-06, + "loss": 1.1388, + "step": 18446 + }, + { + "epoch": 0.56, + "learning_rate": 2.171296567654415e-06, + "loss": 1.1121, + "step": 18447 + }, + { + "epoch": 0.56, + "learning_rate": 2.1710547667285227e-06, + "loss": 1.1571, + "step": 18448 + }, + { + "epoch": 0.56, + "learning_rate": 2.1708129689340292e-06, + "loss": 1.0723, + "step": 18449 + }, + { + "epoch": 0.56, + "learning_rate": 2.170571174273238e-06, + "loss": 1.0845, + "step": 18450 + }, + { + "epoch": 0.56, + "learning_rate": 2.1703293827484504e-06, + "loss": 1.1129, + "step": 18451 + }, + { + "epoch": 0.56, + "learning_rate": 2.1700875943619692e-06, + "loss": 0.9504, + "step": 18452 + }, + { + "epoch": 0.56, + "learning_rate": 2.1698458091160943e-06, + "loss": 1.178, + "step": 18453 + }, + { + "epoch": 0.56, + "learning_rate": 2.1696040270131284e-06, + "loss": 1.0582, + "step": 18454 + }, + { + "epoch": 0.56, + "learning_rate": 2.169362248055373e-06, + "loss": 0.9996, + "step": 18455 + }, + { + "epoch": 0.56, + "learning_rate": 2.16912047224513e-06, + "loss": 1.1436, + "step": 18456 + }, + { + "epoch": 0.56, + "learning_rate": 2.1688786995847e-06, + "loss": 1.1093, + "step": 18457 + }, + { + "epoch": 0.56, + "learning_rate": 2.168636930076386e-06, + "loss": 1.1201, + "step": 18458 + }, + { + "epoch": 0.56, + "learning_rate": 2.168395163722489e-06, + "loss": 1.1959, + "step": 18459 + }, + { + "epoch": 0.56, + "learning_rate": 2.16815340052531e-06, + "loss": 1.1185, + "step": 18460 + }, + { + "epoch": 0.56, + "learning_rate": 2.167911640487151e-06, + "loss": 1.1537, + "step": 18461 + }, + { + "epoch": 0.56, + "learning_rate": 2.1676698836103132e-06, + "loss": 1.1395, + "step": 18462 + }, + { + "epoch": 0.56, + "learning_rate": 2.1674281298970977e-06, + "loss": 1.1777, + "step": 18463 + }, + { + "epoch": 0.56, + "learning_rate": 2.1671863793498064e-06, + "loss": 0.979, + "step": 18464 + }, + { + "epoch": 0.56, + "learning_rate": 2.1669446319707414e-06, + "loss": 1.0674, + "step": 18465 + }, + { + "epoch": 0.56, + "learning_rate": 2.166702887762202e-06, + "loss": 1.1656, + "step": 18466 + }, + { + "epoch": 0.56, + "learning_rate": 2.1664611467264906e-06, + "loss": 1.1385, + "step": 18467 + }, + { + "epoch": 0.56, + "learning_rate": 2.166219408865909e-06, + "loss": 1.1266, + "step": 18468 + }, + { + "epoch": 0.56, + "learning_rate": 2.1659776741827577e-06, + "loss": 1.1602, + "step": 18469 + }, + { + "epoch": 0.56, + "learning_rate": 2.165735942679338e-06, + "loss": 1.1235, + "step": 18470 + }, + { + "epoch": 0.56, + "learning_rate": 2.165494214357951e-06, + "loss": 1.0527, + "step": 18471 + }, + { + "epoch": 0.56, + "learning_rate": 2.1652524892208983e-06, + "loss": 1.1505, + "step": 18472 + }, + { + "epoch": 0.56, + "learning_rate": 2.1650107672704803e-06, + "loss": 1.1576, + "step": 18473 + }, + { + "epoch": 0.56, + "learning_rate": 2.1647690485089986e-06, + "loss": 1.1799, + "step": 18474 + }, + { + "epoch": 0.56, + "learning_rate": 2.164527332938754e-06, + "loss": 1.1251, + "step": 18475 + }, + { + "epoch": 0.56, + "learning_rate": 2.1642856205620476e-06, + "loss": 1.1157, + "step": 18476 + }, + { + "epoch": 0.56, + "learning_rate": 2.16404391138118e-06, + "loss": 1.1172, + "step": 18477 + }, + { + "epoch": 0.56, + "learning_rate": 2.1638022053984542e-06, + "loss": 1.0547, + "step": 18478 + }, + { + "epoch": 0.56, + "learning_rate": 2.163560502616168e-06, + "loss": 1.0377, + "step": 18479 + }, + { + "epoch": 0.56, + "learning_rate": 2.1633188030366242e-06, + "loss": 1.1381, + "step": 18480 + }, + { + "epoch": 0.56, + "learning_rate": 2.163077106662123e-06, + "loss": 1.1854, + "step": 18481 + }, + { + "epoch": 0.56, + "learning_rate": 2.1628354134949666e-06, + "loss": 1.1223, + "step": 18482 + }, + { + "epoch": 0.56, + "learning_rate": 2.1625937235374535e-06, + "loss": 1.0361, + "step": 18483 + }, + { + "epoch": 0.56, + "learning_rate": 2.162352036791886e-06, + "loss": 1.0149, + "step": 18484 + }, + { + "epoch": 0.56, + "learning_rate": 2.162110353260564e-06, + "loss": 1.1516, + "step": 18485 + }, + { + "epoch": 0.56, + "learning_rate": 2.1618686729457892e-06, + "loss": 1.0838, + "step": 18486 + }, + { + "epoch": 0.56, + "learning_rate": 2.161626995849862e-06, + "loss": 1.1641, + "step": 18487 + }, + { + "epoch": 0.56, + "learning_rate": 2.1613853219750825e-06, + "loss": 1.1398, + "step": 18488 + }, + { + "epoch": 0.56, + "learning_rate": 2.1611436513237512e-06, + "loss": 1.1295, + "step": 18489 + }, + { + "epoch": 0.56, + "learning_rate": 2.1609019838981696e-06, + "loss": 1.1263, + "step": 18490 + }, + { + "epoch": 0.56, + "learning_rate": 2.1606603197006386e-06, + "loss": 1.0591, + "step": 18491 + }, + { + "epoch": 0.56, + "learning_rate": 2.160418658733457e-06, + "loss": 1.1483, + "step": 18492 + }, + { + "epoch": 0.56, + "learning_rate": 2.1601770009989264e-06, + "loss": 1.093, + "step": 18493 + }, + { + "epoch": 0.56, + "learning_rate": 2.1599353464993466e-06, + "loss": 1.1116, + "step": 18494 + }, + { + "epoch": 0.56, + "learning_rate": 2.15969369523702e-06, + "loss": 1.0399, + "step": 18495 + }, + { + "epoch": 0.56, + "learning_rate": 2.1594520472142443e-06, + "loss": 1.1722, + "step": 18496 + }, + { + "epoch": 0.56, + "learning_rate": 2.159210402433321e-06, + "loss": 1.0737, + "step": 18497 + }, + { + "epoch": 0.56, + "learning_rate": 2.1589687608965507e-06, + "loss": 1.1291, + "step": 18498 + }, + { + "epoch": 0.56, + "learning_rate": 2.1587271226062334e-06, + "loss": 1.1412, + "step": 18499 + }, + { + "epoch": 0.56, + "learning_rate": 2.1584854875646704e-06, + "loss": 1.0901, + "step": 18500 + }, + { + "epoch": 0.56, + "learning_rate": 2.1582438557741605e-06, + "loss": 1.048, + "step": 18501 + }, + { + "epoch": 0.56, + "learning_rate": 2.158002227237004e-06, + "loss": 1.1371, + "step": 18502 + }, + { + "epoch": 0.56, + "learning_rate": 2.157760601955502e-06, + "loss": 1.1899, + "step": 18503 + }, + { + "epoch": 0.56, + "learning_rate": 2.1575189799319552e-06, + "loss": 1.0049, + "step": 18504 + }, + { + "epoch": 0.56, + "learning_rate": 2.1572773611686616e-06, + "loss": 1.1959, + "step": 18505 + }, + { + "epoch": 0.56, + "learning_rate": 2.1570357456679226e-06, + "loss": 1.0903, + "step": 18506 + }, + { + "epoch": 0.56, + "learning_rate": 2.156794133432038e-06, + "loss": 1.1413, + "step": 18507 + }, + { + "epoch": 0.56, + "learning_rate": 2.156552524463309e-06, + "loss": 1.1627, + "step": 18508 + }, + { + "epoch": 0.56, + "learning_rate": 2.156310918764034e-06, + "loss": 1.127, + "step": 18509 + }, + { + "epoch": 0.56, + "learning_rate": 2.1560693163365127e-06, + "loss": 1.1282, + "step": 18510 + }, + { + "epoch": 0.56, + "learning_rate": 2.1558277171830466e-06, + "loss": 1.0903, + "step": 18511 + }, + { + "epoch": 0.56, + "learning_rate": 2.1555861213059344e-06, + "loss": 1.1228, + "step": 18512 + }, + { + "epoch": 0.56, + "learning_rate": 2.155344528707477e-06, + "loss": 1.0689, + "step": 18513 + }, + { + "epoch": 0.56, + "learning_rate": 2.1551029393899736e-06, + "loss": 1.1322, + "step": 18514 + }, + { + "epoch": 0.56, + "learning_rate": 2.154861353355724e-06, + "loss": 1.0526, + "step": 18515 + }, + { + "epoch": 0.56, + "learning_rate": 2.1546197706070275e-06, + "loss": 1.101, + "step": 18516 + }, + { + "epoch": 0.56, + "learning_rate": 2.1543781911461863e-06, + "loss": 1.1212, + "step": 18517 + }, + { + "epoch": 0.56, + "learning_rate": 2.154136614975497e-06, + "loss": 1.1147, + "step": 18518 + }, + { + "epoch": 0.56, + "learning_rate": 2.15389504209726e-06, + "loss": 1.1225, + "step": 18519 + }, + { + "epoch": 0.56, + "learning_rate": 2.153653472513776e-06, + "loss": 1.1214, + "step": 18520 + }, + { + "epoch": 0.56, + "learning_rate": 2.153411906227345e-06, + "loss": 1.0927, + "step": 18521 + }, + { + "epoch": 0.56, + "learning_rate": 2.153170343240265e-06, + "loss": 1.1768, + "step": 18522 + }, + { + "epoch": 0.56, + "learning_rate": 2.152928783554836e-06, + "loss": 1.1874, + "step": 18523 + }, + { + "epoch": 0.56, + "learning_rate": 2.1526872271733577e-06, + "loss": 1.1902, + "step": 18524 + }, + { + "epoch": 0.56, + "learning_rate": 2.15244567409813e-06, + "loss": 0.9997, + "step": 18525 + }, + { + "epoch": 0.56, + "learning_rate": 2.1522041243314525e-06, + "loss": 1.1086, + "step": 18526 + }, + { + "epoch": 0.56, + "learning_rate": 2.1519625778756237e-06, + "loss": 1.1345, + "step": 18527 + }, + { + "epoch": 0.56, + "learning_rate": 2.1517210347329435e-06, + "loss": 1.078, + "step": 18528 + }, + { + "epoch": 0.56, + "learning_rate": 2.151479494905711e-06, + "loss": 1.0695, + "step": 18529 + }, + { + "epoch": 0.56, + "learning_rate": 2.1512379583962277e-06, + "loss": 1.1329, + "step": 18530 + }, + { + "epoch": 0.56, + "learning_rate": 2.1509964252067894e-06, + "loss": 1.003, + "step": 18531 + }, + { + "epoch": 0.56, + "learning_rate": 2.1507548953396973e-06, + "loss": 1.0345, + "step": 18532 + }, + { + "epoch": 0.56, + "learning_rate": 2.1505133687972505e-06, + "loss": 1.1245, + "step": 18533 + }, + { + "epoch": 0.56, + "learning_rate": 2.150271845581749e-06, + "loss": 1.1139, + "step": 18534 + }, + { + "epoch": 0.56, + "learning_rate": 2.15003032569549e-06, + "loss": 1.077, + "step": 18535 + }, + { + "epoch": 0.56, + "learning_rate": 2.1497888091407736e-06, + "loss": 1.072, + "step": 18536 + }, + { + "epoch": 0.56, + "learning_rate": 2.1495472959198994e-06, + "loss": 1.1458, + "step": 18537 + }, + { + "epoch": 0.56, + "learning_rate": 2.149305786035166e-06, + "loss": 1.1395, + "step": 18538 + }, + { + "epoch": 0.56, + "learning_rate": 2.149064279488873e-06, + "loss": 1.0349, + "step": 18539 + }, + { + "epoch": 0.56, + "learning_rate": 2.1488227762833187e-06, + "loss": 1.0989, + "step": 18540 + }, + { + "epoch": 0.56, + "learning_rate": 2.1485812764208025e-06, + "loss": 1.0634, + "step": 18541 + }, + { + "epoch": 0.56, + "learning_rate": 2.148339779903624e-06, + "loss": 1.1371, + "step": 18542 + }, + { + "epoch": 0.56, + "learning_rate": 2.148098286734081e-06, + "loss": 1.1053, + "step": 18543 + }, + { + "epoch": 0.56, + "learning_rate": 2.1478567969144726e-06, + "loss": 1.1112, + "step": 18544 + }, + { + "epoch": 0.56, + "learning_rate": 2.1476153104470977e-06, + "loss": 1.1367, + "step": 18545 + }, + { + "epoch": 0.56, + "learning_rate": 2.1473738273342553e-06, + "loss": 1.131, + "step": 18546 + }, + { + "epoch": 0.56, + "learning_rate": 2.1471323475782455e-06, + "loss": 1.1193, + "step": 18547 + }, + { + "epoch": 0.56, + "learning_rate": 2.1468908711813647e-06, + "loss": 1.0791, + "step": 18548 + }, + { + "epoch": 0.56, + "learning_rate": 2.1466493981459126e-06, + "loss": 1.2239, + "step": 18549 + }, + { + "epoch": 0.56, + "learning_rate": 2.146407928474188e-06, + "loss": 1.0455, + "step": 18550 + }, + { + "epoch": 0.56, + "learning_rate": 2.1461664621684897e-06, + "loss": 1.1403, + "step": 18551 + }, + { + "epoch": 0.56, + "learning_rate": 2.145924999231117e-06, + "loss": 1.1382, + "step": 18552 + }, + { + "epoch": 0.56, + "learning_rate": 2.145683539664368e-06, + "loss": 1.0178, + "step": 18553 + }, + { + "epoch": 0.56, + "learning_rate": 2.1454420834705396e-06, + "loss": 1.1924, + "step": 18554 + }, + { + "epoch": 0.56, + "learning_rate": 2.1452006306519322e-06, + "loss": 1.0978, + "step": 18555 + }, + { + "epoch": 0.56, + "learning_rate": 2.144959181210845e-06, + "loss": 1.1605, + "step": 18556 + }, + { + "epoch": 0.56, + "learning_rate": 2.1447177351495746e-06, + "loss": 1.179, + "step": 18557 + }, + { + "epoch": 0.56, + "learning_rate": 2.14447629247042e-06, + "loss": 1.1379, + "step": 18558 + }, + { + "epoch": 0.56, + "learning_rate": 2.14423485317568e-06, + "loss": 1.1107, + "step": 18559 + }, + { + "epoch": 0.56, + "learning_rate": 2.143993417267654e-06, + "loss": 1.0507, + "step": 18560 + }, + { + "epoch": 0.56, + "learning_rate": 2.143751984748638e-06, + "loss": 1.1308, + "step": 18561 + }, + { + "epoch": 0.56, + "learning_rate": 2.1435105556209316e-06, + "loss": 1.0793, + "step": 18562 + }, + { + "epoch": 0.56, + "learning_rate": 2.143269129886833e-06, + "loss": 1.0979, + "step": 18563 + }, + { + "epoch": 0.56, + "learning_rate": 2.1430277075486405e-06, + "loss": 1.1359, + "step": 18564 + }, + { + "epoch": 0.56, + "learning_rate": 2.1427862886086536e-06, + "loss": 1.1115, + "step": 18565 + }, + { + "epoch": 0.56, + "learning_rate": 2.1425448730691677e-06, + "loss": 1.0593, + "step": 18566 + }, + { + "epoch": 0.56, + "learning_rate": 2.1423034609324825e-06, + "loss": 1.1487, + "step": 18567 + }, + { + "epoch": 0.56, + "learning_rate": 2.142062052200896e-06, + "loss": 1.2585, + "step": 18568 + }, + { + "epoch": 0.56, + "learning_rate": 2.141820646876707e-06, + "loss": 1.0703, + "step": 18569 + }, + { + "epoch": 0.56, + "learning_rate": 2.141579244962213e-06, + "loss": 1.1073, + "step": 18570 + }, + { + "epoch": 0.56, + "learning_rate": 2.1413378464597115e-06, + "loss": 1.0983, + "step": 18571 + }, + { + "epoch": 0.56, + "learning_rate": 2.1410964513715007e-06, + "loss": 1.0933, + "step": 18572 + }, + { + "epoch": 0.56, + "learning_rate": 2.1408550596998803e-06, + "loss": 1.2638, + "step": 18573 + }, + { + "epoch": 0.56, + "learning_rate": 2.1406136714471458e-06, + "loss": 1.1992, + "step": 18574 + }, + { + "epoch": 0.56, + "learning_rate": 2.1403722866155955e-06, + "loss": 1.2626, + "step": 18575 + }, + { + "epoch": 0.56, + "learning_rate": 2.140130905207528e-06, + "loss": 1.0295, + "step": 18576 + }, + { + "epoch": 0.56, + "learning_rate": 2.1398895272252424e-06, + "loss": 1.0544, + "step": 18577 + }, + { + "epoch": 0.56, + "learning_rate": 2.139648152671034e-06, + "loss": 1.0352, + "step": 18578 + }, + { + "epoch": 0.56, + "learning_rate": 2.1394067815472012e-06, + "loss": 1.0618, + "step": 18579 + }, + { + "epoch": 0.56, + "learning_rate": 2.1391654138560424e-06, + "loss": 1.1829, + "step": 18580 + }, + { + "epoch": 0.56, + "learning_rate": 2.138924049599855e-06, + "loss": 1.1246, + "step": 18581 + }, + { + "epoch": 0.56, + "learning_rate": 2.138682688780937e-06, + "loss": 1.1539, + "step": 18582 + }, + { + "epoch": 0.56, + "learning_rate": 2.1384413314015858e-06, + "loss": 1.0846, + "step": 18583 + }, + { + "epoch": 0.56, + "learning_rate": 2.1381999774640986e-06, + "loss": 1.127, + "step": 18584 + }, + { + "epoch": 0.56, + "learning_rate": 2.137958626970774e-06, + "loss": 1.1866, + "step": 18585 + }, + { + "epoch": 0.56, + "learning_rate": 2.1377172799239092e-06, + "loss": 1.2029, + "step": 18586 + }, + { + "epoch": 0.56, + "learning_rate": 2.137475936325801e-06, + "loss": 1.0718, + "step": 18587 + }, + { + "epoch": 0.56, + "learning_rate": 2.1372345961787466e-06, + "loss": 1.1064, + "step": 18588 + }, + { + "epoch": 0.56, + "learning_rate": 2.1369932594850444e-06, + "loss": 1.1667, + "step": 18589 + }, + { + "epoch": 0.56, + "learning_rate": 2.136751926246993e-06, + "loss": 1.1109, + "step": 18590 + }, + { + "epoch": 0.56, + "learning_rate": 2.1365105964668868e-06, + "loss": 1.0528, + "step": 18591 + }, + { + "epoch": 0.56, + "learning_rate": 2.136269270147025e-06, + "loss": 1.0887, + "step": 18592 + }, + { + "epoch": 0.56, + "learning_rate": 2.136027947289704e-06, + "loss": 1.1543, + "step": 18593 + }, + { + "epoch": 0.56, + "learning_rate": 2.1357866278972224e-06, + "loss": 1.0231, + "step": 18594 + }, + { + "epoch": 0.56, + "learning_rate": 2.1355453119718766e-06, + "loss": 1.1093, + "step": 18595 + }, + { + "epoch": 0.56, + "learning_rate": 2.1353039995159637e-06, + "loss": 1.0469, + "step": 18596 + }, + { + "epoch": 0.56, + "learning_rate": 2.135062690531781e-06, + "loss": 1.1535, + "step": 18597 + }, + { + "epoch": 0.56, + "learning_rate": 2.134821385021626e-06, + "loss": 1.1697, + "step": 18598 + }, + { + "epoch": 0.56, + "learning_rate": 2.134580082987796e-06, + "loss": 1.144, + "step": 18599 + }, + { + "epoch": 0.56, + "learning_rate": 2.134338784432587e-06, + "loss": 1.1179, + "step": 18600 + }, + { + "epoch": 0.56, + "learning_rate": 2.1340974893582963e-06, + "loss": 1.1049, + "step": 18601 + }, + { + "epoch": 0.56, + "learning_rate": 2.133856197767222e-06, + "loss": 1.0996, + "step": 18602 + }, + { + "epoch": 0.56, + "learning_rate": 2.1336149096616606e-06, + "loss": 1.2218, + "step": 18603 + }, + { + "epoch": 0.56, + "learning_rate": 2.133373625043908e-06, + "loss": 1.1201, + "step": 18604 + }, + { + "epoch": 0.56, + "learning_rate": 2.1331323439162623e-06, + "loss": 1.1199, + "step": 18605 + }, + { + "epoch": 0.56, + "learning_rate": 2.132891066281019e-06, + "loss": 1.2786, + "step": 18606 + }, + { + "epoch": 0.56, + "learning_rate": 2.132649792140477e-06, + "loss": 1.0687, + "step": 18607 + }, + { + "epoch": 0.56, + "learning_rate": 2.132408521496932e-06, + "loss": 1.2113, + "step": 18608 + }, + { + "epoch": 0.56, + "learning_rate": 2.1321672543526805e-06, + "loss": 1.0458, + "step": 18609 + }, + { + "epoch": 0.56, + "learning_rate": 2.1319259907100198e-06, + "loss": 1.046, + "step": 18610 + }, + { + "epoch": 0.56, + "learning_rate": 2.1316847305712464e-06, + "loss": 1.1392, + "step": 18611 + }, + { + "epoch": 0.56, + "learning_rate": 2.131443473938658e-06, + "loss": 1.0631, + "step": 18612 + }, + { + "epoch": 0.56, + "learning_rate": 2.131202220814549e-06, + "loss": 1.0074, + "step": 18613 + }, + { + "epoch": 0.56, + "learning_rate": 2.130960971201217e-06, + "loss": 1.1164, + "step": 18614 + }, + { + "epoch": 0.56, + "learning_rate": 2.1307197251009588e-06, + "loss": 0.9899, + "step": 18615 + }, + { + "epoch": 0.56, + "learning_rate": 2.1304784825160725e-06, + "loss": 1.1432, + "step": 18616 + }, + { + "epoch": 0.56, + "learning_rate": 2.1302372434488517e-06, + "loss": 1.1169, + "step": 18617 + }, + { + "epoch": 0.56, + "learning_rate": 2.1299960079015945e-06, + "loss": 1.0366, + "step": 18618 + }, + { + "epoch": 0.56, + "learning_rate": 2.129754775876597e-06, + "loss": 1.1526, + "step": 18619 + }, + { + "epoch": 0.56, + "learning_rate": 2.1295135473761557e-06, + "loss": 1.0276, + "step": 18620 + }, + { + "epoch": 0.56, + "learning_rate": 2.1292723224025675e-06, + "loss": 1.0145, + "step": 18621 + }, + { + "epoch": 0.56, + "learning_rate": 2.1290311009581277e-06, + "loss": 1.1824, + "step": 18622 + }, + { + "epoch": 0.56, + "learning_rate": 2.128789883045133e-06, + "loss": 1.1304, + "step": 18623 + }, + { + "epoch": 0.56, + "learning_rate": 2.1285486686658805e-06, + "loss": 1.1613, + "step": 18624 + }, + { + "epoch": 0.56, + "learning_rate": 2.1283074578226658e-06, + "loss": 1.1276, + "step": 18625 + }, + { + "epoch": 0.56, + "learning_rate": 2.128066250517785e-06, + "loss": 1.1149, + "step": 18626 + }, + { + "epoch": 0.56, + "learning_rate": 2.127825046753534e-06, + "loss": 1.1103, + "step": 18627 + }, + { + "epoch": 0.56, + "learning_rate": 2.1275838465322092e-06, + "loss": 1.0486, + "step": 18628 + }, + { + "epoch": 0.56, + "learning_rate": 2.127342649856108e-06, + "loss": 1.1835, + "step": 18629 + }, + { + "epoch": 0.56, + "learning_rate": 2.127101456727524e-06, + "loss": 1.1736, + "step": 18630 + }, + { + "epoch": 0.56, + "learning_rate": 2.1268602671487545e-06, + "loss": 1.1367, + "step": 18631 + }, + { + "epoch": 0.56, + "learning_rate": 2.126619081122096e-06, + "loss": 1.0654, + "step": 18632 + }, + { + "epoch": 0.56, + "learning_rate": 2.126377898649844e-06, + "loss": 1.0835, + "step": 18633 + }, + { + "epoch": 0.56, + "learning_rate": 2.1261367197342943e-06, + "loss": 1.1249, + "step": 18634 + }, + { + "epoch": 0.56, + "learning_rate": 2.1258955443777434e-06, + "loss": 1.1184, + "step": 18635 + }, + { + "epoch": 0.56, + "learning_rate": 2.1256543725824863e-06, + "loss": 1.0929, + "step": 18636 + }, + { + "epoch": 0.56, + "learning_rate": 2.1254132043508195e-06, + "loss": 1.2515, + "step": 18637 + }, + { + "epoch": 0.56, + "learning_rate": 2.1251720396850386e-06, + "loss": 1.0442, + "step": 18638 + }, + { + "epoch": 0.56, + "learning_rate": 2.124930878587439e-06, + "loss": 1.2523, + "step": 18639 + }, + { + "epoch": 0.56, + "learning_rate": 2.1246897210603173e-06, + "loss": 1.0479, + "step": 18640 + }, + { + "epoch": 0.56, + "learning_rate": 2.124448567105968e-06, + "loss": 1.0969, + "step": 18641 + }, + { + "epoch": 0.56, + "learning_rate": 2.1242074167266888e-06, + "loss": 1.2275, + "step": 18642 + }, + { + "epoch": 0.56, + "learning_rate": 2.123966269924773e-06, + "loss": 1.1541, + "step": 18643 + }, + { + "epoch": 0.56, + "learning_rate": 2.1237251267025172e-06, + "loss": 1.2259, + "step": 18644 + }, + { + "epoch": 0.56, + "learning_rate": 2.123483987062217e-06, + "loss": 1.0691, + "step": 18645 + }, + { + "epoch": 0.56, + "learning_rate": 2.1232428510061676e-06, + "loss": 1.1459, + "step": 18646 + }, + { + "epoch": 0.56, + "learning_rate": 2.1230017185366664e-06, + "loss": 1.1993, + "step": 18647 + }, + { + "epoch": 0.56, + "learning_rate": 2.1227605896560057e-06, + "loss": 1.2392, + "step": 18648 + }, + { + "epoch": 0.56, + "learning_rate": 2.1225194643664827e-06, + "loss": 1.1979, + "step": 18649 + }, + { + "epoch": 0.56, + "learning_rate": 2.1222783426703927e-06, + "loss": 1.2405, + "step": 18650 + }, + { + "epoch": 0.56, + "learning_rate": 2.1220372245700313e-06, + "loss": 1.061, + "step": 18651 + }, + { + "epoch": 0.56, + "learning_rate": 2.121796110067693e-06, + "loss": 1.1404, + "step": 18652 + }, + { + "epoch": 0.56, + "learning_rate": 2.1215549991656738e-06, + "loss": 1.1298, + "step": 18653 + }, + { + "epoch": 0.56, + "learning_rate": 2.1213138918662687e-06, + "loss": 1.0955, + "step": 18654 + }, + { + "epoch": 0.56, + "learning_rate": 2.121072788171774e-06, + "loss": 1.0924, + "step": 18655 + }, + { + "epoch": 0.56, + "learning_rate": 2.1208316880844825e-06, + "loss": 1.125, + "step": 18656 + }, + { + "epoch": 0.56, + "learning_rate": 2.120590591606691e-06, + "loss": 1.0315, + "step": 18657 + }, + { + "epoch": 0.56, + "learning_rate": 2.1203494987406943e-06, + "loss": 1.2681, + "step": 18658 + }, + { + "epoch": 0.56, + "learning_rate": 2.1201084094887873e-06, + "loss": 1.1536, + "step": 18659 + }, + { + "epoch": 0.56, + "learning_rate": 2.1198673238532667e-06, + "loss": 1.1724, + "step": 18660 + }, + { + "epoch": 0.56, + "learning_rate": 2.1196262418364245e-06, + "loss": 1.1602, + "step": 18661 + }, + { + "epoch": 0.56, + "learning_rate": 2.119385163440558e-06, + "loss": 1.1614, + "step": 18662 + }, + { + "epoch": 0.56, + "learning_rate": 2.119144088667961e-06, + "loss": 1.1638, + "step": 18663 + }, + { + "epoch": 0.56, + "learning_rate": 2.1189030175209295e-06, + "loss": 1.1305, + "step": 18664 + }, + { + "epoch": 0.56, + "learning_rate": 2.118661950001757e-06, + "loss": 1.0798, + "step": 18665 + }, + { + "epoch": 0.56, + "learning_rate": 2.1184208861127393e-06, + "loss": 1.1401, + "step": 18666 + }, + { + "epoch": 0.56, + "learning_rate": 2.118179825856171e-06, + "loss": 1.173, + "step": 18667 + }, + { + "epoch": 0.56, + "learning_rate": 2.1179387692343478e-06, + "loss": 1.1537, + "step": 18668 + }, + { + "epoch": 0.56, + "learning_rate": 2.117697716249563e-06, + "loss": 1.1787, + "step": 18669 + }, + { + "epoch": 0.56, + "learning_rate": 2.117456666904111e-06, + "loss": 1.0981, + "step": 18670 + }, + { + "epoch": 0.56, + "learning_rate": 2.1172156212002878e-06, + "loss": 0.9902, + "step": 18671 + }, + { + "epoch": 0.56, + "learning_rate": 2.116974579140387e-06, + "loss": 1.0784, + "step": 18672 + }, + { + "epoch": 0.56, + "learning_rate": 2.1167335407267053e-06, + "loss": 1.2532, + "step": 18673 + }, + { + "epoch": 0.56, + "learning_rate": 2.1164925059615342e-06, + "loss": 1.3434, + "step": 18674 + }, + { + "epoch": 0.56, + "learning_rate": 2.11625147484717e-06, + "loss": 1.1053, + "step": 18675 + }, + { + "epoch": 0.56, + "learning_rate": 2.1160104473859074e-06, + "loss": 1.1656, + "step": 18676 + }, + { + "epoch": 0.56, + "learning_rate": 2.1157694235800404e-06, + "loss": 1.0931, + "step": 18677 + }, + { + "epoch": 0.56, + "learning_rate": 2.115528403431863e-06, + "loss": 1.0064, + "step": 18678 + }, + { + "epoch": 0.56, + "learning_rate": 2.11528738694367e-06, + "loss": 1.1109, + "step": 18679 + }, + { + "epoch": 0.56, + "learning_rate": 2.1150463741177557e-06, + "loss": 1.1467, + "step": 18680 + }, + { + "epoch": 0.56, + "learning_rate": 2.114805364956416e-06, + "loss": 1.1617, + "step": 18681 + }, + { + "epoch": 0.56, + "learning_rate": 2.114564359461942e-06, + "loss": 1.0472, + "step": 18682 + }, + { + "epoch": 0.56, + "learning_rate": 2.1143233576366305e-06, + "loss": 1.1259, + "step": 18683 + }, + { + "epoch": 0.56, + "learning_rate": 2.1140823594827743e-06, + "loss": 1.1356, + "step": 18684 + }, + { + "epoch": 0.56, + "learning_rate": 2.113841365002668e-06, + "loss": 1.1784, + "step": 18685 + }, + { + "epoch": 0.56, + "learning_rate": 2.1136003741986075e-06, + "loss": 1.1871, + "step": 18686 + }, + { + "epoch": 0.56, + "learning_rate": 2.113359387072884e-06, + "loss": 1.1859, + "step": 18687 + }, + { + "epoch": 0.56, + "learning_rate": 2.113118403627793e-06, + "loss": 1.1255, + "step": 18688 + }, + { + "epoch": 0.56, + "learning_rate": 2.1128774238656284e-06, + "loss": 1.1266, + "step": 18689 + }, + { + "epoch": 0.56, + "learning_rate": 2.1126364477886847e-06, + "loss": 1.1381, + "step": 18690 + }, + { + "epoch": 0.56, + "learning_rate": 2.1123954753992554e-06, + "loss": 1.1759, + "step": 18691 + }, + { + "epoch": 0.56, + "learning_rate": 2.112154506699634e-06, + "loss": 1.1434, + "step": 18692 + }, + { + "epoch": 0.56, + "learning_rate": 2.1119135416921152e-06, + "loss": 1.2115, + "step": 18693 + }, + { + "epoch": 0.56, + "learning_rate": 2.1116725803789936e-06, + "loss": 1.072, + "step": 18694 + }, + { + "epoch": 0.56, + "learning_rate": 2.111431622762561e-06, + "loss": 1.1347, + "step": 18695 + }, + { + "epoch": 0.56, + "learning_rate": 2.1111906688451117e-06, + "loss": 1.1581, + "step": 18696 + }, + { + "epoch": 0.56, + "learning_rate": 2.1109497186289403e-06, + "loss": 1.1279, + "step": 18697 + }, + { + "epoch": 0.56, + "learning_rate": 2.1107087721163404e-06, + "loss": 1.109, + "step": 18698 + }, + { + "epoch": 0.56, + "learning_rate": 2.1104678293096067e-06, + "loss": 1.1539, + "step": 18699 + }, + { + "epoch": 0.56, + "learning_rate": 2.1102268902110303e-06, + "loss": 1.1989, + "step": 18700 + }, + { + "epoch": 0.56, + "learning_rate": 2.109985954822906e-06, + "loss": 1.0609, + "step": 18701 + }, + { + "epoch": 0.56, + "learning_rate": 2.1097450231475276e-06, + "loss": 1.0835, + "step": 18702 + }, + { + "epoch": 0.56, + "learning_rate": 2.1095040951871896e-06, + "loss": 1.0323, + "step": 18703 + }, + { + "epoch": 0.56, + "learning_rate": 2.1092631709441837e-06, + "loss": 1.1834, + "step": 18704 + }, + { + "epoch": 0.56, + "learning_rate": 2.1090222504208044e-06, + "loss": 1.2001, + "step": 18705 + }, + { + "epoch": 0.56, + "learning_rate": 2.1087813336193454e-06, + "loss": 1.089, + "step": 18706 + }, + { + "epoch": 0.56, + "learning_rate": 2.1085404205420997e-06, + "loss": 1.0908, + "step": 18707 + }, + { + "epoch": 0.56, + "learning_rate": 2.1082995111913602e-06, + "loss": 1.1307, + "step": 18708 + }, + { + "epoch": 0.56, + "learning_rate": 2.1080586055694203e-06, + "loss": 1.0406, + "step": 18709 + }, + { + "epoch": 0.56, + "learning_rate": 2.107817703678574e-06, + "loss": 1.1763, + "step": 18710 + }, + { + "epoch": 0.56, + "learning_rate": 2.107576805521114e-06, + "loss": 1.2608, + "step": 18711 + }, + { + "epoch": 0.56, + "learning_rate": 2.1073359110993354e-06, + "loss": 1.1418, + "step": 18712 + }, + { + "epoch": 0.56, + "learning_rate": 2.107095020415529e-06, + "loss": 1.1248, + "step": 18713 + }, + { + "epoch": 0.56, + "learning_rate": 2.106854133471988e-06, + "loss": 1.0106, + "step": 18714 + }, + { + "epoch": 0.56, + "learning_rate": 2.1066132502710064e-06, + "loss": 0.9861, + "step": 18715 + }, + { + "epoch": 0.56, + "learning_rate": 2.106372370814878e-06, + "loss": 1.0226, + "step": 18716 + }, + { + "epoch": 0.56, + "learning_rate": 2.106131495105895e-06, + "loss": 1.09, + "step": 18717 + }, + { + "epoch": 0.56, + "learning_rate": 2.10589062314635e-06, + "loss": 1.1647, + "step": 18718 + }, + { + "epoch": 0.56, + "learning_rate": 2.1056497549385363e-06, + "loss": 1.1434, + "step": 18719 + }, + { + "epoch": 0.56, + "learning_rate": 2.1054088904847477e-06, + "loss": 1.0916, + "step": 18720 + }, + { + "epoch": 0.56, + "learning_rate": 2.1051680297872758e-06, + "loss": 1.0136, + "step": 18721 + }, + { + "epoch": 0.56, + "learning_rate": 2.1049271728484143e-06, + "loss": 1.0704, + "step": 18722 + }, + { + "epoch": 0.56, + "learning_rate": 2.1046863196704553e-06, + "loss": 1.1168, + "step": 18723 + }, + { + "epoch": 0.56, + "learning_rate": 2.1044454702556927e-06, + "loss": 1.1318, + "step": 18724 + }, + { + "epoch": 0.56, + "learning_rate": 2.1042046246064196e-06, + "loss": 1.1801, + "step": 18725 + }, + { + "epoch": 0.56, + "learning_rate": 2.1039637827249266e-06, + "loss": 1.0715, + "step": 18726 + }, + { + "epoch": 0.56, + "learning_rate": 2.103722944613508e-06, + "loss": 1.182, + "step": 18727 + }, + { + "epoch": 0.56, + "learning_rate": 2.1034821102744556e-06, + "loss": 1.0845, + "step": 18728 + }, + { + "epoch": 0.56, + "learning_rate": 2.1032412797100643e-06, + "loss": 1.0723, + "step": 18729 + }, + { + "epoch": 0.56, + "learning_rate": 2.1030004529226234e-06, + "loss": 1.2538, + "step": 18730 + }, + { + "epoch": 0.56, + "learning_rate": 2.102759629914427e-06, + "loss": 1.1334, + "step": 18731 + }, + { + "epoch": 0.56, + "learning_rate": 2.102518810687768e-06, + "loss": 1.0167, + "step": 18732 + }, + { + "epoch": 0.56, + "learning_rate": 2.1022779952449383e-06, + "loss": 1.1067, + "step": 18733 + }, + { + "epoch": 0.56, + "learning_rate": 2.1020371835882308e-06, + "loss": 1.1436, + "step": 18734 + }, + { + "epoch": 0.56, + "learning_rate": 2.1017963757199374e-06, + "loss": 1.1401, + "step": 18735 + }, + { + "epoch": 0.56, + "learning_rate": 2.10155557164235e-06, + "loss": 1.2282, + "step": 18736 + }, + { + "epoch": 0.56, + "learning_rate": 2.1013147713577626e-06, + "loss": 1.1786, + "step": 18737 + }, + { + "epoch": 0.56, + "learning_rate": 2.101073974868467e-06, + "loss": 1.1229, + "step": 18738 + }, + { + "epoch": 0.56, + "learning_rate": 2.1008331821767543e-06, + "loss": 1.092, + "step": 18739 + }, + { + "epoch": 0.56, + "learning_rate": 2.1005923932849174e-06, + "loss": 1.1306, + "step": 18740 + }, + { + "epoch": 0.56, + "learning_rate": 2.1003516081952483e-06, + "loss": 1.0541, + "step": 18741 + }, + { + "epoch": 0.56, + "learning_rate": 2.1001108269100413e-06, + "loss": 1.0657, + "step": 18742 + }, + { + "epoch": 0.56, + "learning_rate": 2.099870049431585e-06, + "loss": 1.191, + "step": 18743 + }, + { + "epoch": 0.56, + "learning_rate": 2.0996292757621727e-06, + "loss": 1.1149, + "step": 18744 + }, + { + "epoch": 0.56, + "learning_rate": 2.0993885059040974e-06, + "loss": 1.1442, + "step": 18745 + }, + { + "epoch": 0.56, + "learning_rate": 2.099147739859651e-06, + "loss": 1.1466, + "step": 18746 + }, + { + "epoch": 0.56, + "learning_rate": 2.098906977631125e-06, + "loss": 1.1511, + "step": 18747 + }, + { + "epoch": 0.56, + "learning_rate": 2.0986662192208108e-06, + "loss": 1.1431, + "step": 18748 + }, + { + "epoch": 0.56, + "learning_rate": 2.098425464631001e-06, + "loss": 1.087, + "step": 18749 + }, + { + "epoch": 0.56, + "learning_rate": 2.098184713863987e-06, + "loss": 1.0081, + "step": 18750 + }, + { + "epoch": 0.56, + "learning_rate": 2.0979439669220626e-06, + "loss": 1.0108, + "step": 18751 + }, + { + "epoch": 0.56, + "learning_rate": 2.097703223807517e-06, + "loss": 1.0934, + "step": 18752 + }, + { + "epoch": 0.56, + "learning_rate": 2.0974624845226427e-06, + "loss": 1.0634, + "step": 18753 + }, + { + "epoch": 0.56, + "learning_rate": 2.0972217490697316e-06, + "loss": 1.1246, + "step": 18754 + }, + { + "epoch": 0.56, + "learning_rate": 2.096981017451077e-06, + "loss": 1.3098, + "step": 18755 + }, + { + "epoch": 0.57, + "learning_rate": 2.0967402896689677e-06, + "loss": 1.1605, + "step": 18756 + }, + { + "epoch": 0.57, + "learning_rate": 2.0964995657256965e-06, + "loss": 1.1138, + "step": 18757 + }, + { + "epoch": 0.57, + "learning_rate": 2.096258845623555e-06, + "loss": 1.0773, + "step": 18758 + }, + { + "epoch": 0.57, + "learning_rate": 2.0960181293648357e-06, + "loss": 1.0995, + "step": 18759 + }, + { + "epoch": 0.57, + "learning_rate": 2.0957774169518284e-06, + "loss": 1.092, + "step": 18760 + }, + { + "epoch": 0.57, + "learning_rate": 2.0955367083868254e-06, + "loss": 1.1152, + "step": 18761 + }, + { + "epoch": 0.57, + "learning_rate": 2.0952960036721186e-06, + "loss": 0.9997, + "step": 18762 + }, + { + "epoch": 0.57, + "learning_rate": 2.0950553028099997e-06, + "loss": 1.1654, + "step": 18763 + }, + { + "epoch": 0.57, + "learning_rate": 2.094814605802758e-06, + "loss": 1.1587, + "step": 18764 + }, + { + "epoch": 0.57, + "learning_rate": 2.0945739126526864e-06, + "loss": 1.0474, + "step": 18765 + }, + { + "epoch": 0.57, + "learning_rate": 2.0943332233620756e-06, + "loss": 1.1011, + "step": 18766 + }, + { + "epoch": 0.57, + "learning_rate": 2.0940925379332176e-06, + "loss": 1.129, + "step": 18767 + }, + { + "epoch": 0.57, + "learning_rate": 2.0938518563684037e-06, + "loss": 1.1016, + "step": 18768 + }, + { + "epoch": 0.57, + "learning_rate": 2.0936111786699237e-06, + "loss": 1.1389, + "step": 18769 + }, + { + "epoch": 0.57, + "learning_rate": 2.09337050484007e-06, + "loss": 1.1968, + "step": 18770 + }, + { + "epoch": 0.57, + "learning_rate": 2.0931298348811323e-06, + "loss": 0.9937, + "step": 18771 + }, + { + "epoch": 0.57, + "learning_rate": 2.0928891687954037e-06, + "loss": 1.1478, + "step": 18772 + }, + { + "epoch": 0.57, + "learning_rate": 2.0926485065851736e-06, + "loss": 1.1194, + "step": 18773 + }, + { + "epoch": 0.57, + "learning_rate": 2.0924078482527336e-06, + "loss": 1.256, + "step": 18774 + }, + { + "epoch": 0.57, + "learning_rate": 2.0921671938003745e-06, + "loss": 1.0274, + "step": 18775 + }, + { + "epoch": 0.57, + "learning_rate": 2.0919265432303884e-06, + "loss": 1.2088, + "step": 18776 + }, + { + "epoch": 0.57, + "learning_rate": 2.091685896545064e-06, + "loss": 1.1266, + "step": 18777 + }, + { + "epoch": 0.57, + "learning_rate": 2.0914452537466936e-06, + "loss": 1.1248, + "step": 18778 + }, + { + "epoch": 0.57, + "learning_rate": 2.091204614837567e-06, + "loss": 1.1652, + "step": 18779 + }, + { + "epoch": 0.57, + "learning_rate": 2.0909639798199756e-06, + "loss": 1.2325, + "step": 18780 + }, + { + "epoch": 0.57, + "learning_rate": 2.0907233486962113e-06, + "loss": 1.1396, + "step": 18781 + }, + { + "epoch": 0.57, + "learning_rate": 2.0904827214685626e-06, + "loss": 1.0755, + "step": 18782 + }, + { + "epoch": 0.57, + "learning_rate": 2.090242098139321e-06, + "loss": 1.1249, + "step": 18783 + }, + { + "epoch": 0.57, + "learning_rate": 2.0900014787107775e-06, + "loss": 1.0887, + "step": 18784 + }, + { + "epoch": 0.57, + "learning_rate": 2.089760863185223e-06, + "loss": 1.0715, + "step": 18785 + }, + { + "epoch": 0.57, + "learning_rate": 2.089520251564947e-06, + "loss": 1.1662, + "step": 18786 + }, + { + "epoch": 0.57, + "learning_rate": 2.0892796438522405e-06, + "loss": 1.1879, + "step": 18787 + }, + { + "epoch": 0.57, + "learning_rate": 2.089039040049394e-06, + "loss": 1.1385, + "step": 18788 + }, + { + "epoch": 0.57, + "learning_rate": 2.0887984401586985e-06, + "loss": 1.041, + "step": 18789 + }, + { + "epoch": 0.57, + "learning_rate": 2.0885578441824435e-06, + "loss": 1.1868, + "step": 18790 + }, + { + "epoch": 0.57, + "learning_rate": 2.088317252122919e-06, + "loss": 1.0262, + "step": 18791 + }, + { + "epoch": 0.57, + "learning_rate": 2.0880766639824165e-06, + "loss": 1.1484, + "step": 18792 + }, + { + "epoch": 0.57, + "learning_rate": 2.0878360797632257e-06, + "loss": 1.1548, + "step": 18793 + }, + { + "epoch": 0.57, + "learning_rate": 2.0875954994676376e-06, + "loss": 1.1339, + "step": 18794 + }, + { + "epoch": 0.57, + "learning_rate": 2.087354923097941e-06, + "loss": 1.0225, + "step": 18795 + }, + { + "epoch": 0.57, + "learning_rate": 2.0871143506564265e-06, + "loss": 1.106, + "step": 18796 + }, + { + "epoch": 0.57, + "learning_rate": 2.0868737821453846e-06, + "loss": 1.0719, + "step": 18797 + }, + { + "epoch": 0.57, + "learning_rate": 2.086633217567106e-06, + "loss": 1.0817, + "step": 18798 + }, + { + "epoch": 0.57, + "learning_rate": 2.0863926569238797e-06, + "loss": 1.0107, + "step": 18799 + }, + { + "epoch": 0.57, + "learning_rate": 2.086152100217996e-06, + "loss": 1.0624, + "step": 18800 + }, + { + "epoch": 0.57, + "learning_rate": 2.0859115474517454e-06, + "loss": 1.1635, + "step": 18801 + }, + { + "epoch": 0.57, + "learning_rate": 2.0856709986274175e-06, + "loss": 1.0285, + "step": 18802 + }, + { + "epoch": 0.57, + "learning_rate": 2.0854304537473014e-06, + "loss": 1.1201, + "step": 18803 + }, + { + "epoch": 0.57, + "learning_rate": 2.085189912813688e-06, + "loss": 1.1794, + "step": 18804 + }, + { + "epoch": 0.57, + "learning_rate": 2.084949375828867e-06, + "loss": 1.2799, + "step": 18805 + }, + { + "epoch": 0.57, + "learning_rate": 2.0847088427951274e-06, + "loss": 1.2022, + "step": 18806 + }, + { + "epoch": 0.57, + "learning_rate": 2.084468313714761e-06, + "loss": 1.1957, + "step": 18807 + }, + { + "epoch": 0.57, + "learning_rate": 2.0842277885900553e-06, + "loss": 1.1544, + "step": 18808 + }, + { + "epoch": 0.57, + "learning_rate": 2.083987267423301e-06, + "loss": 1.0029, + "step": 18809 + }, + { + "epoch": 0.57, + "learning_rate": 2.0837467502167867e-06, + "loss": 0.9846, + "step": 18810 + }, + { + "epoch": 0.57, + "learning_rate": 2.0835062369728044e-06, + "loss": 1.0344, + "step": 18811 + }, + { + "epoch": 0.57, + "learning_rate": 2.0832657276936415e-06, + "loss": 1.1927, + "step": 18812 + }, + { + "epoch": 0.57, + "learning_rate": 2.083025222381588e-06, + "loss": 1.2679, + "step": 18813 + }, + { + "epoch": 0.57, + "learning_rate": 2.0827847210389328e-06, + "loss": 1.0879, + "step": 18814 + }, + { + "epoch": 0.57, + "learning_rate": 2.0825442236679676e-06, + "loss": 1.0745, + "step": 18815 + }, + { + "epoch": 0.57, + "learning_rate": 2.082303730270979e-06, + "loss": 1.1147, + "step": 18816 + }, + { + "epoch": 0.57, + "learning_rate": 2.0820632408502584e-06, + "loss": 1.119, + "step": 18817 + }, + { + "epoch": 0.57, + "learning_rate": 2.081822755408094e-06, + "loss": 1.1328, + "step": 18818 + }, + { + "epoch": 0.57, + "learning_rate": 2.0815822739467754e-06, + "loss": 1.0752, + "step": 18819 + }, + { + "epoch": 0.57, + "learning_rate": 2.0813417964685937e-06, + "loss": 1.1285, + "step": 18820 + }, + { + "epoch": 0.57, + "learning_rate": 2.0811013229758355e-06, + "loss": 0.9761, + "step": 18821 + }, + { + "epoch": 0.57, + "learning_rate": 2.0808608534707903e-06, + "loss": 1.0932, + "step": 18822 + }, + { + "epoch": 0.57, + "learning_rate": 2.0806203879557483e-06, + "loss": 1.1645, + "step": 18823 + }, + { + "epoch": 0.57, + "learning_rate": 2.0803799264329993e-06, + "loss": 1.1281, + "step": 18824 + }, + { + "epoch": 0.57, + "learning_rate": 2.08013946890483e-06, + "loss": 1.0539, + "step": 18825 + }, + { + "epoch": 0.57, + "learning_rate": 2.0798990153735306e-06, + "loss": 1.1426, + "step": 18826 + }, + { + "epoch": 0.57, + "learning_rate": 2.0796585658413906e-06, + "loss": 1.0593, + "step": 18827 + }, + { + "epoch": 0.57, + "learning_rate": 2.0794181203106993e-06, + "loss": 1.1703, + "step": 18828 + }, + { + "epoch": 0.57, + "learning_rate": 2.079177678783744e-06, + "loss": 1.1115, + "step": 18829 + }, + { + "epoch": 0.57, + "learning_rate": 2.078937241262815e-06, + "loss": 1.0381, + "step": 18830 + }, + { + "epoch": 0.57, + "learning_rate": 2.0786968077502e-06, + "loss": 1.1208, + "step": 18831 + }, + { + "epoch": 0.57, + "learning_rate": 2.078456378248189e-06, + "loss": 1.0919, + "step": 18832 + }, + { + "epoch": 0.57, + "learning_rate": 2.0782159527590712e-06, + "loss": 1.0062, + "step": 18833 + }, + { + "epoch": 0.57, + "learning_rate": 2.0779755312851334e-06, + "loss": 1.016, + "step": 18834 + }, + { + "epoch": 0.57, + "learning_rate": 2.077735113828665e-06, + "loss": 1.0655, + "step": 18835 + }, + { + "epoch": 0.57, + "learning_rate": 2.077494700391955e-06, + "loss": 1.1531, + "step": 18836 + }, + { + "epoch": 0.57, + "learning_rate": 2.0772542909772935e-06, + "loss": 1.3226, + "step": 18837 + }, + { + "epoch": 0.57, + "learning_rate": 2.077013885586966e-06, + "loss": 1.1322, + "step": 18838 + }, + { + "epoch": 0.57, + "learning_rate": 2.0767734842232628e-06, + "loss": 1.1211, + "step": 18839 + }, + { + "epoch": 0.57, + "learning_rate": 2.076533086888472e-06, + "loss": 1.1452, + "step": 18840 + }, + { + "epoch": 0.57, + "learning_rate": 2.076292693584883e-06, + "loss": 1.1699, + "step": 18841 + }, + { + "epoch": 0.57, + "learning_rate": 2.076052304314783e-06, + "loss": 1.1524, + "step": 18842 + }, + { + "epoch": 0.57, + "learning_rate": 2.0758119190804603e-06, + "loss": 1.167, + "step": 18843 + }, + { + "epoch": 0.57, + "learning_rate": 2.0755715378842046e-06, + "loss": 1.1564, + "step": 18844 + }, + { + "epoch": 0.57, + "learning_rate": 2.075331160728303e-06, + "loss": 1.0848, + "step": 18845 + }, + { + "epoch": 0.57, + "learning_rate": 2.0750907876150454e-06, + "loss": 1.0966, + "step": 18846 + }, + { + "epoch": 0.57, + "learning_rate": 2.074850418546718e-06, + "loss": 1.0629, + "step": 18847 + }, + { + "epoch": 0.57, + "learning_rate": 2.0746100535256097e-06, + "loss": 1.1579, + "step": 18848 + }, + { + "epoch": 0.57, + "learning_rate": 2.074369692554009e-06, + "loss": 1.0831, + "step": 18849 + }, + { + "epoch": 0.57, + "learning_rate": 2.0741293356342045e-06, + "loss": 1.1066, + "step": 18850 + }, + { + "epoch": 0.57, + "learning_rate": 2.0738889827684827e-06, + "loss": 1.1666, + "step": 18851 + }, + { + "epoch": 0.57, + "learning_rate": 2.0736486339591327e-06, + "loss": 1.0728, + "step": 18852 + }, + { + "epoch": 0.57, + "learning_rate": 2.0734082892084423e-06, + "loss": 1.0913, + "step": 18853 + }, + { + "epoch": 0.57, + "learning_rate": 2.0731679485187e-06, + "loss": 1.1466, + "step": 18854 + }, + { + "epoch": 0.57, + "learning_rate": 2.072927611892193e-06, + "loss": 0.9597, + "step": 18855 + }, + { + "epoch": 0.57, + "learning_rate": 2.072687279331209e-06, + "loss": 1.1471, + "step": 18856 + }, + { + "epoch": 0.57, + "learning_rate": 2.0724469508380367e-06, + "loss": 1.1277, + "step": 18857 + }, + { + "epoch": 0.57, + "learning_rate": 2.072206626414963e-06, + "loss": 1.1243, + "step": 18858 + }, + { + "epoch": 0.57, + "learning_rate": 2.0719663060642777e-06, + "loss": 1.0801, + "step": 18859 + }, + { + "epoch": 0.57, + "learning_rate": 2.071725989788266e-06, + "loss": 1.22, + "step": 18860 + }, + { + "epoch": 0.57, + "learning_rate": 2.0714856775892165e-06, + "loss": 1.2311, + "step": 18861 + }, + { + "epoch": 0.57, + "learning_rate": 2.0712453694694167e-06, + "loss": 0.9444, + "step": 18862 + }, + { + "epoch": 0.57, + "learning_rate": 2.071005065431156e-06, + "loss": 1.0182, + "step": 18863 + }, + { + "epoch": 0.57, + "learning_rate": 2.070764765476719e-06, + "loss": 1.1797, + "step": 18864 + }, + { + "epoch": 0.57, + "learning_rate": 2.070524469608395e-06, + "loss": 1.1336, + "step": 18865 + }, + { + "epoch": 0.57, + "learning_rate": 2.070284177828471e-06, + "loss": 1.1034, + "step": 18866 + }, + { + "epoch": 0.57, + "learning_rate": 2.0700438901392355e-06, + "loss": 1.1222, + "step": 18867 + }, + { + "epoch": 0.57, + "learning_rate": 2.0698036065429746e-06, + "loss": 1.3265, + "step": 18868 + }, + { + "epoch": 0.57, + "learning_rate": 2.0695633270419757e-06, + "loss": 1.0816, + "step": 18869 + }, + { + "epoch": 0.57, + "learning_rate": 2.069323051638527e-06, + "loss": 1.0903, + "step": 18870 + }, + { + "epoch": 0.57, + "learning_rate": 2.0690827803349156e-06, + "loss": 1.1207, + "step": 18871 + }, + { + "epoch": 0.57, + "learning_rate": 2.068842513133429e-06, + "loss": 1.0399, + "step": 18872 + }, + { + "epoch": 0.57, + "learning_rate": 2.0686022500363533e-06, + "loss": 1.1518, + "step": 18873 + }, + { + "epoch": 0.57, + "learning_rate": 2.0683619910459764e-06, + "loss": 1.2184, + "step": 18874 + }, + { + "epoch": 0.57, + "learning_rate": 2.068121736164585e-06, + "loss": 1.2869, + "step": 18875 + }, + { + "epoch": 0.57, + "learning_rate": 2.0678814853944685e-06, + "loss": 1.1581, + "step": 18876 + }, + { + "epoch": 0.57, + "learning_rate": 2.0676412387379107e-06, + "loss": 1.1331, + "step": 18877 + }, + { + "epoch": 0.57, + "learning_rate": 2.0674009961972004e-06, + "loss": 1.0408, + "step": 18878 + }, + { + "epoch": 0.57, + "learning_rate": 2.067160757774624e-06, + "loss": 1.0908, + "step": 18879 + }, + { + "epoch": 0.57, + "learning_rate": 2.066920523472469e-06, + "loss": 1.28, + "step": 18880 + }, + { + "epoch": 0.57, + "learning_rate": 2.0666802932930218e-06, + "loss": 1.1683, + "step": 18881 + }, + { + "epoch": 0.57, + "learning_rate": 2.0664400672385702e-06, + "loss": 1.2886, + "step": 18882 + }, + { + "epoch": 0.57, + "learning_rate": 2.0661998453113998e-06, + "loss": 1.1664, + "step": 18883 + }, + { + "epoch": 0.57, + "learning_rate": 2.065959627513798e-06, + "loss": 1.1499, + "step": 18884 + }, + { + "epoch": 0.57, + "learning_rate": 2.0657194138480515e-06, + "loss": 1.2281, + "step": 18885 + }, + { + "epoch": 0.57, + "learning_rate": 2.0654792043164468e-06, + "loss": 1.0354, + "step": 18886 + }, + { + "epoch": 0.57, + "learning_rate": 2.065238998921271e-06, + "loss": 1.1426, + "step": 18887 + }, + { + "epoch": 0.57, + "learning_rate": 2.0649987976648102e-06, + "loss": 1.2399, + "step": 18888 + }, + { + "epoch": 0.57, + "learning_rate": 2.064758600549353e-06, + "loss": 1.0776, + "step": 18889 + }, + { + "epoch": 0.57, + "learning_rate": 2.0645184075771825e-06, + "loss": 1.1086, + "step": 18890 + }, + { + "epoch": 0.57, + "learning_rate": 2.0642782187505875e-06, + "loss": 1.1361, + "step": 18891 + }, + { + "epoch": 0.57, + "learning_rate": 2.064038034071854e-06, + "loss": 1.0103, + "step": 18892 + }, + { + "epoch": 0.57, + "learning_rate": 2.063797853543269e-06, + "loss": 1.2328, + "step": 18893 + }, + { + "epoch": 0.57, + "learning_rate": 2.063557677167118e-06, + "loss": 1.0431, + "step": 18894 + }, + { + "epoch": 0.57, + "learning_rate": 2.063317504945687e-06, + "loss": 1.0508, + "step": 18895 + }, + { + "epoch": 0.57, + "learning_rate": 2.0630773368812634e-06, + "loss": 1.2059, + "step": 18896 + }, + { + "epoch": 0.57, + "learning_rate": 2.062837172976133e-06, + "loss": 1.0943, + "step": 18897 + }, + { + "epoch": 0.57, + "learning_rate": 2.062597013232583e-06, + "loss": 1.1365, + "step": 18898 + }, + { + "epoch": 0.57, + "learning_rate": 2.062356857652898e-06, + "loss": 1.103, + "step": 18899 + }, + { + "epoch": 0.57, + "learning_rate": 2.062116706239365e-06, + "loss": 1.07, + "step": 18900 + }, + { + "epoch": 0.57, + "learning_rate": 2.06187655899427e-06, + "loss": 1.2076, + "step": 18901 + }, + { + "epoch": 0.57, + "learning_rate": 2.0616364159199006e-06, + "loss": 1.1379, + "step": 18902 + }, + { + "epoch": 0.57, + "learning_rate": 2.06139627701854e-06, + "loss": 1.0497, + "step": 18903 + }, + { + "epoch": 0.57, + "learning_rate": 2.061156142292476e-06, + "loss": 1.1193, + "step": 18904 + }, + { + "epoch": 0.57, + "learning_rate": 2.0609160117439937e-06, + "loss": 1.1213, + "step": 18905 + }, + { + "epoch": 0.57, + "learning_rate": 2.0606758853753805e-06, + "loss": 1.0759, + "step": 18906 + }, + { + "epoch": 0.57, + "learning_rate": 2.0604357631889206e-06, + "loss": 1.1093, + "step": 18907 + }, + { + "epoch": 0.57, + "learning_rate": 2.0601956451869003e-06, + "loss": 1.0669, + "step": 18908 + }, + { + "epoch": 0.57, + "learning_rate": 2.0599555313716055e-06, + "loss": 1.1873, + "step": 18909 + }, + { + "epoch": 0.57, + "learning_rate": 2.0597154217453224e-06, + "loss": 1.0776, + "step": 18910 + }, + { + "epoch": 0.57, + "learning_rate": 2.059475316310337e-06, + "loss": 1.1097, + "step": 18911 + }, + { + "epoch": 0.57, + "learning_rate": 2.0592352150689333e-06, + "loss": 1.119, + "step": 18912 + }, + { + "epoch": 0.57, + "learning_rate": 2.0589951180233984e-06, + "loss": 0.9672, + "step": 18913 + }, + { + "epoch": 0.57, + "learning_rate": 2.058755025176018e-06, + "loss": 1.0205, + "step": 18914 + }, + { + "epoch": 0.57, + "learning_rate": 2.0585149365290778e-06, + "loss": 1.0718, + "step": 18915 + }, + { + "epoch": 0.57, + "learning_rate": 2.0582748520848618e-06, + "loss": 1.1952, + "step": 18916 + }, + { + "epoch": 0.57, + "learning_rate": 2.0580347718456566e-06, + "loss": 1.1796, + "step": 18917 + }, + { + "epoch": 0.57, + "learning_rate": 2.0577946958137475e-06, + "loss": 1.1998, + "step": 18918 + }, + { + "epoch": 0.57, + "learning_rate": 2.0575546239914214e-06, + "loss": 1.2219, + "step": 18919 + }, + { + "epoch": 0.57, + "learning_rate": 2.0573145563809603e-06, + "loss": 1.09, + "step": 18920 + }, + { + "epoch": 0.57, + "learning_rate": 2.057074492984652e-06, + "loss": 1.1005, + "step": 18921 + }, + { + "epoch": 0.57, + "learning_rate": 2.056834433804781e-06, + "loss": 1.1562, + "step": 18922 + }, + { + "epoch": 0.57, + "learning_rate": 2.056594378843633e-06, + "loss": 1.1665, + "step": 18923 + }, + { + "epoch": 0.57, + "learning_rate": 2.0563543281034933e-06, + "loss": 1.055, + "step": 18924 + }, + { + "epoch": 0.57, + "learning_rate": 2.0561142815866463e-06, + "loss": 1.1147, + "step": 18925 + }, + { + "epoch": 0.57, + "learning_rate": 2.0558742392953772e-06, + "loss": 1.047, + "step": 18926 + }, + { + "epoch": 0.57, + "learning_rate": 2.0556342012319716e-06, + "loss": 1.2299, + "step": 18927 + }, + { + "epoch": 0.57, + "learning_rate": 2.0553941673987153e-06, + "loss": 1.0388, + "step": 18928 + }, + { + "epoch": 0.57, + "learning_rate": 2.0551541377978917e-06, + "loss": 1.1548, + "step": 18929 + }, + { + "epoch": 0.57, + "learning_rate": 2.0549141124317864e-06, + "loss": 1.2458, + "step": 18930 + }, + { + "epoch": 0.57, + "learning_rate": 2.0546740913026844e-06, + "loss": 1.1918, + "step": 18931 + }, + { + "epoch": 0.57, + "learning_rate": 2.0544340744128717e-06, + "loss": 1.0829, + "step": 18932 + }, + { + "epoch": 0.57, + "learning_rate": 2.0541940617646307e-06, + "loss": 1.0366, + "step": 18933 + }, + { + "epoch": 0.57, + "learning_rate": 2.0539540533602476e-06, + "loss": 0.9856, + "step": 18934 + }, + { + "epoch": 0.57, + "learning_rate": 2.053714049202007e-06, + "loss": 1.1104, + "step": 18935 + }, + { + "epoch": 0.57, + "learning_rate": 2.0534740492921947e-06, + "loss": 1.1593, + "step": 18936 + }, + { + "epoch": 0.57, + "learning_rate": 2.0532340536330934e-06, + "loss": 1.1942, + "step": 18937 + }, + { + "epoch": 0.57, + "learning_rate": 2.052994062226989e-06, + "loss": 1.0866, + "step": 18938 + }, + { + "epoch": 0.57, + "learning_rate": 2.0527540750761652e-06, + "loss": 1.0982, + "step": 18939 + }, + { + "epoch": 0.57, + "learning_rate": 2.052514092182908e-06, + "loss": 1.083, + "step": 18940 + }, + { + "epoch": 0.57, + "learning_rate": 2.052274113549502e-06, + "loss": 1.0805, + "step": 18941 + }, + { + "epoch": 0.57, + "learning_rate": 2.0520341391782296e-06, + "loss": 1.133, + "step": 18942 + }, + { + "epoch": 0.57, + "learning_rate": 2.051794169071377e-06, + "loss": 1.0461, + "step": 18943 + }, + { + "epoch": 0.57, + "learning_rate": 2.051554203231227e-06, + "loss": 1.1024, + "step": 18944 + }, + { + "epoch": 0.57, + "learning_rate": 2.0513142416600666e-06, + "loss": 1.1644, + "step": 18945 + }, + { + "epoch": 0.57, + "learning_rate": 2.051074284360178e-06, + "loss": 0.9968, + "step": 18946 + }, + { + "epoch": 0.57, + "learning_rate": 2.050834331333845e-06, + "loss": 1.0734, + "step": 18947 + }, + { + "epoch": 0.57, + "learning_rate": 2.0505943825833533e-06, + "loss": 1.0579, + "step": 18948 + }, + { + "epoch": 0.57, + "learning_rate": 2.0503544381109876e-06, + "loss": 1.11, + "step": 18949 + }, + { + "epoch": 0.57, + "learning_rate": 2.05011449791903e-06, + "loss": 1.2106, + "step": 18950 + }, + { + "epoch": 0.57, + "learning_rate": 2.0498745620097658e-06, + "loss": 1.1884, + "step": 18951 + }, + { + "epoch": 0.57, + "learning_rate": 2.049634630385479e-06, + "loss": 1.0637, + "step": 18952 + }, + { + "epoch": 0.57, + "learning_rate": 2.049394703048454e-06, + "loss": 1.1286, + "step": 18953 + }, + { + "epoch": 0.57, + "learning_rate": 2.0491547800009746e-06, + "loss": 1.0853, + "step": 18954 + }, + { + "epoch": 0.57, + "learning_rate": 2.048914861245324e-06, + "loss": 1.0969, + "step": 18955 + }, + { + "epoch": 0.57, + "learning_rate": 2.048674946783787e-06, + "loss": 1.1891, + "step": 18956 + }, + { + "epoch": 0.57, + "learning_rate": 2.048435036618647e-06, + "loss": 1.0439, + "step": 18957 + }, + { + "epoch": 0.57, + "learning_rate": 2.0481951307521886e-06, + "loss": 1.0482, + "step": 18958 + }, + { + "epoch": 0.57, + "learning_rate": 2.0479552291866944e-06, + "loss": 1.0192, + "step": 18959 + }, + { + "epoch": 0.57, + "learning_rate": 2.047715331924448e-06, + "loss": 1.2094, + "step": 18960 + }, + { + "epoch": 0.57, + "learning_rate": 2.0474754389677346e-06, + "loss": 1.1097, + "step": 18961 + }, + { + "epoch": 0.57, + "learning_rate": 2.0472355503188372e-06, + "loss": 1.1371, + "step": 18962 + }, + { + "epoch": 0.57, + "learning_rate": 2.046995665980039e-06, + "loss": 1.1376, + "step": 18963 + }, + { + "epoch": 0.57, + "learning_rate": 2.046755785953624e-06, + "loss": 1.1334, + "step": 18964 + }, + { + "epoch": 0.57, + "learning_rate": 2.0465159102418755e-06, + "loss": 0.9823, + "step": 18965 + }, + { + "epoch": 0.57, + "learning_rate": 2.046276038847077e-06, + "loss": 1.1208, + "step": 18966 + }, + { + "epoch": 0.57, + "learning_rate": 2.0460361717715128e-06, + "loss": 1.1799, + "step": 18967 + }, + { + "epoch": 0.57, + "learning_rate": 2.045796309017465e-06, + "loss": 1.2462, + "step": 18968 + }, + { + "epoch": 0.57, + "learning_rate": 2.045556450587217e-06, + "loss": 1.1092, + "step": 18969 + }, + { + "epoch": 0.57, + "learning_rate": 2.0453165964830533e-06, + "loss": 1.103, + "step": 18970 + }, + { + "epoch": 0.57, + "learning_rate": 2.0450767467072575e-06, + "loss": 1.126, + "step": 18971 + }, + { + "epoch": 0.57, + "learning_rate": 2.044836901262111e-06, + "loss": 1.0905, + "step": 18972 + }, + { + "epoch": 0.57, + "learning_rate": 2.0445970601498984e-06, + "loss": 1.0632, + "step": 18973 + }, + { + "epoch": 0.57, + "learning_rate": 2.044357223372902e-06, + "loss": 1.1043, + "step": 18974 + }, + { + "epoch": 0.57, + "learning_rate": 2.0441173909334064e-06, + "loss": 1.0909, + "step": 18975 + }, + { + "epoch": 0.57, + "learning_rate": 2.0438775628336928e-06, + "loss": 1.1003, + "step": 18976 + }, + { + "epoch": 0.57, + "learning_rate": 2.043637739076045e-06, + "loss": 1.1351, + "step": 18977 + }, + { + "epoch": 0.57, + "learning_rate": 2.043397919662746e-06, + "loss": 1.1525, + "step": 18978 + }, + { + "epoch": 0.57, + "learning_rate": 2.043158104596079e-06, + "loss": 1.2548, + "step": 18979 + }, + { + "epoch": 0.57, + "learning_rate": 2.0429182938783276e-06, + "loss": 1.0671, + "step": 18980 + }, + { + "epoch": 0.57, + "learning_rate": 2.0426784875117734e-06, + "loss": 1.0883, + "step": 18981 + }, + { + "epoch": 0.57, + "learning_rate": 2.0424386854986993e-06, + "loss": 1.1075, + "step": 18982 + }, + { + "epoch": 0.57, + "learning_rate": 2.0421988878413887e-06, + "loss": 1.0009, + "step": 18983 + }, + { + "epoch": 0.57, + "learning_rate": 2.0419590945421254e-06, + "loss": 1.1166, + "step": 18984 + }, + { + "epoch": 0.57, + "learning_rate": 2.04171930560319e-06, + "loss": 1.1307, + "step": 18985 + }, + { + "epoch": 0.57, + "learning_rate": 2.0414795210268658e-06, + "loss": 1.0761, + "step": 18986 + }, + { + "epoch": 0.57, + "learning_rate": 2.041239740815436e-06, + "loss": 1.161, + "step": 18987 + }, + { + "epoch": 0.57, + "learning_rate": 2.0409999649711837e-06, + "loss": 1.1465, + "step": 18988 + }, + { + "epoch": 0.57, + "learning_rate": 2.0407601934963896e-06, + "loss": 1.124, + "step": 18989 + }, + { + "epoch": 0.57, + "learning_rate": 2.0405204263933375e-06, + "loss": 1.0268, + "step": 18990 + }, + { + "epoch": 0.57, + "learning_rate": 2.0402806636643098e-06, + "loss": 1.0876, + "step": 18991 + }, + { + "epoch": 0.57, + "learning_rate": 2.0400409053115883e-06, + "loss": 1.1262, + "step": 18992 + }, + { + "epoch": 0.57, + "learning_rate": 2.0398011513374566e-06, + "loss": 1.2939, + "step": 18993 + }, + { + "epoch": 0.57, + "learning_rate": 2.0395614017441955e-06, + "loss": 1.1579, + "step": 18994 + }, + { + "epoch": 0.57, + "learning_rate": 2.039321656534089e-06, + "loss": 1.1363, + "step": 18995 + }, + { + "epoch": 0.57, + "learning_rate": 2.0390819157094174e-06, + "loss": 1.0834, + "step": 18996 + }, + { + "epoch": 0.57, + "learning_rate": 2.0388421792724656e-06, + "loss": 1.0829, + "step": 18997 + }, + { + "epoch": 0.57, + "learning_rate": 2.0386024472255127e-06, + "loss": 1.1733, + "step": 18998 + }, + { + "epoch": 0.57, + "learning_rate": 2.038362719570843e-06, + "loss": 1.2906, + "step": 18999 + }, + { + "epoch": 0.57, + "learning_rate": 2.038122996310737e-06, + "loss": 1.2875, + "step": 19000 + }, + { + "epoch": 0.57, + "learning_rate": 2.0378832774474793e-06, + "loss": 1.0918, + "step": 19001 + }, + { + "epoch": 0.57, + "learning_rate": 2.037643562983349e-06, + "loss": 1.0082, + "step": 19002 + }, + { + "epoch": 0.57, + "learning_rate": 2.0374038529206293e-06, + "loss": 1.1705, + "step": 19003 + }, + { + "epoch": 0.57, + "learning_rate": 2.037164147261602e-06, + "loss": 1.0469, + "step": 19004 + }, + { + "epoch": 0.57, + "learning_rate": 2.0369244460085494e-06, + "loss": 1.1171, + "step": 19005 + }, + { + "epoch": 0.57, + "learning_rate": 2.0366847491637535e-06, + "loss": 1.121, + "step": 19006 + }, + { + "epoch": 0.57, + "learning_rate": 2.036445056729495e-06, + "loss": 1.1407, + "step": 19007 + }, + { + "epoch": 0.57, + "learning_rate": 2.036205368708056e-06, + "loss": 1.2538, + "step": 19008 + }, + { + "epoch": 0.57, + "learning_rate": 2.035965685101719e-06, + "loss": 1.0401, + "step": 19009 + }, + { + "epoch": 0.57, + "learning_rate": 2.035726005912766e-06, + "loss": 1.1209, + "step": 19010 + }, + { + "epoch": 0.57, + "learning_rate": 2.035486331143477e-06, + "loss": 1.147, + "step": 19011 + }, + { + "epoch": 0.57, + "learning_rate": 2.035246660796134e-06, + "loss": 1.1494, + "step": 19012 + }, + { + "epoch": 0.57, + "learning_rate": 2.0350069948730197e-06, + "loss": 1.2766, + "step": 19013 + }, + { + "epoch": 0.57, + "learning_rate": 2.0347673333764155e-06, + "loss": 1.0643, + "step": 19014 + }, + { + "epoch": 0.57, + "learning_rate": 2.034527676308601e-06, + "loss": 1.2264, + "step": 19015 + }, + { + "epoch": 0.57, + "learning_rate": 2.034288023671859e-06, + "loss": 1.1591, + "step": 19016 + }, + { + "epoch": 0.57, + "learning_rate": 2.034048375468471e-06, + "loss": 1.1575, + "step": 19017 + }, + { + "epoch": 0.57, + "learning_rate": 2.0338087317007172e-06, + "loss": 1.1616, + "step": 19018 + }, + { + "epoch": 0.57, + "learning_rate": 2.033569092370881e-06, + "loss": 1.147, + "step": 19019 + }, + { + "epoch": 0.57, + "learning_rate": 2.033329457481242e-06, + "loss": 1.1446, + "step": 19020 + }, + { + "epoch": 0.57, + "learning_rate": 2.0330898270340813e-06, + "loss": 0.9487, + "step": 19021 + }, + { + "epoch": 0.57, + "learning_rate": 2.0328502010316804e-06, + "loss": 1.103, + "step": 19022 + }, + { + "epoch": 0.57, + "learning_rate": 2.0326105794763224e-06, + "loss": 1.1336, + "step": 19023 + }, + { + "epoch": 0.57, + "learning_rate": 2.032370962370285e-06, + "loss": 1.1639, + "step": 19024 + }, + { + "epoch": 0.57, + "learning_rate": 2.032131349715851e-06, + "loss": 1.2335, + "step": 19025 + }, + { + "epoch": 0.57, + "learning_rate": 2.031891741515301e-06, + "loss": 1.157, + "step": 19026 + }, + { + "epoch": 0.57, + "learning_rate": 2.0316521377709176e-06, + "loss": 1.1507, + "step": 19027 + }, + { + "epoch": 0.57, + "learning_rate": 2.0314125384849794e-06, + "loss": 1.1196, + "step": 19028 + }, + { + "epoch": 0.57, + "learning_rate": 2.0311729436597674e-06, + "loss": 1.167, + "step": 19029 + }, + { + "epoch": 0.57, + "learning_rate": 2.0309333532975636e-06, + "loss": 1.1636, + "step": 19030 + }, + { + "epoch": 0.57, + "learning_rate": 2.030693767400648e-06, + "loss": 1.1904, + "step": 19031 + }, + { + "epoch": 0.57, + "learning_rate": 2.030454185971303e-06, + "loss": 1.2346, + "step": 19032 + }, + { + "epoch": 0.57, + "learning_rate": 2.030214609011807e-06, + "loss": 1.1287, + "step": 19033 + }, + { + "epoch": 0.57, + "learning_rate": 2.029975036524442e-06, + "loss": 1.077, + "step": 19034 + }, + { + "epoch": 0.57, + "learning_rate": 2.0297354685114878e-06, + "loss": 1.1824, + "step": 19035 + }, + { + "epoch": 0.57, + "learning_rate": 2.0294959049752265e-06, + "loss": 1.2335, + "step": 19036 + }, + { + "epoch": 0.57, + "learning_rate": 2.029256345917937e-06, + "loss": 1.1252, + "step": 19037 + }, + { + "epoch": 0.57, + "learning_rate": 2.0290167913419e-06, + "loss": 1.0311, + "step": 19038 + }, + { + "epoch": 0.57, + "learning_rate": 2.0287772412493964e-06, + "loss": 1.0079, + "step": 19039 + }, + { + "epoch": 0.57, + "learning_rate": 2.0285376956427076e-06, + "loss": 1.1166, + "step": 19040 + }, + { + "epoch": 0.57, + "learning_rate": 2.0282981545241122e-06, + "loss": 1.032, + "step": 19041 + }, + { + "epoch": 0.57, + "learning_rate": 2.0280586178958905e-06, + "loss": 1.0739, + "step": 19042 + }, + { + "epoch": 0.57, + "learning_rate": 2.0278190857603234e-06, + "loss": 1.0985, + "step": 19043 + }, + { + "epoch": 0.57, + "learning_rate": 2.0275795581196917e-06, + "loss": 1.0217, + "step": 19044 + }, + { + "epoch": 0.57, + "learning_rate": 2.0273400349762756e-06, + "loss": 1.1251, + "step": 19045 + }, + { + "epoch": 0.57, + "learning_rate": 2.0271005163323543e-06, + "loss": 1.1213, + "step": 19046 + }, + { + "epoch": 0.57, + "learning_rate": 2.0268610021902087e-06, + "loss": 1.2316, + "step": 19047 + }, + { + "epoch": 0.57, + "learning_rate": 2.0266214925521175e-06, + "loss": 1.04, + "step": 19048 + }, + { + "epoch": 0.57, + "learning_rate": 2.0263819874203627e-06, + "loss": 1.2775, + "step": 19049 + }, + { + "epoch": 0.57, + "learning_rate": 2.0261424867972225e-06, + "loss": 0.9562, + "step": 19050 + }, + { + "epoch": 0.57, + "learning_rate": 2.025902990684978e-06, + "loss": 1.1459, + "step": 19051 + }, + { + "epoch": 0.57, + "learning_rate": 2.0256634990859084e-06, + "loss": 1.0688, + "step": 19052 + }, + { + "epoch": 0.57, + "learning_rate": 2.025424012002295e-06, + "loss": 1.0933, + "step": 19053 + }, + { + "epoch": 0.57, + "learning_rate": 2.0251845294364153e-06, + "loss": 1.0485, + "step": 19054 + }, + { + "epoch": 0.57, + "learning_rate": 2.0249450513905503e-06, + "loss": 1.1295, + "step": 19055 + }, + { + "epoch": 0.57, + "learning_rate": 2.02470557786698e-06, + "loss": 1.0942, + "step": 19056 + }, + { + "epoch": 0.57, + "learning_rate": 2.0244661088679828e-06, + "loss": 1.1894, + "step": 19057 + }, + { + "epoch": 0.57, + "learning_rate": 2.0242266443958406e-06, + "loss": 1.1822, + "step": 19058 + }, + { + "epoch": 0.57, + "learning_rate": 2.0239871844528307e-06, + "loss": 1.1255, + "step": 19059 + }, + { + "epoch": 0.57, + "learning_rate": 2.023747729041234e-06, + "loss": 1.1901, + "step": 19060 + }, + { + "epoch": 0.57, + "learning_rate": 2.0235082781633286e-06, + "loss": 1.2617, + "step": 19061 + }, + { + "epoch": 0.57, + "learning_rate": 2.023268831821396e-06, + "loss": 1.0411, + "step": 19062 + }, + { + "epoch": 0.57, + "learning_rate": 2.023029390017714e-06, + "loss": 1.1458, + "step": 19063 + }, + { + "epoch": 0.57, + "learning_rate": 2.0227899527545623e-06, + "loss": 1.2105, + "step": 19064 + }, + { + "epoch": 0.57, + "learning_rate": 2.0225505200342206e-06, + "loss": 1.1465, + "step": 19065 + }, + { + "epoch": 0.57, + "learning_rate": 2.0223110918589687e-06, + "loss": 1.0302, + "step": 19066 + }, + { + "epoch": 0.57, + "learning_rate": 2.022071668231085e-06, + "loss": 1.1502, + "step": 19067 + }, + { + "epoch": 0.57, + "learning_rate": 2.0218322491528478e-06, + "loss": 1.0882, + "step": 19068 + }, + { + "epoch": 0.57, + "learning_rate": 2.021592834626538e-06, + "loss": 1.1974, + "step": 19069 + }, + { + "epoch": 0.57, + "learning_rate": 2.021353424654433e-06, + "loss": 1.1443, + "step": 19070 + }, + { + "epoch": 0.57, + "learning_rate": 2.021114019238815e-06, + "loss": 1.1513, + "step": 19071 + }, + { + "epoch": 0.57, + "learning_rate": 2.0208746183819594e-06, + "loss": 0.9953, + "step": 19072 + }, + { + "epoch": 0.57, + "learning_rate": 2.020635222086147e-06, + "loss": 0.9911, + "step": 19073 + }, + { + "epoch": 0.57, + "learning_rate": 2.0203958303536562e-06, + "loss": 1.157, + "step": 19074 + }, + { + "epoch": 0.57, + "learning_rate": 2.0201564431867663e-06, + "loss": 1.1667, + "step": 19075 + }, + { + "epoch": 0.57, + "learning_rate": 2.0199170605877557e-06, + "loss": 1.2239, + "step": 19076 + }, + { + "epoch": 0.57, + "learning_rate": 2.0196776825589037e-06, + "loss": 1.0728, + "step": 19077 + }, + { + "epoch": 0.57, + "learning_rate": 2.0194383091024885e-06, + "loss": 1.105, + "step": 19078 + }, + { + "epoch": 0.57, + "learning_rate": 2.01919894022079e-06, + "loss": 1.0795, + "step": 19079 + }, + { + "epoch": 0.57, + "learning_rate": 2.0189595759160857e-06, + "loss": 1.1118, + "step": 19080 + }, + { + "epoch": 0.57, + "learning_rate": 2.0187202161906543e-06, + "loss": 1.22, + "step": 19081 + }, + { + "epoch": 0.57, + "learning_rate": 2.018480861046774e-06, + "loss": 1.1818, + "step": 19082 + }, + { + "epoch": 0.57, + "learning_rate": 2.0182415104867246e-06, + "loss": 1.022, + "step": 19083 + }, + { + "epoch": 0.57, + "learning_rate": 2.0180021645127855e-06, + "loss": 1.0918, + "step": 19084 + }, + { + "epoch": 0.57, + "learning_rate": 2.017762823127232e-06, + "loss": 1.0288, + "step": 19085 + }, + { + "epoch": 0.57, + "learning_rate": 2.017523486332344e-06, + "loss": 1.0913, + "step": 19086 + }, + { + "epoch": 0.57, + "learning_rate": 2.0172841541304004e-06, + "loss": 1.196, + "step": 19087 + }, + { + "epoch": 0.58, + "learning_rate": 2.0170448265236795e-06, + "loss": 1.141, + "step": 19088 + }, + { + "epoch": 0.58, + "learning_rate": 2.0168055035144587e-06, + "loss": 1.1917, + "step": 19089 + }, + { + "epoch": 0.58, + "learning_rate": 2.0165661851050168e-06, + "loss": 1.1063, + "step": 19090 + }, + { + "epoch": 0.58, + "learning_rate": 2.0163268712976324e-06, + "loss": 1.1159, + "step": 19091 + }, + { + "epoch": 0.58, + "learning_rate": 2.016087562094584e-06, + "loss": 1.3617, + "step": 19092 + }, + { + "epoch": 0.58, + "learning_rate": 2.015848257498148e-06, + "loss": 1.2057, + "step": 19093 + }, + { + "epoch": 0.58, + "learning_rate": 2.015608957510603e-06, + "loss": 1.0914, + "step": 19094 + }, + { + "epoch": 0.58, + "learning_rate": 2.0153696621342277e-06, + "loss": 1.0963, + "step": 19095 + }, + { + "epoch": 0.58, + "learning_rate": 2.0151303713713e-06, + "loss": 1.1005, + "step": 19096 + }, + { + "epoch": 0.58, + "learning_rate": 2.0148910852240984e-06, + "loss": 1.114, + "step": 19097 + }, + { + "epoch": 0.58, + "learning_rate": 2.014651803694899e-06, + "loss": 1.1111, + "step": 19098 + }, + { + "epoch": 0.58, + "learning_rate": 2.014412526785981e-06, + "loss": 1.1217, + "step": 19099 + }, + { + "epoch": 0.58, + "learning_rate": 2.0141732544996214e-06, + "loss": 1.1486, + "step": 19100 + }, + { + "epoch": 0.58, + "learning_rate": 2.0139339868380994e-06, + "loss": 1.1682, + "step": 19101 + }, + { + "epoch": 0.58, + "learning_rate": 2.0136947238036906e-06, + "loss": 1.1558, + "step": 19102 + }, + { + "epoch": 0.58, + "learning_rate": 2.0134554653986747e-06, + "loss": 1.0338, + "step": 19103 + }, + { + "epoch": 0.58, + "learning_rate": 2.0132162116253277e-06, + "loss": 1.2238, + "step": 19104 + }, + { + "epoch": 0.58, + "learning_rate": 2.0129769624859298e-06, + "loss": 1.181, + "step": 19105 + }, + { + "epoch": 0.58, + "learning_rate": 2.012737717982755e-06, + "loss": 0.9578, + "step": 19106 + }, + { + "epoch": 0.58, + "learning_rate": 2.0124984781180823e-06, + "loss": 1.1204, + "step": 19107 + }, + { + "epoch": 0.58, + "learning_rate": 2.0122592428941893e-06, + "loss": 1.1343, + "step": 19108 + }, + { + "epoch": 0.58, + "learning_rate": 2.0120200123133536e-06, + "loss": 1.0775, + "step": 19109 + }, + { + "epoch": 0.58, + "learning_rate": 2.0117807863778537e-06, + "loss": 1.0162, + "step": 19110 + }, + { + "epoch": 0.58, + "learning_rate": 2.0115415650899643e-06, + "loss": 1.0391, + "step": 19111 + }, + { + "epoch": 0.58, + "learning_rate": 2.011302348451964e-06, + "loss": 1.1704, + "step": 19112 + }, + { + "epoch": 0.58, + "learning_rate": 2.0110631364661296e-06, + "loss": 1.1089, + "step": 19113 + }, + { + "epoch": 0.58, + "learning_rate": 2.01082392913474e-06, + "loss": 1.0563, + "step": 19114 + }, + { + "epoch": 0.58, + "learning_rate": 2.01058472646007e-06, + "loss": 1.0824, + "step": 19115 + }, + { + "epoch": 0.58, + "learning_rate": 2.010345528444397e-06, + "loss": 1.087, + "step": 19116 + }, + { + "epoch": 0.58, + "learning_rate": 2.0101063350899996e-06, + "loss": 1.1051, + "step": 19117 + }, + { + "epoch": 0.58, + "learning_rate": 2.009867146399155e-06, + "loss": 1.1301, + "step": 19118 + }, + { + "epoch": 0.58, + "learning_rate": 2.0096279623741376e-06, + "loss": 1.0259, + "step": 19119 + }, + { + "epoch": 0.58, + "learning_rate": 2.0093887830172264e-06, + "loss": 1.1165, + "step": 19120 + }, + { + "epoch": 0.58, + "learning_rate": 2.0091496083306972e-06, + "loss": 1.0084, + "step": 19121 + }, + { + "epoch": 0.58, + "learning_rate": 2.0089104383168288e-06, + "loss": 1.1052, + "step": 19122 + }, + { + "epoch": 0.58, + "learning_rate": 2.008671272977895e-06, + "loss": 1.2023, + "step": 19123 + }, + { + "epoch": 0.58, + "learning_rate": 2.0084321123161742e-06, + "loss": 1.0733, + "step": 19124 + }, + { + "epoch": 0.58, + "learning_rate": 2.008192956333943e-06, + "loss": 1.0165, + "step": 19125 + }, + { + "epoch": 0.58, + "learning_rate": 2.0079538050334783e-06, + "loss": 1.1847, + "step": 19126 + }, + { + "epoch": 0.58, + "learning_rate": 2.0077146584170565e-06, + "loss": 1.0522, + "step": 19127 + }, + { + "epoch": 0.58, + "learning_rate": 2.0074755164869537e-06, + "loss": 1.1061, + "step": 19128 + }, + { + "epoch": 0.58, + "learning_rate": 2.0072363792454472e-06, + "loss": 0.9749, + "step": 19129 + }, + { + "epoch": 0.58, + "learning_rate": 2.0069972466948126e-06, + "loss": 1.087, + "step": 19130 + }, + { + "epoch": 0.58, + "learning_rate": 2.006758118837327e-06, + "loss": 1.2848, + "step": 19131 + }, + { + "epoch": 0.58, + "learning_rate": 2.0065189956752667e-06, + "loss": 1.1411, + "step": 19132 + }, + { + "epoch": 0.58, + "learning_rate": 2.0062798772109073e-06, + "loss": 1.0288, + "step": 19133 + }, + { + "epoch": 0.58, + "learning_rate": 2.006040763446526e-06, + "loss": 1.1562, + "step": 19134 + }, + { + "epoch": 0.58, + "learning_rate": 2.0058016543844e-06, + "loss": 1.0878, + "step": 19135 + }, + { + "epoch": 0.58, + "learning_rate": 2.0055625500268025e-06, + "loss": 1.0611, + "step": 19136 + }, + { + "epoch": 0.58, + "learning_rate": 2.0053234503760117e-06, + "loss": 1.1069, + "step": 19137 + }, + { + "epoch": 0.58, + "learning_rate": 2.0050843554343036e-06, + "loss": 1.0157, + "step": 19138 + }, + { + "epoch": 0.58, + "learning_rate": 2.004845265203954e-06, + "loss": 1.054, + "step": 19139 + }, + { + "epoch": 0.58, + "learning_rate": 2.00460617968724e-06, + "loss": 1.0494, + "step": 19140 + }, + { + "epoch": 0.58, + "learning_rate": 2.0043670988864358e-06, + "loss": 1.0402, + "step": 19141 + }, + { + "epoch": 0.58, + "learning_rate": 2.0041280228038175e-06, + "loss": 1.1089, + "step": 19142 + }, + { + "epoch": 0.58, + "learning_rate": 2.003888951441662e-06, + "loss": 1.0332, + "step": 19143 + }, + { + "epoch": 0.58, + "learning_rate": 2.003649884802245e-06, + "loss": 1.3183, + "step": 19144 + }, + { + "epoch": 0.58, + "learning_rate": 2.003410822887842e-06, + "loss": 1.1197, + "step": 19145 + }, + { + "epoch": 0.58, + "learning_rate": 2.0031717657007284e-06, + "loss": 1.0045, + "step": 19146 + }, + { + "epoch": 0.58, + "learning_rate": 2.0029327132431805e-06, + "loss": 1.0927, + "step": 19147 + }, + { + "epoch": 0.58, + "learning_rate": 2.0026936655174746e-06, + "loss": 1.1553, + "step": 19148 + }, + { + "epoch": 0.58, + "learning_rate": 2.002454622525885e-06, + "loss": 1.201, + "step": 19149 + }, + { + "epoch": 0.58, + "learning_rate": 2.0022155842706874e-06, + "loss": 1.0943, + "step": 19150 + }, + { + "epoch": 0.58, + "learning_rate": 2.0019765507541574e-06, + "loss": 1.0335, + "step": 19151 + }, + { + "epoch": 0.58, + "learning_rate": 2.001737521978571e-06, + "loss": 1.0638, + "step": 19152 + }, + { + "epoch": 0.58, + "learning_rate": 2.0014984979462046e-06, + "loss": 1.067, + "step": 19153 + }, + { + "epoch": 0.58, + "learning_rate": 2.0012594786593313e-06, + "loss": 1.0734, + "step": 19154 + }, + { + "epoch": 0.58, + "learning_rate": 2.0010204641202275e-06, + "loss": 1.1334, + "step": 19155 + }, + { + "epoch": 0.58, + "learning_rate": 2.000781454331169e-06, + "loss": 1.0693, + "step": 19156 + }, + { + "epoch": 0.58, + "learning_rate": 2.0005424492944302e-06, + "loss": 1.0848, + "step": 19157 + }, + { + "epoch": 0.58, + "learning_rate": 2.000303449012287e-06, + "loss": 1.0087, + "step": 19158 + }, + { + "epoch": 0.58, + "learning_rate": 2.000064453487014e-06, + "loss": 1.1306, + "step": 19159 + }, + { + "epoch": 0.58, + "learning_rate": 1.999825462720887e-06, + "loss": 1.1162, + "step": 19160 + }, + { + "epoch": 0.58, + "learning_rate": 1.999586476716181e-06, + "loss": 1.2264, + "step": 19161 + }, + { + "epoch": 0.58, + "learning_rate": 1.9993474954751703e-06, + "loss": 1.264, + "step": 19162 + }, + { + "epoch": 0.58, + "learning_rate": 1.99910851900013e-06, + "loss": 1.0817, + "step": 19163 + }, + { + "epoch": 0.58, + "learning_rate": 1.9988695472933358e-06, + "loss": 1.0912, + "step": 19164 + }, + { + "epoch": 0.58, + "learning_rate": 1.998630580357062e-06, + "loss": 1.1539, + "step": 19165 + }, + { + "epoch": 0.58, + "learning_rate": 1.9983916181935844e-06, + "loss": 1.1728, + "step": 19166 + }, + { + "epoch": 0.58, + "learning_rate": 1.998152660805176e-06, + "loss": 1.09, + "step": 19167 + }, + { + "epoch": 0.58, + "learning_rate": 1.9979137081941126e-06, + "loss": 1.0897, + "step": 19168 + }, + { + "epoch": 0.58, + "learning_rate": 1.997674760362669e-06, + "loss": 1.0696, + "step": 19169 + }, + { + "epoch": 0.58, + "learning_rate": 1.9974358173131205e-06, + "loss": 1.178, + "step": 19170 + }, + { + "epoch": 0.58, + "learning_rate": 1.99719687904774e-06, + "loss": 1.1415, + "step": 19171 + }, + { + "epoch": 0.58, + "learning_rate": 1.9969579455688033e-06, + "loss": 1.0464, + "step": 19172 + }, + { + "epoch": 0.58, + "learning_rate": 1.9967190168785843e-06, + "loss": 1.1711, + "step": 19173 + }, + { + "epoch": 0.58, + "learning_rate": 1.9964800929793595e-06, + "loss": 1.0828, + "step": 19174 + }, + { + "epoch": 0.58, + "learning_rate": 1.9962411738734005e-06, + "loss": 1.2354, + "step": 19175 + }, + { + "epoch": 0.58, + "learning_rate": 1.996002259562983e-06, + "loss": 1.2506, + "step": 19176 + }, + { + "epoch": 0.58, + "learning_rate": 1.995763350050381e-06, + "loss": 1.1813, + "step": 19177 + }, + { + "epoch": 0.58, + "learning_rate": 1.995524445337869e-06, + "loss": 1.217, + "step": 19178 + }, + { + "epoch": 0.58, + "learning_rate": 1.995285545427722e-06, + "loss": 1.0772, + "step": 19179 + }, + { + "epoch": 0.58, + "learning_rate": 1.9950466503222134e-06, + "loss": 1.1161, + "step": 19180 + }, + { + "epoch": 0.58, + "learning_rate": 1.994807760023617e-06, + "loss": 1.2218, + "step": 19181 + }, + { + "epoch": 0.58, + "learning_rate": 1.9945688745342075e-06, + "loss": 1.0626, + "step": 19182 + }, + { + "epoch": 0.58, + "learning_rate": 1.9943299938562592e-06, + "loss": 1.1035, + "step": 19183 + }, + { + "epoch": 0.58, + "learning_rate": 1.994091117992046e-06, + "loss": 1.0557, + "step": 19184 + }, + { + "epoch": 0.58, + "learning_rate": 1.993852246943841e-06, + "loss": 1.186, + "step": 19185 + }, + { + "epoch": 0.58, + "learning_rate": 1.993613380713919e-06, + "loss": 1.1887, + "step": 19186 + }, + { + "epoch": 0.58, + "learning_rate": 1.9933745193045548e-06, + "loss": 1.224, + "step": 19187 + }, + { + "epoch": 0.58, + "learning_rate": 1.99313566271802e-06, + "loss": 1.2134, + "step": 19188 + }, + { + "epoch": 0.58, + "learning_rate": 1.99289681095659e-06, + "loss": 1.2327, + "step": 19189 + }, + { + "epoch": 0.58, + "learning_rate": 1.992657964022538e-06, + "loss": 1.1564, + "step": 19190 + }, + { + "epoch": 0.58, + "learning_rate": 1.992419121918137e-06, + "loss": 1.1627, + "step": 19191 + }, + { + "epoch": 0.58, + "learning_rate": 1.992180284645664e-06, + "loss": 1.0706, + "step": 19192 + }, + { + "epoch": 0.58, + "learning_rate": 1.991941452207388e-06, + "loss": 1.2129, + "step": 19193 + }, + { + "epoch": 0.58, + "learning_rate": 1.9917026246055846e-06, + "loss": 1.0811, + "step": 19194 + }, + { + "epoch": 0.58, + "learning_rate": 1.991463801842528e-06, + "loss": 1.1755, + "step": 19195 + }, + { + "epoch": 0.58, + "learning_rate": 1.9912249839204912e-06, + "loss": 1.1648, + "step": 19196 + }, + { + "epoch": 0.58, + "learning_rate": 1.9909861708417476e-06, + "loss": 1.0927, + "step": 19197 + }, + { + "epoch": 0.58, + "learning_rate": 1.99074736260857e-06, + "loss": 1.1473, + "step": 19198 + }, + { + "epoch": 0.58, + "learning_rate": 1.9905085592232322e-06, + "loss": 1.0124, + "step": 19199 + }, + { + "epoch": 0.58, + "learning_rate": 1.990269760688009e-06, + "loss": 1.1304, + "step": 19200 + }, + { + "epoch": 0.58, + "learning_rate": 1.9900309670051705e-06, + "loss": 1.0781, + "step": 19201 + }, + { + "epoch": 0.58, + "learning_rate": 1.989792178176992e-06, + "loss": 1.1414, + "step": 19202 + }, + { + "epoch": 0.58, + "learning_rate": 1.989553394205746e-06, + "loss": 1.1399, + "step": 19203 + }, + { + "epoch": 0.58, + "learning_rate": 1.9893146150937063e-06, + "loss": 1.0226, + "step": 19204 + }, + { + "epoch": 0.58, + "learning_rate": 1.9890758408431465e-06, + "loss": 1.037, + "step": 19205 + }, + { + "epoch": 0.58, + "learning_rate": 1.9888370714563375e-06, + "loss": 1.2209, + "step": 19206 + }, + { + "epoch": 0.58, + "learning_rate": 1.988598306935553e-06, + "loss": 1.1451, + "step": 19207 + }, + { + "epoch": 0.58, + "learning_rate": 1.9883595472830668e-06, + "loss": 1.1203, + "step": 19208 + }, + { + "epoch": 0.58, + "learning_rate": 1.9881207925011514e-06, + "loss": 1.1616, + "step": 19209 + }, + { + "epoch": 0.58, + "learning_rate": 1.9878820425920793e-06, + "loss": 1.038, + "step": 19210 + }, + { + "epoch": 0.58, + "learning_rate": 1.987643297558124e-06, + "loss": 1.2908, + "step": 19211 + }, + { + "epoch": 0.58, + "learning_rate": 1.9874045574015573e-06, + "loss": 1.1122, + "step": 19212 + }, + { + "epoch": 0.58, + "learning_rate": 1.9871658221246524e-06, + "loss": 0.9954, + "step": 19213 + }, + { + "epoch": 0.58, + "learning_rate": 1.9869270917296817e-06, + "loss": 1.1641, + "step": 19214 + }, + { + "epoch": 0.58, + "learning_rate": 1.986688366218918e-06, + "loss": 1.1011, + "step": 19215 + }, + { + "epoch": 0.58, + "learning_rate": 1.986449645594634e-06, + "loss": 1.0773, + "step": 19216 + }, + { + "epoch": 0.58, + "learning_rate": 1.9862109298591018e-06, + "loss": 1.3063, + "step": 19217 + }, + { + "epoch": 0.58, + "learning_rate": 1.985972219014595e-06, + "loss": 1.0861, + "step": 19218 + }, + { + "epoch": 0.58, + "learning_rate": 1.985733513063384e-06, + "loss": 1.0589, + "step": 19219 + }, + { + "epoch": 0.58, + "learning_rate": 1.985494812007743e-06, + "loss": 1.087, + "step": 19220 + }, + { + "epoch": 0.58, + "learning_rate": 1.985256115849943e-06, + "loss": 1.1694, + "step": 19221 + }, + { + "epoch": 0.58, + "learning_rate": 1.9850174245922583e-06, + "loss": 1.0133, + "step": 19222 + }, + { + "epoch": 0.58, + "learning_rate": 1.984778738236958e-06, + "loss": 1.1085, + "step": 19223 + }, + { + "epoch": 0.58, + "learning_rate": 1.9845400567863166e-06, + "loss": 1.0986, + "step": 19224 + }, + { + "epoch": 0.58, + "learning_rate": 1.984301380242605e-06, + "loss": 1.1525, + "step": 19225 + }, + { + "epoch": 0.58, + "learning_rate": 1.9840627086080973e-06, + "loss": 1.1557, + "step": 19226 + }, + { + "epoch": 0.58, + "learning_rate": 1.983824041885063e-06, + "loss": 1.1131, + "step": 19227 + }, + { + "epoch": 0.58, + "learning_rate": 1.983585380075775e-06, + "loss": 1.0661, + "step": 19228 + }, + { + "epoch": 0.58, + "learning_rate": 1.983346723182506e-06, + "loss": 1.0975, + "step": 19229 + }, + { + "epoch": 0.58, + "learning_rate": 1.983108071207527e-06, + "loss": 1.1304, + "step": 19230 + }, + { + "epoch": 0.58, + "learning_rate": 1.9828694241531115e-06, + "loss": 1.0729, + "step": 19231 + }, + { + "epoch": 0.58, + "learning_rate": 1.982630782021529e-06, + "loss": 1.1505, + "step": 19232 + }, + { + "epoch": 0.58, + "learning_rate": 1.982392144815052e-06, + "loss": 1.1548, + "step": 19233 + }, + { + "epoch": 0.58, + "learning_rate": 1.9821535125359527e-06, + "loss": 1.1168, + "step": 19234 + }, + { + "epoch": 0.58, + "learning_rate": 1.9819148851865037e-06, + "loss": 1.1077, + "step": 19235 + }, + { + "epoch": 0.58, + "learning_rate": 1.9816762627689743e-06, + "loss": 1.1315, + "step": 19236 + }, + { + "epoch": 0.58, + "learning_rate": 1.981437645285637e-06, + "loss": 1.2462, + "step": 19237 + }, + { + "epoch": 0.58, + "learning_rate": 1.981199032738764e-06, + "loss": 1.2123, + "step": 19238 + }, + { + "epoch": 0.58, + "learning_rate": 1.9809604251306265e-06, + "loss": 1.1223, + "step": 19239 + }, + { + "epoch": 0.58, + "learning_rate": 1.9807218224634957e-06, + "loss": 1.1414, + "step": 19240 + }, + { + "epoch": 0.58, + "learning_rate": 1.9804832247396428e-06, + "loss": 1.0997, + "step": 19241 + }, + { + "epoch": 0.58, + "learning_rate": 1.9802446319613395e-06, + "loss": 1.0663, + "step": 19242 + }, + { + "epoch": 0.58, + "learning_rate": 1.9800060441308564e-06, + "loss": 1.0701, + "step": 19243 + }, + { + "epoch": 0.58, + "learning_rate": 1.979767461250467e-06, + "loss": 1.1888, + "step": 19244 + }, + { + "epoch": 0.58, + "learning_rate": 1.9795288833224397e-06, + "loss": 1.1038, + "step": 19245 + }, + { + "epoch": 0.58, + "learning_rate": 1.9792903103490467e-06, + "loss": 1.0555, + "step": 19246 + }, + { + "epoch": 0.58, + "learning_rate": 1.979051742332559e-06, + "loss": 1.0477, + "step": 19247 + }, + { + "epoch": 0.58, + "learning_rate": 1.978813179275249e-06, + "loss": 1.1994, + "step": 19248 + }, + { + "epoch": 0.58, + "learning_rate": 1.9785746211793856e-06, + "loss": 1.0889, + "step": 19249 + }, + { + "epoch": 0.58, + "learning_rate": 1.9783360680472405e-06, + "loss": 1.1715, + "step": 19250 + }, + { + "epoch": 0.58, + "learning_rate": 1.9780975198810847e-06, + "loss": 1.1231, + "step": 19251 + }, + { + "epoch": 0.58, + "learning_rate": 1.97785897668319e-06, + "loss": 1.1298, + "step": 19252 + }, + { + "epoch": 0.58, + "learning_rate": 1.9776204384558254e-06, + "loss": 1.0608, + "step": 19253 + }, + { + "epoch": 0.58, + "learning_rate": 1.977381905201263e-06, + "loss": 1.0604, + "step": 19254 + }, + { + "epoch": 0.58, + "learning_rate": 1.977143376921773e-06, + "loss": 1.2618, + "step": 19255 + }, + { + "epoch": 0.58, + "learning_rate": 1.9769048536196264e-06, + "loss": 1.1973, + "step": 19256 + }, + { + "epoch": 0.58, + "learning_rate": 1.9766663352970947e-06, + "loss": 1.1677, + "step": 19257 + }, + { + "epoch": 0.58, + "learning_rate": 1.976427821956446e-06, + "loss": 1.2311, + "step": 19258 + }, + { + "epoch": 0.58, + "learning_rate": 1.9761893135999525e-06, + "loss": 1.1167, + "step": 19259 + }, + { + "epoch": 0.58, + "learning_rate": 1.9759508102298846e-06, + "loss": 1.2598, + "step": 19260 + }, + { + "epoch": 0.58, + "learning_rate": 1.975712311848514e-06, + "loss": 1.19, + "step": 19261 + }, + { + "epoch": 0.58, + "learning_rate": 1.975473818458108e-06, + "loss": 1.2242, + "step": 19262 + }, + { + "epoch": 0.58, + "learning_rate": 1.9752353300609387e-06, + "loss": 1.2037, + "step": 19263 + }, + { + "epoch": 0.58, + "learning_rate": 1.9749968466592766e-06, + "loss": 1.1019, + "step": 19264 + }, + { + "epoch": 0.58, + "learning_rate": 1.974758368255392e-06, + "loss": 1.0045, + "step": 19265 + }, + { + "epoch": 0.58, + "learning_rate": 1.9745198948515543e-06, + "loss": 1.1835, + "step": 19266 + }, + { + "epoch": 0.58, + "learning_rate": 1.974281426450034e-06, + "loss": 1.1226, + "step": 19267 + }, + { + "epoch": 0.58, + "learning_rate": 1.9740429630531015e-06, + "loss": 1.169, + "step": 19268 + }, + { + "epoch": 0.58, + "learning_rate": 1.9738045046630268e-06, + "loss": 1.1434, + "step": 19269 + }, + { + "epoch": 0.58, + "learning_rate": 1.9735660512820804e-06, + "loss": 1.0993, + "step": 19270 + }, + { + "epoch": 0.58, + "learning_rate": 1.973327602912531e-06, + "loss": 1.0832, + "step": 19271 + }, + { + "epoch": 0.58, + "learning_rate": 1.9730891595566493e-06, + "loss": 1.156, + "step": 19272 + }, + { + "epoch": 0.58, + "learning_rate": 1.9728507212167045e-06, + "loss": 1.0635, + "step": 19273 + }, + { + "epoch": 0.58, + "learning_rate": 1.9726122878949684e-06, + "loss": 1.1046, + "step": 19274 + }, + { + "epoch": 0.58, + "learning_rate": 1.972373859593708e-06, + "loss": 1.0556, + "step": 19275 + }, + { + "epoch": 0.58, + "learning_rate": 1.9721354363151944e-06, + "loss": 1.1487, + "step": 19276 + }, + { + "epoch": 0.58, + "learning_rate": 1.9718970180616976e-06, + "loss": 1.0269, + "step": 19277 + }, + { + "epoch": 0.58, + "learning_rate": 1.971658604835487e-06, + "loss": 1.1036, + "step": 19278 + }, + { + "epoch": 0.58, + "learning_rate": 1.9714201966388317e-06, + "loss": 1.0652, + "step": 19279 + }, + { + "epoch": 0.58, + "learning_rate": 1.971181793474001e-06, + "loss": 1.1787, + "step": 19280 + }, + { + "epoch": 0.58, + "learning_rate": 1.9709433953432656e-06, + "loss": 1.1769, + "step": 19281 + }, + { + "epoch": 0.58, + "learning_rate": 1.970705002248894e-06, + "loss": 1.1165, + "step": 19282 + }, + { + "epoch": 0.58, + "learning_rate": 1.970466614193157e-06, + "loss": 1.0338, + "step": 19283 + }, + { + "epoch": 0.58, + "learning_rate": 1.9702282311783214e-06, + "loss": 1.0352, + "step": 19284 + }, + { + "epoch": 0.58, + "learning_rate": 1.9699898532066584e-06, + "loss": 1.2336, + "step": 19285 + }, + { + "epoch": 0.58, + "learning_rate": 1.9697514802804365e-06, + "loss": 1.0544, + "step": 19286 + }, + { + "epoch": 0.58, + "learning_rate": 1.969513112401926e-06, + "loss": 1.0859, + "step": 19287 + }, + { + "epoch": 0.58, + "learning_rate": 1.969274749573395e-06, + "loss": 1.1617, + "step": 19288 + }, + { + "epoch": 0.58, + "learning_rate": 1.969036391797112e-06, + "loss": 1.1258, + "step": 19289 + }, + { + "epoch": 0.58, + "learning_rate": 1.968798039075347e-06, + "loss": 1.1371, + "step": 19290 + }, + { + "epoch": 0.58, + "learning_rate": 1.968559691410369e-06, + "loss": 1.2101, + "step": 19291 + }, + { + "epoch": 0.58, + "learning_rate": 1.968321348804447e-06, + "loss": 1.3052, + "step": 19292 + }, + { + "epoch": 0.58, + "learning_rate": 1.9680830112598487e-06, + "loss": 1.1831, + "step": 19293 + }, + { + "epoch": 0.58, + "learning_rate": 1.967844678778845e-06, + "loss": 1.0886, + "step": 19294 + }, + { + "epoch": 0.58, + "learning_rate": 1.9676063513637035e-06, + "loss": 1.0647, + "step": 19295 + }, + { + "epoch": 0.58, + "learning_rate": 1.9673680290166933e-06, + "loss": 1.0784, + "step": 19296 + }, + { + "epoch": 0.58, + "learning_rate": 1.9671297117400824e-06, + "loss": 1.1127, + "step": 19297 + }, + { + "epoch": 0.58, + "learning_rate": 1.96689139953614e-06, + "loss": 1.2389, + "step": 19298 + }, + { + "epoch": 0.58, + "learning_rate": 1.9666530924071347e-06, + "loss": 1.1919, + "step": 19299 + }, + { + "epoch": 0.58, + "learning_rate": 1.9664147903553363e-06, + "loss": 1.0532, + "step": 19300 + }, + { + "epoch": 0.58, + "learning_rate": 1.966176493383011e-06, + "loss": 1.1436, + "step": 19301 + }, + { + "epoch": 0.58, + "learning_rate": 1.965938201492428e-06, + "loss": 1.1013, + "step": 19302 + }, + { + "epoch": 0.58, + "learning_rate": 1.965699914685857e-06, + "loss": 0.8794, + "step": 19303 + }, + { + "epoch": 0.58, + "learning_rate": 1.9654616329655653e-06, + "loss": 1.1348, + "step": 19304 + }, + { + "epoch": 0.58, + "learning_rate": 1.9652233563338215e-06, + "loss": 1.1776, + "step": 19305 + }, + { + "epoch": 0.58, + "learning_rate": 1.9649850847928935e-06, + "loss": 1.2546, + "step": 19306 + }, + { + "epoch": 0.58, + "learning_rate": 1.9647468183450497e-06, + "loss": 1.1332, + "step": 19307 + }, + { + "epoch": 0.58, + "learning_rate": 1.964508556992559e-06, + "loss": 1.1614, + "step": 19308 + }, + { + "epoch": 0.58, + "learning_rate": 1.964270300737688e-06, + "loss": 1.1113, + "step": 19309 + }, + { + "epoch": 0.58, + "learning_rate": 1.964032049582706e-06, + "loss": 1.1308, + "step": 19310 + }, + { + "epoch": 0.58, + "learning_rate": 1.9637938035298807e-06, + "loss": 1.1961, + "step": 19311 + }, + { + "epoch": 0.58, + "learning_rate": 1.96355556258148e-06, + "loss": 1.1263, + "step": 19312 + }, + { + "epoch": 0.58, + "learning_rate": 1.963317326739774e-06, + "loss": 1.1216, + "step": 19313 + }, + { + "epoch": 0.58, + "learning_rate": 1.9630790960070264e-06, + "loss": 1.0757, + "step": 19314 + }, + { + "epoch": 0.58, + "learning_rate": 1.9628408703855075e-06, + "loss": 1.102, + "step": 19315 + }, + { + "epoch": 0.58, + "learning_rate": 1.962602649877485e-06, + "loss": 1.1332, + "step": 19316 + }, + { + "epoch": 0.58, + "learning_rate": 1.9623644344852275e-06, + "loss": 1.0817, + "step": 19317 + }, + { + "epoch": 0.58, + "learning_rate": 1.9621262242110006e-06, + "loss": 1.1143, + "step": 19318 + }, + { + "epoch": 0.58, + "learning_rate": 1.9618880190570727e-06, + "loss": 1.0975, + "step": 19319 + }, + { + "epoch": 0.58, + "learning_rate": 1.961649819025712e-06, + "loss": 1.1751, + "step": 19320 + }, + { + "epoch": 0.58, + "learning_rate": 1.9614116241191862e-06, + "loss": 1.0565, + "step": 19321 + }, + { + "epoch": 0.58, + "learning_rate": 1.961173434339762e-06, + "loss": 1.108, + "step": 19322 + }, + { + "epoch": 0.58, + "learning_rate": 1.9609352496897067e-06, + "loss": 1.0588, + "step": 19323 + }, + { + "epoch": 0.58, + "learning_rate": 1.9606970701712886e-06, + "loss": 1.1664, + "step": 19324 + }, + { + "epoch": 0.58, + "learning_rate": 1.9604588957867744e-06, + "loss": 1.117, + "step": 19325 + }, + { + "epoch": 0.58, + "learning_rate": 1.9602207265384333e-06, + "loss": 1.0696, + "step": 19326 + }, + { + "epoch": 0.58, + "learning_rate": 1.959982562428529e-06, + "loss": 1.1782, + "step": 19327 + }, + { + "epoch": 0.58, + "learning_rate": 1.9597444034593314e-06, + "loss": 1.0157, + "step": 19328 + }, + { + "epoch": 0.58, + "learning_rate": 1.9595062496331065e-06, + "loss": 1.1954, + "step": 19329 + }, + { + "epoch": 0.58, + "learning_rate": 1.959268100952123e-06, + "loss": 1.2408, + "step": 19330 + }, + { + "epoch": 0.58, + "learning_rate": 1.959029957418645e-06, + "loss": 1.1799, + "step": 19331 + }, + { + "epoch": 0.58, + "learning_rate": 1.958791819034942e-06, + "loss": 1.1145, + "step": 19332 + }, + { + "epoch": 0.58, + "learning_rate": 1.95855368580328e-06, + "loss": 1.2191, + "step": 19333 + }, + { + "epoch": 0.58, + "learning_rate": 1.958315557725927e-06, + "loss": 1.058, + "step": 19334 + }, + { + "epoch": 0.58, + "learning_rate": 1.958077434805148e-06, + "loss": 1.1249, + "step": 19335 + }, + { + "epoch": 0.58, + "learning_rate": 1.9578393170432113e-06, + "loss": 1.1053, + "step": 19336 + }, + { + "epoch": 0.58, + "learning_rate": 1.9576012044423827e-06, + "loss": 1.1327, + "step": 19337 + }, + { + "epoch": 0.58, + "learning_rate": 1.9573630970049297e-06, + "loss": 1.1489, + "step": 19338 + }, + { + "epoch": 0.58, + "learning_rate": 1.95712499473312e-06, + "loss": 1.0358, + "step": 19339 + }, + { + "epoch": 0.58, + "learning_rate": 1.9568868976292172e-06, + "loss": 0.9841, + "step": 19340 + }, + { + "epoch": 0.58, + "learning_rate": 1.95664880569549e-06, + "loss": 1.0469, + "step": 19341 + }, + { + "epoch": 0.58, + "learning_rate": 1.9564107189342042e-06, + "loss": 1.1678, + "step": 19342 + }, + { + "epoch": 0.58, + "learning_rate": 1.956172637347628e-06, + "loss": 1.1382, + "step": 19343 + }, + { + "epoch": 0.58, + "learning_rate": 1.9559345609380252e-06, + "loss": 1.0612, + "step": 19344 + }, + { + "epoch": 0.58, + "learning_rate": 1.955696489707663e-06, + "loss": 1.0842, + "step": 19345 + }, + { + "epoch": 0.58, + "learning_rate": 1.9554584236588085e-06, + "loss": 1.1193, + "step": 19346 + }, + { + "epoch": 0.58, + "learning_rate": 1.9552203627937278e-06, + "loss": 1.0198, + "step": 19347 + }, + { + "epoch": 0.58, + "learning_rate": 1.9549823071146864e-06, + "loss": 0.9966, + "step": 19348 + }, + { + "epoch": 0.58, + "learning_rate": 1.954744256623951e-06, + "loss": 1.0408, + "step": 19349 + }, + { + "epoch": 0.58, + "learning_rate": 1.9545062113237875e-06, + "loss": 1.1708, + "step": 19350 + }, + { + "epoch": 0.58, + "learning_rate": 1.9542681712164626e-06, + "loss": 1.1335, + "step": 19351 + }, + { + "epoch": 0.58, + "learning_rate": 1.9540301363042423e-06, + "loss": 1.1194, + "step": 19352 + }, + { + "epoch": 0.58, + "learning_rate": 1.9537921065893916e-06, + "loss": 1.1095, + "step": 19353 + }, + { + "epoch": 0.58, + "learning_rate": 1.9535540820741767e-06, + "loss": 1.1451, + "step": 19354 + }, + { + "epoch": 0.58, + "learning_rate": 1.953316062760864e-06, + "loss": 1.1652, + "step": 19355 + }, + { + "epoch": 0.58, + "learning_rate": 1.95307804865172e-06, + "loss": 1.0046, + "step": 19356 + }, + { + "epoch": 0.58, + "learning_rate": 1.952840039749008e-06, + "loss": 1.0561, + "step": 19357 + }, + { + "epoch": 0.58, + "learning_rate": 1.9526020360549965e-06, + "loss": 1.0651, + "step": 19358 + }, + { + "epoch": 0.58, + "learning_rate": 1.9523640375719493e-06, + "loss": 1.0875, + "step": 19359 + }, + { + "epoch": 0.58, + "learning_rate": 1.9521260443021328e-06, + "loss": 1.2121, + "step": 19360 + }, + { + "epoch": 0.58, + "learning_rate": 1.951888056247813e-06, + "loss": 1.181, + "step": 19361 + }, + { + "epoch": 0.58, + "learning_rate": 1.951650073411254e-06, + "loss": 1.0995, + "step": 19362 + }, + { + "epoch": 0.58, + "learning_rate": 1.9514120957947223e-06, + "loss": 1.1238, + "step": 19363 + }, + { + "epoch": 0.58, + "learning_rate": 1.9511741234004834e-06, + "loss": 1.147, + "step": 19364 + }, + { + "epoch": 0.58, + "learning_rate": 1.950936156230804e-06, + "loss": 1.1674, + "step": 19365 + }, + { + "epoch": 0.58, + "learning_rate": 1.9506981942879466e-06, + "loss": 1.1227, + "step": 19366 + }, + { + "epoch": 0.58, + "learning_rate": 1.9504602375741777e-06, + "loss": 1.2324, + "step": 19367 + }, + { + "epoch": 0.58, + "learning_rate": 1.9502222860917626e-06, + "loss": 1.1616, + "step": 19368 + }, + { + "epoch": 0.58, + "learning_rate": 1.949984339842968e-06, + "loss": 1.0823, + "step": 19369 + }, + { + "epoch": 0.58, + "learning_rate": 1.9497463988300564e-06, + "loss": 1.1657, + "step": 19370 + }, + { + "epoch": 0.58, + "learning_rate": 1.949508463055294e-06, + "loss": 1.0966, + "step": 19371 + }, + { + "epoch": 0.58, + "learning_rate": 1.9492705325209455e-06, + "loss": 1.0773, + "step": 19372 + }, + { + "epoch": 0.58, + "learning_rate": 1.949032607229277e-06, + "loss": 1.1791, + "step": 19373 + }, + { + "epoch": 0.58, + "learning_rate": 1.9487946871825527e-06, + "loss": 1.0186, + "step": 19374 + }, + { + "epoch": 0.58, + "learning_rate": 1.9485567723830374e-06, + "loss": 1.0441, + "step": 19375 + }, + { + "epoch": 0.58, + "learning_rate": 1.9483188628329964e-06, + "loss": 1.1705, + "step": 19376 + }, + { + "epoch": 0.58, + "learning_rate": 1.9480809585346936e-06, + "loss": 1.0703, + "step": 19377 + }, + { + "epoch": 0.58, + "learning_rate": 1.9478430594903946e-06, + "loss": 1.1722, + "step": 19378 + }, + { + "epoch": 0.58, + "learning_rate": 1.9476051657023633e-06, + "loss": 1.0646, + "step": 19379 + }, + { + "epoch": 0.58, + "learning_rate": 1.947367277172865e-06, + "loss": 1.1785, + "step": 19380 + }, + { + "epoch": 0.58, + "learning_rate": 1.947129393904164e-06, + "loss": 1.1119, + "step": 19381 + }, + { + "epoch": 0.58, + "learning_rate": 1.946891515898526e-06, + "loss": 1.0492, + "step": 19382 + }, + { + "epoch": 0.58, + "learning_rate": 1.946653643158213e-06, + "loss": 1.151, + "step": 19383 + }, + { + "epoch": 0.58, + "learning_rate": 1.946415775685491e-06, + "loss": 0.9944, + "step": 19384 + }, + { + "epoch": 0.58, + "learning_rate": 1.946177913482624e-06, + "loss": 1.1252, + "step": 19385 + }, + { + "epoch": 0.58, + "learning_rate": 1.945940056551878e-06, + "loss": 1.0756, + "step": 19386 + }, + { + "epoch": 0.58, + "learning_rate": 1.945702204895515e-06, + "loss": 1.1226, + "step": 19387 + }, + { + "epoch": 0.58, + "learning_rate": 1.9454643585157994e-06, + "loss": 1.1027, + "step": 19388 + }, + { + "epoch": 0.58, + "learning_rate": 1.945226517414996e-06, + "loss": 1.0614, + "step": 19389 + }, + { + "epoch": 0.58, + "learning_rate": 1.9449886815953696e-06, + "loss": 1.1225, + "step": 19390 + }, + { + "epoch": 0.58, + "learning_rate": 1.9447508510591836e-06, + "loss": 1.02, + "step": 19391 + }, + { + "epoch": 0.58, + "learning_rate": 1.9445130258087016e-06, + "loss": 1.0995, + "step": 19392 + }, + { + "epoch": 0.58, + "learning_rate": 1.9442752058461884e-06, + "loss": 1.2045, + "step": 19393 + }, + { + "epoch": 0.58, + "learning_rate": 1.9440373911739075e-06, + "loss": 1.0282, + "step": 19394 + }, + { + "epoch": 0.58, + "learning_rate": 1.943799581794124e-06, + "loss": 1.0911, + "step": 19395 + }, + { + "epoch": 0.58, + "learning_rate": 1.943561777709099e-06, + "loss": 1.1207, + "step": 19396 + }, + { + "epoch": 0.58, + "learning_rate": 1.9433239789210984e-06, + "loss": 1.1873, + "step": 19397 + }, + { + "epoch": 0.58, + "learning_rate": 1.943086185432385e-06, + "loss": 1.0903, + "step": 19398 + }, + { + "epoch": 0.58, + "learning_rate": 1.9428483972452245e-06, + "loss": 1.1037, + "step": 19399 + }, + { + "epoch": 0.58, + "learning_rate": 1.942610614361878e-06, + "loss": 1.2117, + "step": 19400 + }, + { + "epoch": 0.58, + "learning_rate": 1.942372836784609e-06, + "loss": 1.0654, + "step": 19401 + }, + { + "epoch": 0.58, + "learning_rate": 1.9421350645156827e-06, + "loss": 1.0694, + "step": 19402 + }, + { + "epoch": 0.58, + "learning_rate": 1.9418972975573623e-06, + "loss": 1.1401, + "step": 19403 + }, + { + "epoch": 0.58, + "learning_rate": 1.9416595359119104e-06, + "loss": 1.0994, + "step": 19404 + }, + { + "epoch": 0.58, + "learning_rate": 1.941421779581591e-06, + "loss": 1.2101, + "step": 19405 + }, + { + "epoch": 0.58, + "learning_rate": 1.9411840285686672e-06, + "loss": 1.064, + "step": 19406 + }, + { + "epoch": 0.58, + "learning_rate": 1.940946282875402e-06, + "loss": 1.0235, + "step": 19407 + }, + { + "epoch": 0.58, + "learning_rate": 1.94070854250406e-06, + "loss": 1.0699, + "step": 19408 + }, + { + "epoch": 0.58, + "learning_rate": 1.9404708074569027e-06, + "loss": 1.0285, + "step": 19409 + }, + { + "epoch": 0.58, + "learning_rate": 1.9402330777361937e-06, + "loss": 1.1993, + "step": 19410 + }, + { + "epoch": 0.58, + "learning_rate": 1.939995353344196e-06, + "loss": 1.2581, + "step": 19411 + }, + { + "epoch": 0.58, + "learning_rate": 1.939757634283174e-06, + "loss": 1.1209, + "step": 19412 + }, + { + "epoch": 0.58, + "learning_rate": 1.939519920555388e-06, + "loss": 1.0943, + "step": 19413 + }, + { + "epoch": 0.58, + "learning_rate": 1.939282212163103e-06, + "loss": 1.2084, + "step": 19414 + }, + { + "epoch": 0.58, + "learning_rate": 1.939044509108581e-06, + "loss": 1.1085, + "step": 19415 + }, + { + "epoch": 0.58, + "learning_rate": 1.9388068113940853e-06, + "loss": 1.2152, + "step": 19416 + }, + { + "epoch": 0.58, + "learning_rate": 1.9385691190218787e-06, + "loss": 1.2124, + "step": 19417 + }, + { + "epoch": 0.58, + "learning_rate": 1.938331431994224e-06, + "loss": 1.2096, + "step": 19418 + }, + { + "epoch": 0.58, + "learning_rate": 1.9380937503133824e-06, + "loss": 1.086, + "step": 19419 + }, + { + "epoch": 0.59, + "learning_rate": 1.9378560739816183e-06, + "loss": 1.1349, + "step": 19420 + }, + { + "epoch": 0.59, + "learning_rate": 1.9376184030011946e-06, + "loss": 1.1152, + "step": 19421 + }, + { + "epoch": 0.59, + "learning_rate": 1.937380737374372e-06, + "loss": 1.1265, + "step": 19422 + }, + { + "epoch": 0.59, + "learning_rate": 1.9371430771034133e-06, + "loss": 0.9897, + "step": 19423 + }, + { + "epoch": 0.59, + "learning_rate": 1.9369054221905816e-06, + "loss": 1.22, + "step": 19424 + }, + { + "epoch": 0.59, + "learning_rate": 1.9366677726381407e-06, + "loss": 1.2001, + "step": 19425 + }, + { + "epoch": 0.59, + "learning_rate": 1.9364301284483496e-06, + "loss": 1.0883, + "step": 19426 + }, + { + "epoch": 0.59, + "learning_rate": 1.9361924896234725e-06, + "loss": 1.0895, + "step": 19427 + }, + { + "epoch": 0.59, + "learning_rate": 1.935954856165771e-06, + "loss": 1.0663, + "step": 19428 + }, + { + "epoch": 0.59, + "learning_rate": 1.9357172280775084e-06, + "loss": 1.1019, + "step": 19429 + }, + { + "epoch": 0.59, + "learning_rate": 1.935479605360946e-06, + "loss": 1.0463, + "step": 19430 + }, + { + "epoch": 0.59, + "learning_rate": 1.9352419880183454e-06, + "loss": 1.0972, + "step": 19431 + }, + { + "epoch": 0.59, + "learning_rate": 1.935004376051969e-06, + "loss": 1.1522, + "step": 19432 + }, + { + "epoch": 0.59, + "learning_rate": 1.934766769464079e-06, + "loss": 1.1053, + "step": 19433 + }, + { + "epoch": 0.59, + "learning_rate": 1.934529168256938e-06, + "loss": 1.1092, + "step": 19434 + }, + { + "epoch": 0.59, + "learning_rate": 1.934291572432806e-06, + "loss": 1.1727, + "step": 19435 + }, + { + "epoch": 0.59, + "learning_rate": 1.934053981993946e-06, + "loss": 1.1478, + "step": 19436 + }, + { + "epoch": 0.59, + "learning_rate": 1.9338163969426195e-06, + "loss": 1.149, + "step": 19437 + }, + { + "epoch": 0.59, + "learning_rate": 1.933578817281089e-06, + "loss": 1.1171, + "step": 19438 + }, + { + "epoch": 0.59, + "learning_rate": 1.9333412430116145e-06, + "loss": 1.0701, + "step": 19439 + }, + { + "epoch": 0.59, + "learning_rate": 1.933103674136458e-06, + "loss": 1.131, + "step": 19440 + }, + { + "epoch": 0.59, + "learning_rate": 1.932866110657882e-06, + "loss": 1.028, + "step": 19441 + }, + { + "epoch": 0.59, + "learning_rate": 1.9326285525781476e-06, + "loss": 1.2433, + "step": 19442 + }, + { + "epoch": 0.59, + "learning_rate": 1.932390999899516e-06, + "loss": 1.1921, + "step": 19443 + }, + { + "epoch": 0.59, + "learning_rate": 1.932153452624249e-06, + "loss": 1.1575, + "step": 19444 + }, + { + "epoch": 0.59, + "learning_rate": 1.9319159107546072e-06, + "loss": 1.0956, + "step": 19445 + }, + { + "epoch": 0.59, + "learning_rate": 1.931678374292852e-06, + "loss": 1.0804, + "step": 19446 + }, + { + "epoch": 0.59, + "learning_rate": 1.9314408432412467e-06, + "loss": 1.0624, + "step": 19447 + }, + { + "epoch": 0.59, + "learning_rate": 1.9312033176020493e-06, + "loss": 1.0521, + "step": 19448 + }, + { + "epoch": 0.59, + "learning_rate": 1.9309657973775227e-06, + "loss": 1.0797, + "step": 19449 + }, + { + "epoch": 0.59, + "learning_rate": 1.930728282569927e-06, + "loss": 1.0403, + "step": 19450 + }, + { + "epoch": 0.59, + "learning_rate": 1.9304907731815254e-06, + "loss": 1.0902, + "step": 19451 + }, + { + "epoch": 0.59, + "learning_rate": 1.9302532692145765e-06, + "loss": 1.12, + "step": 19452 + }, + { + "epoch": 0.59, + "learning_rate": 1.9300157706713413e-06, + "loss": 1.0583, + "step": 19453 + }, + { + "epoch": 0.59, + "learning_rate": 1.929778277554082e-06, + "loss": 1.0887, + "step": 19454 + }, + { + "epoch": 0.59, + "learning_rate": 1.929540789865059e-06, + "loss": 1.2184, + "step": 19455 + }, + { + "epoch": 0.59, + "learning_rate": 1.9293033076065333e-06, + "loss": 1.1268, + "step": 19456 + }, + { + "epoch": 0.59, + "learning_rate": 1.9290658307807647e-06, + "loss": 1.0297, + "step": 19457 + }, + { + "epoch": 0.59, + "learning_rate": 1.928828359390015e-06, + "loss": 1.1759, + "step": 19458 + }, + { + "epoch": 0.59, + "learning_rate": 1.9285908934365438e-06, + "loss": 1.0739, + "step": 19459 + }, + { + "epoch": 0.59, + "learning_rate": 1.9283534329226125e-06, + "loss": 1.176, + "step": 19460 + }, + { + "epoch": 0.59, + "learning_rate": 1.928115977850481e-06, + "loss": 1.0763, + "step": 19461 + }, + { + "epoch": 0.59, + "learning_rate": 1.9278785282224095e-06, + "loss": 1.1221, + "step": 19462 + }, + { + "epoch": 0.59, + "learning_rate": 1.9276410840406588e-06, + "loss": 1.1148, + "step": 19463 + }, + { + "epoch": 0.59, + "learning_rate": 1.9274036453074907e-06, + "loss": 1.1338, + "step": 19464 + }, + { + "epoch": 0.59, + "learning_rate": 1.9271662120251626e-06, + "loss": 1.1613, + "step": 19465 + }, + { + "epoch": 0.59, + "learning_rate": 1.926928784195937e-06, + "loss": 1.1156, + "step": 19466 + }, + { + "epoch": 0.59, + "learning_rate": 1.926691361822073e-06, + "loss": 1.1911, + "step": 19467 + }, + { + "epoch": 0.59, + "learning_rate": 1.926453944905831e-06, + "loss": 1.0789, + "step": 19468 + }, + { + "epoch": 0.59, + "learning_rate": 1.926216533449472e-06, + "loss": 1.1276, + "step": 19469 + }, + { + "epoch": 0.59, + "learning_rate": 1.925979127455255e-06, + "loss": 1.16, + "step": 19470 + }, + { + "epoch": 0.59, + "learning_rate": 1.92574172692544e-06, + "loss": 1.0975, + "step": 19471 + }, + { + "epoch": 0.59, + "learning_rate": 1.925504331862287e-06, + "loss": 1.1039, + "step": 19472 + }, + { + "epoch": 0.59, + "learning_rate": 1.9252669422680564e-06, + "loss": 1.1357, + "step": 19473 + }, + { + "epoch": 0.59, + "learning_rate": 1.9250295581450074e-06, + "loss": 1.1818, + "step": 19474 + }, + { + "epoch": 0.59, + "learning_rate": 1.9247921794954002e-06, + "loss": 1.0478, + "step": 19475 + }, + { + "epoch": 0.59, + "learning_rate": 1.9245548063214942e-06, + "loss": 1.1276, + "step": 19476 + }, + { + "epoch": 0.59, + "learning_rate": 1.9243174386255507e-06, + "loss": 1.1091, + "step": 19477 + }, + { + "epoch": 0.59, + "learning_rate": 1.924080076409827e-06, + "loss": 1.1063, + "step": 19478 + }, + { + "epoch": 0.59, + "learning_rate": 1.923842719676583e-06, + "loss": 1.0637, + "step": 19479 + }, + { + "epoch": 0.59, + "learning_rate": 1.923605368428079e-06, + "loss": 1.2628, + "step": 19480 + }, + { + "epoch": 0.59, + "learning_rate": 1.923368022666574e-06, + "loss": 1.1531, + "step": 19481 + }, + { + "epoch": 0.59, + "learning_rate": 1.9231306823943294e-06, + "loss": 1.151, + "step": 19482 + }, + { + "epoch": 0.59, + "learning_rate": 1.9228933476136016e-06, + "loss": 1.016, + "step": 19483 + }, + { + "epoch": 0.59, + "learning_rate": 1.9226560183266508e-06, + "loss": 1.0822, + "step": 19484 + }, + { + "epoch": 0.59, + "learning_rate": 1.922418694535737e-06, + "loss": 1.0596, + "step": 19485 + }, + { + "epoch": 0.59, + "learning_rate": 1.92218137624312e-06, + "loss": 1.1138, + "step": 19486 + }, + { + "epoch": 0.59, + "learning_rate": 1.921944063451057e-06, + "loss": 1.0381, + "step": 19487 + }, + { + "epoch": 0.59, + "learning_rate": 1.921706756161808e-06, + "loss": 1.0209, + "step": 19488 + }, + { + "epoch": 0.59, + "learning_rate": 1.9214694543776324e-06, + "loss": 1.0668, + "step": 19489 + }, + { + "epoch": 0.59, + "learning_rate": 1.92123215810079e-06, + "loss": 1.0333, + "step": 19490 + }, + { + "epoch": 0.59, + "learning_rate": 1.920994867333538e-06, + "loss": 1.1154, + "step": 19491 + }, + { + "epoch": 0.59, + "learning_rate": 1.9207575820781354e-06, + "loss": 1.2516, + "step": 19492 + }, + { + "epoch": 0.59, + "learning_rate": 1.9205203023368415e-06, + "loss": 1.1055, + "step": 19493 + }, + { + "epoch": 0.59, + "learning_rate": 1.9202830281119167e-06, + "loss": 1.1693, + "step": 19494 + }, + { + "epoch": 0.59, + "learning_rate": 1.9200457594056173e-06, + "loss": 1.163, + "step": 19495 + }, + { + "epoch": 0.59, + "learning_rate": 1.9198084962202024e-06, + "loss": 1.0671, + "step": 19496 + }, + { + "epoch": 0.59, + "learning_rate": 1.919571238557932e-06, + "loss": 1.1421, + "step": 19497 + }, + { + "epoch": 0.59, + "learning_rate": 1.9193339864210633e-06, + "loss": 1.1527, + "step": 19498 + }, + { + "epoch": 0.59, + "learning_rate": 1.919096739811856e-06, + "loss": 1.0843, + "step": 19499 + }, + { + "epoch": 0.59, + "learning_rate": 1.9188594987325677e-06, + "loss": 0.9818, + "step": 19500 + }, + { + "epoch": 0.59, + "learning_rate": 1.918622263185457e-06, + "loss": 1.1691, + "step": 19501 + }, + { + "epoch": 0.59, + "learning_rate": 1.918385033172782e-06, + "loss": 1.1395, + "step": 19502 + }, + { + "epoch": 0.59, + "learning_rate": 1.918147808696803e-06, + "loss": 1.1139, + "step": 19503 + }, + { + "epoch": 0.59, + "learning_rate": 1.917910589759775e-06, + "loss": 1.1429, + "step": 19504 + }, + { + "epoch": 0.59, + "learning_rate": 1.917673376363958e-06, + "loss": 1.1854, + "step": 19505 + }, + { + "epoch": 0.59, + "learning_rate": 1.9174361685116104e-06, + "loss": 1.1767, + "step": 19506 + }, + { + "epoch": 0.59, + "learning_rate": 1.9171989662049908e-06, + "loss": 1.1887, + "step": 19507 + }, + { + "epoch": 0.59, + "learning_rate": 1.9169617694463548e-06, + "loss": 1.1282, + "step": 19508 + }, + { + "epoch": 0.59, + "learning_rate": 1.9167245782379627e-06, + "loss": 0.9849, + "step": 19509 + }, + { + "epoch": 0.59, + "learning_rate": 1.916487392582071e-06, + "loss": 1.0698, + "step": 19510 + }, + { + "epoch": 0.59, + "learning_rate": 1.9162502124809385e-06, + "loss": 1.1589, + "step": 19511 + }, + { + "epoch": 0.59, + "learning_rate": 1.9160130379368236e-06, + "loss": 1.1102, + "step": 19512 + }, + { + "epoch": 0.59, + "learning_rate": 1.915775868951983e-06, + "loss": 1.0853, + "step": 19513 + }, + { + "epoch": 0.59, + "learning_rate": 1.915538705528674e-06, + "loss": 1.09, + "step": 19514 + }, + { + "epoch": 0.59, + "learning_rate": 1.9153015476691555e-06, + "loss": 1.0322, + "step": 19515 + }, + { + "epoch": 0.59, + "learning_rate": 1.915064395375686e-06, + "loss": 1.1738, + "step": 19516 + }, + { + "epoch": 0.59, + "learning_rate": 1.91482724865052e-06, + "loss": 1.0005, + "step": 19517 + }, + { + "epoch": 0.59, + "learning_rate": 1.914590107495917e-06, + "loss": 1.1238, + "step": 19518 + }, + { + "epoch": 0.59, + "learning_rate": 1.9143529719141345e-06, + "loss": 0.9287, + "step": 19519 + }, + { + "epoch": 0.59, + "learning_rate": 1.914115841907431e-06, + "loss": 1.0921, + "step": 19520 + }, + { + "epoch": 0.59, + "learning_rate": 1.9138787174780605e-06, + "loss": 1.0507, + "step": 19521 + }, + { + "epoch": 0.59, + "learning_rate": 1.913641598628283e-06, + "loss": 1.0956, + "step": 19522 + }, + { + "epoch": 0.59, + "learning_rate": 1.913404485360355e-06, + "loss": 1.046, + "step": 19523 + }, + { + "epoch": 0.59, + "learning_rate": 1.9131673776765336e-06, + "loss": 1.0999, + "step": 19524 + }, + { + "epoch": 0.59, + "learning_rate": 1.9129302755790768e-06, + "loss": 1.2418, + "step": 19525 + }, + { + "epoch": 0.59, + "learning_rate": 1.912693179070241e-06, + "loss": 1.1252, + "step": 19526 + }, + { + "epoch": 0.59, + "learning_rate": 1.9124560881522824e-06, + "loss": 1.1604, + "step": 19527 + }, + { + "epoch": 0.59, + "learning_rate": 1.912219002827459e-06, + "loss": 1.0048, + "step": 19528 + }, + { + "epoch": 0.59, + "learning_rate": 1.911981923098029e-06, + "loss": 1.1653, + "step": 19529 + }, + { + "epoch": 0.59, + "learning_rate": 1.911744848966247e-06, + "loss": 1.2767, + "step": 19530 + }, + { + "epoch": 0.59, + "learning_rate": 1.9115077804343704e-06, + "loss": 1.1478, + "step": 19531 + }, + { + "epoch": 0.59, + "learning_rate": 1.9112707175046565e-06, + "loss": 1.2031, + "step": 19532 + }, + { + "epoch": 0.59, + "learning_rate": 1.9110336601793623e-06, + "loss": 1.1711, + "step": 19533 + }, + { + "epoch": 0.59, + "learning_rate": 1.910796608460744e-06, + "loss": 1.1489, + "step": 19534 + }, + { + "epoch": 0.59, + "learning_rate": 1.910559562351057e-06, + "loss": 1.1149, + "step": 19535 + }, + { + "epoch": 0.59, + "learning_rate": 1.9103225218525603e-06, + "loss": 1.1853, + "step": 19536 + }, + { + "epoch": 0.59, + "learning_rate": 1.910085486967508e-06, + "loss": 1.1362, + "step": 19537 + }, + { + "epoch": 0.59, + "learning_rate": 1.909848457698159e-06, + "loss": 1.0706, + "step": 19538 + }, + { + "epoch": 0.59, + "learning_rate": 1.9096114340467677e-06, + "loss": 1.1063, + "step": 19539 + }, + { + "epoch": 0.59, + "learning_rate": 1.909374416015591e-06, + "loss": 1.1086, + "step": 19540 + }, + { + "epoch": 0.59, + "learning_rate": 1.9091374036068867e-06, + "loss": 0.9355, + "step": 19541 + }, + { + "epoch": 0.59, + "learning_rate": 1.9089003968229092e-06, + "loss": 1.0189, + "step": 19542 + }, + { + "epoch": 0.59, + "learning_rate": 1.9086633956659148e-06, + "loss": 1.3491, + "step": 19543 + }, + { + "epoch": 0.59, + "learning_rate": 1.90842640013816e-06, + "loss": 1.1982, + "step": 19544 + }, + { + "epoch": 0.59, + "learning_rate": 1.908189410241901e-06, + "loss": 1.1589, + "step": 19545 + }, + { + "epoch": 0.59, + "learning_rate": 1.907952425979395e-06, + "loss": 1.1916, + "step": 19546 + }, + { + "epoch": 0.59, + "learning_rate": 1.9077154473528957e-06, + "loss": 1.0587, + "step": 19547 + }, + { + "epoch": 0.59, + "learning_rate": 1.90747847436466e-06, + "loss": 1.0228, + "step": 19548 + }, + { + "epoch": 0.59, + "learning_rate": 1.9072415070169437e-06, + "loss": 1.1448, + "step": 19549 + }, + { + "epoch": 0.59, + "learning_rate": 1.9070045453120029e-06, + "loss": 1.1053, + "step": 19550 + }, + { + "epoch": 0.59, + "learning_rate": 1.9067675892520937e-06, + "loss": 1.1589, + "step": 19551 + }, + { + "epoch": 0.59, + "learning_rate": 1.9065306388394713e-06, + "loss": 1.0807, + "step": 19552 + }, + { + "epoch": 0.59, + "learning_rate": 1.906293694076391e-06, + "loss": 1.0323, + "step": 19553 + }, + { + "epoch": 0.59, + "learning_rate": 1.9060567549651088e-06, + "loss": 1.1472, + "step": 19554 + }, + { + "epoch": 0.59, + "learning_rate": 1.9058198215078808e-06, + "loss": 1.1555, + "step": 19555 + }, + { + "epoch": 0.59, + "learning_rate": 1.9055828937069611e-06, + "loss": 1.0985, + "step": 19556 + }, + { + "epoch": 0.59, + "learning_rate": 1.9053459715646063e-06, + "loss": 1.0642, + "step": 19557 + }, + { + "epoch": 0.59, + "learning_rate": 1.9051090550830714e-06, + "loss": 1.2386, + "step": 19558 + }, + { + "epoch": 0.59, + "learning_rate": 1.9048721442646128e-06, + "loss": 1.1193, + "step": 19559 + }, + { + "epoch": 0.59, + "learning_rate": 1.9046352391114837e-06, + "loss": 1.0595, + "step": 19560 + }, + { + "epoch": 0.59, + "learning_rate": 1.9043983396259401e-06, + "loss": 1.0552, + "step": 19561 + }, + { + "epoch": 0.59, + "learning_rate": 1.9041614458102382e-06, + "loss": 1.1922, + "step": 19562 + }, + { + "epoch": 0.59, + "learning_rate": 1.9039245576666316e-06, + "loss": 1.1762, + "step": 19563 + }, + { + "epoch": 0.59, + "learning_rate": 1.9036876751973777e-06, + "loss": 1.1094, + "step": 19564 + }, + { + "epoch": 0.59, + "learning_rate": 1.9034507984047285e-06, + "loss": 1.1566, + "step": 19565 + }, + { + "epoch": 0.59, + "learning_rate": 1.9032139272909406e-06, + "loss": 1.1206, + "step": 19566 + }, + { + "epoch": 0.59, + "learning_rate": 1.9029770618582688e-06, + "loss": 1.1199, + "step": 19567 + }, + { + "epoch": 0.59, + "learning_rate": 1.902740202108968e-06, + "loss": 1.0403, + "step": 19568 + }, + { + "epoch": 0.59, + "learning_rate": 1.9025033480452926e-06, + "loss": 1.1435, + "step": 19569 + }, + { + "epoch": 0.59, + "learning_rate": 1.9022664996694975e-06, + "loss": 1.2067, + "step": 19570 + }, + { + "epoch": 0.59, + "learning_rate": 1.9020296569838376e-06, + "loss": 1.1287, + "step": 19571 + }, + { + "epoch": 0.59, + "learning_rate": 1.901792819990568e-06, + "loss": 1.07, + "step": 19572 + }, + { + "epoch": 0.59, + "learning_rate": 1.9015559886919418e-06, + "loss": 1.0702, + "step": 19573 + }, + { + "epoch": 0.59, + "learning_rate": 1.9013191630902144e-06, + "loss": 1.244, + "step": 19574 + }, + { + "epoch": 0.59, + "learning_rate": 1.9010823431876404e-06, + "loss": 1.172, + "step": 19575 + }, + { + "epoch": 0.59, + "learning_rate": 1.900845528986474e-06, + "loss": 1.1443, + "step": 19576 + }, + { + "epoch": 0.59, + "learning_rate": 1.9006087204889707e-06, + "loss": 1.0334, + "step": 19577 + }, + { + "epoch": 0.59, + "learning_rate": 1.9003719176973823e-06, + "loss": 1.205, + "step": 19578 + }, + { + "epoch": 0.59, + "learning_rate": 1.9001351206139646e-06, + "loss": 1.0964, + "step": 19579 + }, + { + "epoch": 0.59, + "learning_rate": 1.8998983292409718e-06, + "loss": 1.1272, + "step": 19580 + }, + { + "epoch": 0.59, + "learning_rate": 1.8996615435806582e-06, + "loss": 1.0954, + "step": 19581 + }, + { + "epoch": 0.59, + "learning_rate": 1.8994247636352772e-06, + "loss": 1.0305, + "step": 19582 + }, + { + "epoch": 0.59, + "learning_rate": 1.899187989407083e-06, + "loss": 1.074, + "step": 19583 + }, + { + "epoch": 0.59, + "learning_rate": 1.8989512208983301e-06, + "loss": 1.046, + "step": 19584 + }, + { + "epoch": 0.59, + "learning_rate": 1.8987144581112729e-06, + "loss": 1.098, + "step": 19585 + }, + { + "epoch": 0.59, + "learning_rate": 1.8984777010481636e-06, + "loss": 1.0649, + "step": 19586 + }, + { + "epoch": 0.59, + "learning_rate": 1.898240949711257e-06, + "loss": 1.293, + "step": 19587 + }, + { + "epoch": 0.59, + "learning_rate": 1.8980042041028064e-06, + "loss": 0.9854, + "step": 19588 + }, + { + "epoch": 0.59, + "learning_rate": 1.897767464225066e-06, + "loss": 1.1302, + "step": 19589 + }, + { + "epoch": 0.59, + "learning_rate": 1.8975307300802904e-06, + "loss": 1.1688, + "step": 19590 + }, + { + "epoch": 0.59, + "learning_rate": 1.8972940016707308e-06, + "loss": 1.041, + "step": 19591 + }, + { + "epoch": 0.59, + "learning_rate": 1.8970572789986422e-06, + "loss": 1.1931, + "step": 19592 + }, + { + "epoch": 0.59, + "learning_rate": 1.8968205620662778e-06, + "loss": 1.0576, + "step": 19593 + }, + { + "epoch": 0.59, + "learning_rate": 1.8965838508758918e-06, + "loss": 1.0627, + "step": 19594 + }, + { + "epoch": 0.59, + "learning_rate": 1.8963471454297366e-06, + "loss": 1.0937, + "step": 19595 + }, + { + "epoch": 0.59, + "learning_rate": 1.8961104457300656e-06, + "loss": 1.0662, + "step": 19596 + }, + { + "epoch": 0.59, + "learning_rate": 1.8958737517791323e-06, + "loss": 1.0819, + "step": 19597 + }, + { + "epoch": 0.59, + "learning_rate": 1.895637063579191e-06, + "loss": 1.1344, + "step": 19598 + }, + { + "epoch": 0.59, + "learning_rate": 1.8954003811324928e-06, + "loss": 1.035, + "step": 19599 + }, + { + "epoch": 0.59, + "learning_rate": 1.8951637044412918e-06, + "loss": 1.1394, + "step": 19600 + }, + { + "epoch": 0.59, + "learning_rate": 1.894927033507841e-06, + "loss": 1.1358, + "step": 19601 + }, + { + "epoch": 0.59, + "learning_rate": 1.8946903683343932e-06, + "loss": 1.132, + "step": 19602 + }, + { + "epoch": 0.59, + "learning_rate": 1.8944537089232028e-06, + "loss": 1.0488, + "step": 19603 + }, + { + "epoch": 0.59, + "learning_rate": 1.8942170552765204e-06, + "loss": 1.1215, + "step": 19604 + }, + { + "epoch": 0.59, + "learning_rate": 1.8939804073966e-06, + "loss": 1.1038, + "step": 19605 + }, + { + "epoch": 0.59, + "learning_rate": 1.893743765285694e-06, + "loss": 0.9781, + "step": 19606 + }, + { + "epoch": 0.59, + "learning_rate": 1.8935071289460564e-06, + "loss": 1.0654, + "step": 19607 + }, + { + "epoch": 0.59, + "learning_rate": 1.8932704983799378e-06, + "loss": 1.0643, + "step": 19608 + }, + { + "epoch": 0.59, + "learning_rate": 1.893033873589592e-06, + "loss": 1.0832, + "step": 19609 + }, + { + "epoch": 0.59, + "learning_rate": 1.8927972545772713e-06, + "loss": 0.9361, + "step": 19610 + }, + { + "epoch": 0.59, + "learning_rate": 1.8925606413452296e-06, + "loss": 1.252, + "step": 19611 + }, + { + "epoch": 0.59, + "learning_rate": 1.892324033895717e-06, + "loss": 1.0685, + "step": 19612 + }, + { + "epoch": 0.59, + "learning_rate": 1.8920874322309865e-06, + "loss": 1.233, + "step": 19613 + }, + { + "epoch": 0.59, + "learning_rate": 1.891850836353291e-06, + "loss": 1.081, + "step": 19614 + }, + { + "epoch": 0.59, + "learning_rate": 1.891614246264883e-06, + "loss": 1.0978, + "step": 19615 + }, + { + "epoch": 0.59, + "learning_rate": 1.8913776619680153e-06, + "loss": 1.0942, + "step": 19616 + }, + { + "epoch": 0.59, + "learning_rate": 1.891141083464938e-06, + "loss": 1.0969, + "step": 19617 + }, + { + "epoch": 0.59, + "learning_rate": 1.8909045107579044e-06, + "loss": 1.2337, + "step": 19618 + }, + { + "epoch": 0.59, + "learning_rate": 1.8906679438491662e-06, + "loss": 1.2331, + "step": 19619 + }, + { + "epoch": 0.59, + "learning_rate": 1.8904313827409764e-06, + "loss": 1.1312, + "step": 19620 + }, + { + "epoch": 0.59, + "learning_rate": 1.8901948274355857e-06, + "loss": 1.1419, + "step": 19621 + }, + { + "epoch": 0.59, + "learning_rate": 1.8899582779352468e-06, + "loss": 1.1601, + "step": 19622 + }, + { + "epoch": 0.59, + "learning_rate": 1.889721734242212e-06, + "loss": 1.1049, + "step": 19623 + }, + { + "epoch": 0.59, + "learning_rate": 1.8894851963587317e-06, + "loss": 1.2327, + "step": 19624 + }, + { + "epoch": 0.59, + "learning_rate": 1.8892486642870584e-06, + "loss": 1.2535, + "step": 19625 + }, + { + "epoch": 0.59, + "learning_rate": 1.8890121380294433e-06, + "loss": 1.0549, + "step": 19626 + }, + { + "epoch": 0.59, + "learning_rate": 1.8887756175881384e-06, + "loss": 1.1262, + "step": 19627 + }, + { + "epoch": 0.59, + "learning_rate": 1.8885391029653954e-06, + "loss": 1.1169, + "step": 19628 + }, + { + "epoch": 0.59, + "learning_rate": 1.8883025941634664e-06, + "loss": 1.0634, + "step": 19629 + }, + { + "epoch": 0.59, + "learning_rate": 1.8880660911846014e-06, + "loss": 1.0013, + "step": 19630 + }, + { + "epoch": 0.59, + "learning_rate": 1.8878295940310524e-06, + "loss": 1.1596, + "step": 19631 + }, + { + "epoch": 0.59, + "learning_rate": 1.8875931027050705e-06, + "loss": 1.1145, + "step": 19632 + }, + { + "epoch": 0.59, + "learning_rate": 1.8873566172089084e-06, + "loss": 1.0744, + "step": 19633 + }, + { + "epoch": 0.59, + "learning_rate": 1.8871201375448158e-06, + "loss": 1.0867, + "step": 19634 + }, + { + "epoch": 0.59, + "learning_rate": 1.8868836637150438e-06, + "loss": 1.1445, + "step": 19635 + }, + { + "epoch": 0.59, + "learning_rate": 1.8866471957218447e-06, + "loss": 1.1194, + "step": 19636 + }, + { + "epoch": 0.59, + "learning_rate": 1.8864107335674686e-06, + "loss": 1.0845, + "step": 19637 + }, + { + "epoch": 0.59, + "learning_rate": 1.8861742772541666e-06, + "loss": 1.0851, + "step": 19638 + }, + { + "epoch": 0.59, + "learning_rate": 1.8859378267841899e-06, + "loss": 1.0481, + "step": 19639 + }, + { + "epoch": 0.59, + "learning_rate": 1.8857013821597895e-06, + "loss": 1.0588, + "step": 19640 + }, + { + "epoch": 0.59, + "learning_rate": 1.8854649433832157e-06, + "loss": 1.0801, + "step": 19641 + }, + { + "epoch": 0.59, + "learning_rate": 1.8852285104567208e-06, + "loss": 0.9926, + "step": 19642 + }, + { + "epoch": 0.59, + "learning_rate": 1.8849920833825537e-06, + "loss": 1.187, + "step": 19643 + }, + { + "epoch": 0.59, + "learning_rate": 1.8847556621629654e-06, + "loss": 1.1401, + "step": 19644 + }, + { + "epoch": 0.59, + "learning_rate": 1.8845192468002071e-06, + "loss": 1.2614, + "step": 19645 + }, + { + "epoch": 0.59, + "learning_rate": 1.88428283729653e-06, + "loss": 1.0724, + "step": 19646 + }, + { + "epoch": 0.59, + "learning_rate": 1.8840464336541827e-06, + "loss": 1.0887, + "step": 19647 + }, + { + "epoch": 0.59, + "learning_rate": 1.883810035875417e-06, + "loss": 1.054, + "step": 19648 + }, + { + "epoch": 0.59, + "learning_rate": 1.8835736439624827e-06, + "loss": 1.1656, + "step": 19649 + }, + { + "epoch": 0.59, + "learning_rate": 1.883337257917631e-06, + "loss": 1.1022, + "step": 19650 + }, + { + "epoch": 0.59, + "learning_rate": 1.8831008777431112e-06, + "loss": 1.2168, + "step": 19651 + }, + { + "epoch": 0.59, + "learning_rate": 1.8828645034411738e-06, + "loss": 1.1313, + "step": 19652 + }, + { + "epoch": 0.59, + "learning_rate": 1.882628135014069e-06, + "loss": 1.1539, + "step": 19653 + }, + { + "epoch": 0.59, + "learning_rate": 1.8823917724640472e-06, + "loss": 1.1874, + "step": 19654 + }, + { + "epoch": 0.59, + "learning_rate": 1.8821554157933593e-06, + "loss": 1.1442, + "step": 19655 + }, + { + "epoch": 0.59, + "learning_rate": 1.8819190650042535e-06, + "loss": 1.2347, + "step": 19656 + }, + { + "epoch": 0.59, + "learning_rate": 1.8816827200989802e-06, + "loss": 1.0172, + "step": 19657 + }, + { + "epoch": 0.59, + "learning_rate": 1.8814463810797896e-06, + "loss": 1.1323, + "step": 19658 + }, + { + "epoch": 0.59, + "learning_rate": 1.8812100479489325e-06, + "loss": 1.0709, + "step": 19659 + }, + { + "epoch": 0.59, + "learning_rate": 1.880973720708657e-06, + "loss": 1.146, + "step": 19660 + }, + { + "epoch": 0.59, + "learning_rate": 1.8807373993612133e-06, + "loss": 1.0819, + "step": 19661 + }, + { + "epoch": 0.59, + "learning_rate": 1.8805010839088516e-06, + "loss": 1.0202, + "step": 19662 + }, + { + "epoch": 0.59, + "learning_rate": 1.8802647743538217e-06, + "loss": 1.1405, + "step": 19663 + }, + { + "epoch": 0.59, + "learning_rate": 1.8800284706983718e-06, + "loss": 0.9635, + "step": 19664 + }, + { + "epoch": 0.59, + "learning_rate": 1.8797921729447523e-06, + "loss": 1.1586, + "step": 19665 + }, + { + "epoch": 0.59, + "learning_rate": 1.879555881095213e-06, + "loss": 1.1243, + "step": 19666 + }, + { + "epoch": 0.59, + "learning_rate": 1.8793195951520026e-06, + "loss": 1.085, + "step": 19667 + }, + { + "epoch": 0.59, + "learning_rate": 1.8790833151173717e-06, + "loss": 1.0505, + "step": 19668 + }, + { + "epoch": 0.59, + "learning_rate": 1.8788470409935678e-06, + "loss": 1.0986, + "step": 19669 + }, + { + "epoch": 0.59, + "learning_rate": 1.8786107727828406e-06, + "loss": 1.1491, + "step": 19670 + }, + { + "epoch": 0.59, + "learning_rate": 1.8783745104874399e-06, + "loss": 0.9993, + "step": 19671 + }, + { + "epoch": 0.59, + "learning_rate": 1.8781382541096155e-06, + "loss": 1.2036, + "step": 19672 + }, + { + "epoch": 0.59, + "learning_rate": 1.8779020036516144e-06, + "loss": 1.0214, + "step": 19673 + }, + { + "epoch": 0.59, + "learning_rate": 1.8776657591156863e-06, + "loss": 1.2056, + "step": 19674 + }, + { + "epoch": 0.59, + "learning_rate": 1.8774295205040807e-06, + "loss": 1.1766, + "step": 19675 + }, + { + "epoch": 0.59, + "learning_rate": 1.8771932878190467e-06, + "loss": 1.1346, + "step": 19676 + }, + { + "epoch": 0.59, + "learning_rate": 1.876957061062832e-06, + "loss": 1.0403, + "step": 19677 + }, + { + "epoch": 0.59, + "learning_rate": 1.876720840237686e-06, + "loss": 1.1088, + "step": 19678 + }, + { + "epoch": 0.59, + "learning_rate": 1.8764846253458577e-06, + "loss": 1.0572, + "step": 19679 + }, + { + "epoch": 0.59, + "learning_rate": 1.8762484163895964e-06, + "loss": 1.2189, + "step": 19680 + }, + { + "epoch": 0.59, + "learning_rate": 1.8760122133711487e-06, + "loss": 1.1682, + "step": 19681 + }, + { + "epoch": 0.59, + "learning_rate": 1.8757760162927642e-06, + "loss": 1.1721, + "step": 19682 + }, + { + "epoch": 0.59, + "learning_rate": 1.8755398251566912e-06, + "loss": 1.1529, + "step": 19683 + }, + { + "epoch": 0.59, + "learning_rate": 1.8753036399651786e-06, + "loss": 1.0263, + "step": 19684 + }, + { + "epoch": 0.59, + "learning_rate": 1.8750674607204752e-06, + "loss": 1.1675, + "step": 19685 + }, + { + "epoch": 0.59, + "learning_rate": 1.8748312874248278e-06, + "loss": 1.2009, + "step": 19686 + }, + { + "epoch": 0.59, + "learning_rate": 1.8745951200804854e-06, + "loss": 1.0191, + "step": 19687 + }, + { + "epoch": 0.59, + "learning_rate": 1.8743589586896966e-06, + "loss": 1.1996, + "step": 19688 + }, + { + "epoch": 0.59, + "learning_rate": 1.8741228032547094e-06, + "loss": 1.2251, + "step": 19689 + }, + { + "epoch": 0.59, + "learning_rate": 1.8738866537777708e-06, + "loss": 1.2396, + "step": 19690 + }, + { + "epoch": 0.59, + "learning_rate": 1.8736505102611303e-06, + "loss": 1.0828, + "step": 19691 + }, + { + "epoch": 0.59, + "learning_rate": 1.8734143727070347e-06, + "loss": 1.1356, + "step": 19692 + }, + { + "epoch": 0.59, + "learning_rate": 1.873178241117734e-06, + "loss": 1.0476, + "step": 19693 + }, + { + "epoch": 0.59, + "learning_rate": 1.8729421154954735e-06, + "loss": 1.0907, + "step": 19694 + }, + { + "epoch": 0.59, + "learning_rate": 1.872705995842502e-06, + "loss": 1.0605, + "step": 19695 + }, + { + "epoch": 0.59, + "learning_rate": 1.872469882161067e-06, + "loss": 1.1309, + "step": 19696 + }, + { + "epoch": 0.59, + "learning_rate": 1.872233774453417e-06, + "loss": 1.1427, + "step": 19697 + }, + { + "epoch": 0.59, + "learning_rate": 1.8719976727217998e-06, + "loss": 1.1412, + "step": 19698 + }, + { + "epoch": 0.59, + "learning_rate": 1.8717615769684612e-06, + "loss": 1.0518, + "step": 19699 + }, + { + "epoch": 0.59, + "learning_rate": 1.87152548719565e-06, + "loss": 1.2158, + "step": 19700 + }, + { + "epoch": 0.59, + "learning_rate": 1.8712894034056133e-06, + "loss": 1.0834, + "step": 19701 + }, + { + "epoch": 0.59, + "learning_rate": 1.8710533256005997e-06, + "loss": 1.1354, + "step": 19702 + }, + { + "epoch": 0.59, + "learning_rate": 1.8708172537828545e-06, + "loss": 1.0323, + "step": 19703 + }, + { + "epoch": 0.59, + "learning_rate": 1.8705811879546262e-06, + "loss": 1.0236, + "step": 19704 + }, + { + "epoch": 0.59, + "learning_rate": 1.8703451281181623e-06, + "loss": 1.1035, + "step": 19705 + }, + { + "epoch": 0.59, + "learning_rate": 1.8701090742757096e-06, + "loss": 1.0228, + "step": 19706 + }, + { + "epoch": 0.59, + "learning_rate": 1.8698730264295146e-06, + "loss": 1.0524, + "step": 19707 + }, + { + "epoch": 0.59, + "learning_rate": 1.8696369845818252e-06, + "loss": 1.1464, + "step": 19708 + }, + { + "epoch": 0.59, + "learning_rate": 1.8694009487348878e-06, + "loss": 1.1681, + "step": 19709 + }, + { + "epoch": 0.59, + "learning_rate": 1.8691649188909493e-06, + "loss": 1.1689, + "step": 19710 + }, + { + "epoch": 0.59, + "learning_rate": 1.8689288950522589e-06, + "loss": 1.0861, + "step": 19711 + }, + { + "epoch": 0.59, + "learning_rate": 1.8686928772210596e-06, + "loss": 1.1899, + "step": 19712 + }, + { + "epoch": 0.59, + "learning_rate": 1.8684568653996004e-06, + "loss": 1.052, + "step": 19713 + }, + { + "epoch": 0.59, + "learning_rate": 1.8682208595901278e-06, + "loss": 1.0875, + "step": 19714 + }, + { + "epoch": 0.59, + "learning_rate": 1.8679848597948885e-06, + "loss": 1.1494, + "step": 19715 + }, + { + "epoch": 0.59, + "learning_rate": 1.8677488660161294e-06, + "loss": 1.0391, + "step": 19716 + }, + { + "epoch": 0.59, + "learning_rate": 1.8675128782560958e-06, + "loss": 1.1182, + "step": 19717 + }, + { + "epoch": 0.59, + "learning_rate": 1.8672768965170352e-06, + "loss": 0.9877, + "step": 19718 + }, + { + "epoch": 0.59, + "learning_rate": 1.8670409208011941e-06, + "loss": 1.1202, + "step": 19719 + }, + { + "epoch": 0.59, + "learning_rate": 1.8668049511108183e-06, + "loss": 1.1036, + "step": 19720 + }, + { + "epoch": 0.59, + "learning_rate": 1.866568987448154e-06, + "loss": 1.1713, + "step": 19721 + }, + { + "epoch": 0.59, + "learning_rate": 1.866333029815448e-06, + "loss": 1.0742, + "step": 19722 + }, + { + "epoch": 0.59, + "learning_rate": 1.8660970782149467e-06, + "loss": 1.0635, + "step": 19723 + }, + { + "epoch": 0.59, + "learning_rate": 1.8658611326488967e-06, + "loss": 1.0978, + "step": 19724 + }, + { + "epoch": 0.59, + "learning_rate": 1.8656251931195424e-06, + "loss": 1.02, + "step": 19725 + }, + { + "epoch": 0.59, + "learning_rate": 1.8653892596291306e-06, + "loss": 1.1094, + "step": 19726 + }, + { + "epoch": 0.59, + "learning_rate": 1.8651533321799075e-06, + "loss": 1.0511, + "step": 19727 + }, + { + "epoch": 0.59, + "learning_rate": 1.8649174107741197e-06, + "loss": 1.0503, + "step": 19728 + }, + { + "epoch": 0.59, + "learning_rate": 1.8646814954140115e-06, + "loss": 1.0798, + "step": 19729 + }, + { + "epoch": 0.59, + "learning_rate": 1.8644455861018295e-06, + "loss": 1.1756, + "step": 19730 + }, + { + "epoch": 0.59, + "learning_rate": 1.8642096828398192e-06, + "loss": 1.1442, + "step": 19731 + }, + { + "epoch": 0.59, + "learning_rate": 1.8639737856302276e-06, + "loss": 1.1299, + "step": 19732 + }, + { + "epoch": 0.59, + "learning_rate": 1.8637378944752982e-06, + "loss": 1.0923, + "step": 19733 + }, + { + "epoch": 0.59, + "learning_rate": 1.8635020093772776e-06, + "loss": 0.9417, + "step": 19734 + }, + { + "epoch": 0.59, + "learning_rate": 1.8632661303384117e-06, + "loss": 1.2097, + "step": 19735 + }, + { + "epoch": 0.59, + "learning_rate": 1.8630302573609455e-06, + "loss": 1.165, + "step": 19736 + }, + { + "epoch": 0.59, + "learning_rate": 1.8627943904471251e-06, + "loss": 1.0358, + "step": 19737 + }, + { + "epoch": 0.59, + "learning_rate": 1.8625585295991943e-06, + "loss": 1.0024, + "step": 19738 + }, + { + "epoch": 0.59, + "learning_rate": 1.8623226748193996e-06, + "loss": 1.1334, + "step": 19739 + }, + { + "epoch": 0.59, + "learning_rate": 1.8620868261099855e-06, + "loss": 1.1582, + "step": 19740 + }, + { + "epoch": 0.59, + "learning_rate": 1.861850983473199e-06, + "loss": 1.0803, + "step": 19741 + }, + { + "epoch": 0.59, + "learning_rate": 1.8616151469112827e-06, + "loss": 1.2327, + "step": 19742 + }, + { + "epoch": 0.59, + "learning_rate": 1.8613793164264826e-06, + "loss": 1.1816, + "step": 19743 + }, + { + "epoch": 0.59, + "learning_rate": 1.8611434920210442e-06, + "loss": 1.1311, + "step": 19744 + }, + { + "epoch": 0.59, + "learning_rate": 1.8609076736972121e-06, + "loss": 1.0773, + "step": 19745 + }, + { + "epoch": 0.59, + "learning_rate": 1.8606718614572308e-06, + "loss": 1.0945, + "step": 19746 + }, + { + "epoch": 0.59, + "learning_rate": 1.8604360553033456e-06, + "loss": 1.1379, + "step": 19747 + }, + { + "epoch": 0.59, + "learning_rate": 1.8602002552378009e-06, + "loss": 1.3244, + "step": 19748 + }, + { + "epoch": 0.59, + "learning_rate": 1.859964461262842e-06, + "loss": 1.2075, + "step": 19749 + }, + { + "epoch": 0.59, + "learning_rate": 1.859728673380714e-06, + "loss": 1.189, + "step": 19750 + }, + { + "epoch": 0.59, + "learning_rate": 1.8594928915936594e-06, + "loss": 1.1244, + "step": 19751 + }, + { + "epoch": 0.6, + "learning_rate": 1.859257115903924e-06, + "loss": 1.0948, + "step": 19752 + }, + { + "epoch": 0.6, + "learning_rate": 1.8590213463137527e-06, + "loss": 1.042, + "step": 19753 + }, + { + "epoch": 0.6, + "learning_rate": 1.8587855828253903e-06, + "loss": 1.0693, + "step": 19754 + }, + { + "epoch": 0.6, + "learning_rate": 1.8585498254410794e-06, + "loss": 1.2063, + "step": 19755 + }, + { + "epoch": 0.6, + "learning_rate": 1.8583140741630651e-06, + "loss": 1.2446, + "step": 19756 + }, + { + "epoch": 0.6, + "learning_rate": 1.8580783289935917e-06, + "loss": 1.0886, + "step": 19757 + }, + { + "epoch": 0.6, + "learning_rate": 1.857842589934904e-06, + "loss": 1.1038, + "step": 19758 + }, + { + "epoch": 0.6, + "learning_rate": 1.857606856989245e-06, + "loss": 1.0103, + "step": 19759 + }, + { + "epoch": 0.6, + "learning_rate": 1.8573711301588592e-06, + "loss": 1.1086, + "step": 19760 + }, + { + "epoch": 0.6, + "learning_rate": 1.8571354094459912e-06, + "loss": 1.1223, + "step": 19761 + }, + { + "epoch": 0.6, + "learning_rate": 1.8568996948528842e-06, + "loss": 1.1328, + "step": 19762 + }, + { + "epoch": 0.6, + "learning_rate": 1.8566639863817838e-06, + "loss": 1.0945, + "step": 19763 + }, + { + "epoch": 0.6, + "learning_rate": 1.8564282840349306e-06, + "loss": 1.1261, + "step": 19764 + }, + { + "epoch": 0.6, + "learning_rate": 1.8561925878145708e-06, + "loss": 0.9662, + "step": 19765 + }, + { + "epoch": 0.6, + "learning_rate": 1.8559568977229472e-06, + "loss": 1.1016, + "step": 19766 + }, + { + "epoch": 0.6, + "learning_rate": 1.855721213762305e-06, + "loss": 1.1871, + "step": 19767 + }, + { + "epoch": 0.6, + "learning_rate": 1.8554855359348855e-06, + "loss": 1.1087, + "step": 19768 + }, + { + "epoch": 0.6, + "learning_rate": 1.8552498642429332e-06, + "loss": 1.2037, + "step": 19769 + }, + { + "epoch": 0.6, + "learning_rate": 1.8550141986886916e-06, + "loss": 1.0897, + "step": 19770 + }, + { + "epoch": 0.6, + "learning_rate": 1.8547785392744048e-06, + "loss": 1.1192, + "step": 19771 + }, + { + "epoch": 0.6, + "learning_rate": 1.854542886002315e-06, + "loss": 1.1369, + "step": 19772 + }, + { + "epoch": 0.6, + "learning_rate": 1.854307238874666e-06, + "loss": 1.1652, + "step": 19773 + }, + { + "epoch": 0.6, + "learning_rate": 1.8540715978937012e-06, + "loss": 1.072, + "step": 19774 + }, + { + "epoch": 0.6, + "learning_rate": 1.8538359630616636e-06, + "loss": 1.0978, + "step": 19775 + }, + { + "epoch": 0.6, + "learning_rate": 1.8536003343807977e-06, + "loss": 1.0897, + "step": 19776 + }, + { + "epoch": 0.6, + "learning_rate": 1.853364711853344e-06, + "loss": 1.0651, + "step": 19777 + }, + { + "epoch": 0.6, + "learning_rate": 1.853129095481547e-06, + "loss": 0.9971, + "step": 19778 + }, + { + "epoch": 0.6, + "learning_rate": 1.8528934852676496e-06, + "loss": 1.207, + "step": 19779 + }, + { + "epoch": 0.6, + "learning_rate": 1.8526578812138952e-06, + "loss": 1.2112, + "step": 19780 + }, + { + "epoch": 0.6, + "learning_rate": 1.8524222833225252e-06, + "loss": 1.1487, + "step": 19781 + }, + { + "epoch": 0.6, + "learning_rate": 1.8521866915957832e-06, + "loss": 1.2094, + "step": 19782 + }, + { + "epoch": 0.6, + "learning_rate": 1.851951106035912e-06, + "loss": 1.0262, + "step": 19783 + }, + { + "epoch": 0.6, + "learning_rate": 1.8517155266451543e-06, + "loss": 1.082, + "step": 19784 + }, + { + "epoch": 0.6, + "learning_rate": 1.8514799534257522e-06, + "loss": 1.1595, + "step": 19785 + }, + { + "epoch": 0.6, + "learning_rate": 1.8512443863799487e-06, + "loss": 1.2726, + "step": 19786 + }, + { + "epoch": 0.6, + "learning_rate": 1.8510088255099868e-06, + "loss": 1.179, + "step": 19787 + }, + { + "epoch": 0.6, + "learning_rate": 1.8507732708181076e-06, + "loss": 1.1151, + "step": 19788 + }, + { + "epoch": 0.6, + "learning_rate": 1.8505377223065545e-06, + "loss": 1.1166, + "step": 19789 + }, + { + "epoch": 0.6, + "learning_rate": 1.8503021799775695e-06, + "loss": 1.023, + "step": 19790 + }, + { + "epoch": 0.6, + "learning_rate": 1.8500666438333945e-06, + "loss": 1.074, + "step": 19791 + }, + { + "epoch": 0.6, + "learning_rate": 1.849831113876272e-06, + "loss": 1.0047, + "step": 19792 + }, + { + "epoch": 0.6, + "learning_rate": 1.8495955901084456e-06, + "loss": 1.1277, + "step": 19793 + }, + { + "epoch": 0.6, + "learning_rate": 1.8493600725321544e-06, + "loss": 1.2181, + "step": 19794 + }, + { + "epoch": 0.6, + "learning_rate": 1.8491245611496422e-06, + "loss": 1.064, + "step": 19795 + }, + { + "epoch": 0.6, + "learning_rate": 1.8488890559631506e-06, + "loss": 1.1323, + "step": 19796 + }, + { + "epoch": 0.6, + "learning_rate": 1.8486535569749225e-06, + "loss": 1.1722, + "step": 19797 + }, + { + "epoch": 0.6, + "learning_rate": 1.8484180641871986e-06, + "loss": 1.0954, + "step": 19798 + }, + { + "epoch": 0.6, + "learning_rate": 1.84818257760222e-06, + "loss": 1.2046, + "step": 19799 + }, + { + "epoch": 0.6, + "learning_rate": 1.8479470972222297e-06, + "loss": 1.2183, + "step": 19800 + }, + { + "epoch": 0.6, + "learning_rate": 1.847711623049469e-06, + "loss": 1.1359, + "step": 19801 + }, + { + "epoch": 0.6, + "learning_rate": 1.84747615508618e-06, + "loss": 1.2567, + "step": 19802 + }, + { + "epoch": 0.6, + "learning_rate": 1.8472406933346032e-06, + "loss": 1.1042, + "step": 19803 + }, + { + "epoch": 0.6, + "learning_rate": 1.8470052377969804e-06, + "loss": 1.1525, + "step": 19804 + }, + { + "epoch": 0.6, + "learning_rate": 1.8467697884755537e-06, + "loss": 1.0449, + "step": 19805 + }, + { + "epoch": 0.6, + "learning_rate": 1.8465343453725649e-06, + "loss": 1.222, + "step": 19806 + }, + { + "epoch": 0.6, + "learning_rate": 1.8462989084902532e-06, + "loss": 1.0964, + "step": 19807 + }, + { + "epoch": 0.6, + "learning_rate": 1.8460634778308611e-06, + "loss": 1.106, + "step": 19808 + }, + { + "epoch": 0.6, + "learning_rate": 1.84582805339663e-06, + "loss": 1.0836, + "step": 19809 + }, + { + "epoch": 0.6, + "learning_rate": 1.8455926351898013e-06, + "loss": 1.2059, + "step": 19810 + }, + { + "epoch": 0.6, + "learning_rate": 1.8453572232126149e-06, + "loss": 1.154, + "step": 19811 + }, + { + "epoch": 0.6, + "learning_rate": 1.8451218174673125e-06, + "loss": 1.0463, + "step": 19812 + }, + { + "epoch": 0.6, + "learning_rate": 1.8448864179561347e-06, + "loss": 0.9445, + "step": 19813 + }, + { + "epoch": 0.6, + "learning_rate": 1.8446510246813227e-06, + "loss": 1.0513, + "step": 19814 + }, + { + "epoch": 0.6, + "learning_rate": 1.844415637645118e-06, + "loss": 1.1002, + "step": 19815 + }, + { + "epoch": 0.6, + "learning_rate": 1.8441802568497602e-06, + "loss": 1.0986, + "step": 19816 + }, + { + "epoch": 0.6, + "learning_rate": 1.8439448822974903e-06, + "loss": 1.1066, + "step": 19817 + }, + { + "epoch": 0.6, + "learning_rate": 1.8437095139905493e-06, + "loss": 1.0417, + "step": 19818 + }, + { + "epoch": 0.6, + "learning_rate": 1.8434741519311788e-06, + "loss": 1.1701, + "step": 19819 + }, + { + "epoch": 0.6, + "learning_rate": 1.8432387961216169e-06, + "loss": 1.1854, + "step": 19820 + }, + { + "epoch": 0.6, + "learning_rate": 1.8430034465641055e-06, + "loss": 1.1019, + "step": 19821 + }, + { + "epoch": 0.6, + "learning_rate": 1.8427681032608849e-06, + "loss": 1.0452, + "step": 19822 + }, + { + "epoch": 0.6, + "learning_rate": 1.8425327662141962e-06, + "loss": 1.1967, + "step": 19823 + }, + { + "epoch": 0.6, + "learning_rate": 1.8422974354262783e-06, + "loss": 1.2016, + "step": 19824 + }, + { + "epoch": 0.6, + "learning_rate": 1.8420621108993719e-06, + "loss": 1.118, + "step": 19825 + }, + { + "epoch": 0.6, + "learning_rate": 1.841826792635717e-06, + "loss": 1.0986, + "step": 19826 + }, + { + "epoch": 0.6, + "learning_rate": 1.8415914806375546e-06, + "loss": 1.1247, + "step": 19827 + }, + { + "epoch": 0.6, + "learning_rate": 1.8413561749071243e-06, + "loss": 1.0417, + "step": 19828 + }, + { + "epoch": 0.6, + "learning_rate": 1.8411208754466655e-06, + "loss": 1.0687, + "step": 19829 + }, + { + "epoch": 0.6, + "learning_rate": 1.8408855822584188e-06, + "loss": 1.2295, + "step": 19830 + }, + { + "epoch": 0.6, + "learning_rate": 1.840650295344624e-06, + "loss": 1.1931, + "step": 19831 + }, + { + "epoch": 0.6, + "learning_rate": 1.8404150147075218e-06, + "loss": 1.0934, + "step": 19832 + }, + { + "epoch": 0.6, + "learning_rate": 1.8401797403493498e-06, + "loss": 1.1923, + "step": 19833 + }, + { + "epoch": 0.6, + "learning_rate": 1.839944472272349e-06, + "loss": 1.1019, + "step": 19834 + }, + { + "epoch": 0.6, + "learning_rate": 1.839709210478759e-06, + "loss": 1.193, + "step": 19835 + }, + { + "epoch": 0.6, + "learning_rate": 1.8394739549708201e-06, + "loss": 1.1839, + "step": 19836 + }, + { + "epoch": 0.6, + "learning_rate": 1.8392387057507702e-06, + "loss": 1.2446, + "step": 19837 + }, + { + "epoch": 0.6, + "learning_rate": 1.8390034628208498e-06, + "loss": 1.1224, + "step": 19838 + }, + { + "epoch": 0.6, + "learning_rate": 1.8387682261832975e-06, + "loss": 1.0116, + "step": 19839 + }, + { + "epoch": 0.6, + "learning_rate": 1.8385329958403537e-06, + "loss": 1.0789, + "step": 19840 + }, + { + "epoch": 0.6, + "learning_rate": 1.8382977717942574e-06, + "loss": 1.1144, + "step": 19841 + }, + { + "epoch": 0.6, + "learning_rate": 1.8380625540472474e-06, + "loss": 1.1519, + "step": 19842 + }, + { + "epoch": 0.6, + "learning_rate": 1.837827342601563e-06, + "loss": 1.2446, + "step": 19843 + }, + { + "epoch": 0.6, + "learning_rate": 1.8375921374594433e-06, + "loss": 1.1429, + "step": 19844 + }, + { + "epoch": 0.6, + "learning_rate": 1.8373569386231285e-06, + "loss": 1.1629, + "step": 19845 + }, + { + "epoch": 0.6, + "learning_rate": 1.8371217460948555e-06, + "loss": 1.1399, + "step": 19846 + }, + { + "epoch": 0.6, + "learning_rate": 1.8368865598768642e-06, + "loss": 1.0792, + "step": 19847 + }, + { + "epoch": 0.6, + "learning_rate": 1.8366513799713937e-06, + "loss": 1.1135, + "step": 19848 + }, + { + "epoch": 0.6, + "learning_rate": 1.8364162063806833e-06, + "loss": 1.1899, + "step": 19849 + }, + { + "epoch": 0.6, + "learning_rate": 1.8361810391069701e-06, + "loss": 1.1084, + "step": 19850 + }, + { + "epoch": 0.6, + "learning_rate": 1.8359458781524935e-06, + "loss": 1.0707, + "step": 19851 + }, + { + "epoch": 0.6, + "learning_rate": 1.8357107235194926e-06, + "loss": 1.1323, + "step": 19852 + }, + { + "epoch": 0.6, + "learning_rate": 1.8354755752102057e-06, + "loss": 0.9926, + "step": 19853 + }, + { + "epoch": 0.6, + "learning_rate": 1.8352404332268717e-06, + "loss": 1.1796, + "step": 19854 + }, + { + "epoch": 0.6, + "learning_rate": 1.835005297571728e-06, + "loss": 1.2086, + "step": 19855 + }, + { + "epoch": 0.6, + "learning_rate": 1.8347701682470136e-06, + "loss": 1.1851, + "step": 19856 + }, + { + "epoch": 0.6, + "learning_rate": 1.834535045254967e-06, + "loss": 1.1375, + "step": 19857 + }, + { + "epoch": 0.6, + "learning_rate": 1.8342999285978275e-06, + "loss": 1.1865, + "step": 19858 + }, + { + "epoch": 0.6, + "learning_rate": 1.8340648182778306e-06, + "loss": 1.0667, + "step": 19859 + }, + { + "epoch": 0.6, + "learning_rate": 1.8338297142972162e-06, + "loss": 1.1578, + "step": 19860 + }, + { + "epoch": 0.6, + "learning_rate": 1.833594616658222e-06, + "loss": 1.2303, + "step": 19861 + }, + { + "epoch": 0.6, + "learning_rate": 1.833359525363087e-06, + "loss": 1.1462, + "step": 19862 + }, + { + "epoch": 0.6, + "learning_rate": 1.8331244404140469e-06, + "loss": 1.1522, + "step": 19863 + }, + { + "epoch": 0.6, + "learning_rate": 1.8328893618133415e-06, + "loss": 1.1474, + "step": 19864 + }, + { + "epoch": 0.6, + "learning_rate": 1.832654289563208e-06, + "loss": 1.1276, + "step": 19865 + }, + { + "epoch": 0.6, + "learning_rate": 1.8324192236658848e-06, + "loss": 1.1496, + "step": 19866 + }, + { + "epoch": 0.6, + "learning_rate": 1.8321841641236083e-06, + "loss": 1.1887, + "step": 19867 + }, + { + "epoch": 0.6, + "learning_rate": 1.831949110938617e-06, + "loss": 1.1438, + "step": 19868 + }, + { + "epoch": 0.6, + "learning_rate": 1.8317140641131487e-06, + "loss": 1.0962, + "step": 19869 + }, + { + "epoch": 0.6, + "learning_rate": 1.8314790236494407e-06, + "loss": 1.0242, + "step": 19870 + }, + { + "epoch": 0.6, + "learning_rate": 1.8312439895497309e-06, + "loss": 1.069, + "step": 19871 + }, + { + "epoch": 0.6, + "learning_rate": 1.8310089618162553e-06, + "loss": 1.0868, + "step": 19872 + }, + { + "epoch": 0.6, + "learning_rate": 1.8307739404512526e-06, + "loss": 1.1796, + "step": 19873 + }, + { + "epoch": 0.6, + "learning_rate": 1.8305389254569594e-06, + "loss": 1.2183, + "step": 19874 + }, + { + "epoch": 0.6, + "learning_rate": 1.8303039168356144e-06, + "loss": 1.0625, + "step": 19875 + }, + { + "epoch": 0.6, + "learning_rate": 1.8300689145894523e-06, + "loss": 1.0726, + "step": 19876 + }, + { + "epoch": 0.6, + "learning_rate": 1.8298339187207116e-06, + "loss": 1.1098, + "step": 19877 + }, + { + "epoch": 0.6, + "learning_rate": 1.8295989292316293e-06, + "loss": 1.0068, + "step": 19878 + }, + { + "epoch": 0.6, + "learning_rate": 1.8293639461244428e-06, + "loss": 1.0712, + "step": 19879 + }, + { + "epoch": 0.6, + "learning_rate": 1.829128969401388e-06, + "loss": 1.1914, + "step": 19880 + }, + { + "epoch": 0.6, + "learning_rate": 1.8288939990647028e-06, + "loss": 1.2217, + "step": 19881 + }, + { + "epoch": 0.6, + "learning_rate": 1.828659035116623e-06, + "loss": 1.0304, + "step": 19882 + }, + { + "epoch": 0.6, + "learning_rate": 1.828424077559386e-06, + "loss": 1.0726, + "step": 19883 + }, + { + "epoch": 0.6, + "learning_rate": 1.828189126395229e-06, + "loss": 1.0176, + "step": 19884 + }, + { + "epoch": 0.6, + "learning_rate": 1.8279541816263868e-06, + "loss": 1.2953, + "step": 19885 + }, + { + "epoch": 0.6, + "learning_rate": 1.8277192432550976e-06, + "loss": 1.0952, + "step": 19886 + }, + { + "epoch": 0.6, + "learning_rate": 1.8274843112835975e-06, + "loss": 1.2147, + "step": 19887 + }, + { + "epoch": 0.6, + "learning_rate": 1.827249385714124e-06, + "loss": 1.1571, + "step": 19888 + }, + { + "epoch": 0.6, + "learning_rate": 1.8270144665489108e-06, + "loss": 0.9963, + "step": 19889 + }, + { + "epoch": 0.6, + "learning_rate": 1.826779553790196e-06, + "loss": 1.09, + "step": 19890 + }, + { + "epoch": 0.6, + "learning_rate": 1.8265446474402154e-06, + "loss": 1.0807, + "step": 19891 + }, + { + "epoch": 0.6, + "learning_rate": 1.826309747501207e-06, + "loss": 1.0657, + "step": 19892 + }, + { + "epoch": 0.6, + "learning_rate": 1.8260748539754037e-06, + "loss": 1.1951, + "step": 19893 + }, + { + "epoch": 0.6, + "learning_rate": 1.8258399668650437e-06, + "loss": 1.0937, + "step": 19894 + }, + { + "epoch": 0.6, + "learning_rate": 1.8256050861723623e-06, + "loss": 1.0955, + "step": 19895 + }, + { + "epoch": 0.6, + "learning_rate": 1.8253702118995955e-06, + "loss": 1.165, + "step": 19896 + }, + { + "epoch": 0.6, + "learning_rate": 1.8251353440489803e-06, + "loss": 1.1974, + "step": 19897 + }, + { + "epoch": 0.6, + "learning_rate": 1.8249004826227506e-06, + "loss": 1.1481, + "step": 19898 + }, + { + "epoch": 0.6, + "learning_rate": 1.8246656276231437e-06, + "loss": 1.0814, + "step": 19899 + }, + { + "epoch": 0.6, + "learning_rate": 1.8244307790523943e-06, + "loss": 1.032, + "step": 19900 + }, + { + "epoch": 0.6, + "learning_rate": 1.82419593691274e-06, + "loss": 1.1415, + "step": 19901 + }, + { + "epoch": 0.6, + "learning_rate": 1.8239611012064135e-06, + "loss": 1.0507, + "step": 19902 + }, + { + "epoch": 0.6, + "learning_rate": 1.823726271935652e-06, + "loss": 1.0953, + "step": 19903 + }, + { + "epoch": 0.6, + "learning_rate": 1.8234914491026902e-06, + "loss": 1.1796, + "step": 19904 + }, + { + "epoch": 0.6, + "learning_rate": 1.8232566327097655e-06, + "loss": 1.1277, + "step": 19905 + }, + { + "epoch": 0.6, + "learning_rate": 1.8230218227591106e-06, + "loss": 1.1268, + "step": 19906 + }, + { + "epoch": 0.6, + "learning_rate": 1.8227870192529617e-06, + "loss": 1.101, + "step": 19907 + }, + { + "epoch": 0.6, + "learning_rate": 1.8225522221935547e-06, + "loss": 1.1666, + "step": 19908 + }, + { + "epoch": 0.6, + "learning_rate": 1.8223174315831239e-06, + "loss": 1.0615, + "step": 19909 + }, + { + "epoch": 0.6, + "learning_rate": 1.822082647423905e-06, + "loss": 1.0641, + "step": 19910 + }, + { + "epoch": 0.6, + "learning_rate": 1.821847869718133e-06, + "loss": 1.233, + "step": 19911 + }, + { + "epoch": 0.6, + "learning_rate": 1.8216130984680422e-06, + "loss": 1.1423, + "step": 19912 + }, + { + "epoch": 0.6, + "learning_rate": 1.8213783336758678e-06, + "loss": 1.1627, + "step": 19913 + }, + { + "epoch": 0.6, + "learning_rate": 1.8211435753438465e-06, + "loss": 1.121, + "step": 19914 + }, + { + "epoch": 0.6, + "learning_rate": 1.82090882347421e-06, + "loss": 1.054, + "step": 19915 + }, + { + "epoch": 0.6, + "learning_rate": 1.8206740780691945e-06, + "loss": 1.123, + "step": 19916 + }, + { + "epoch": 0.6, + "learning_rate": 1.8204393391310344e-06, + "loss": 1.1771, + "step": 19917 + }, + { + "epoch": 0.6, + "learning_rate": 1.8202046066619655e-06, + "loss": 1.1347, + "step": 19918 + }, + { + "epoch": 0.6, + "learning_rate": 1.8199698806642207e-06, + "loss": 1.1284, + "step": 19919 + }, + { + "epoch": 0.6, + "learning_rate": 1.819735161140035e-06, + "loss": 1.2062, + "step": 19920 + }, + { + "epoch": 0.6, + "learning_rate": 1.8195004480916429e-06, + "loss": 1.0996, + "step": 19921 + }, + { + "epoch": 0.6, + "learning_rate": 1.8192657415212787e-06, + "loss": 1.1387, + "step": 19922 + }, + { + "epoch": 0.6, + "learning_rate": 1.8190310414311774e-06, + "loss": 1.0894, + "step": 19923 + }, + { + "epoch": 0.6, + "learning_rate": 1.818796347823572e-06, + "loss": 1.0775, + "step": 19924 + }, + { + "epoch": 0.6, + "learning_rate": 1.8185616607006973e-06, + "loss": 1.1882, + "step": 19925 + }, + { + "epoch": 0.6, + "learning_rate": 1.8183269800647873e-06, + "loss": 1.1122, + "step": 19926 + }, + { + "epoch": 0.6, + "learning_rate": 1.8180923059180774e-06, + "loss": 1.0231, + "step": 19927 + }, + { + "epoch": 0.6, + "learning_rate": 1.8178576382627994e-06, + "loss": 1.1058, + "step": 19928 + }, + { + "epoch": 0.6, + "learning_rate": 1.8176229771011878e-06, + "loss": 1.0843, + "step": 19929 + }, + { + "epoch": 0.6, + "learning_rate": 1.8173883224354772e-06, + "loss": 1.1053, + "step": 19930 + }, + { + "epoch": 0.6, + "learning_rate": 1.817153674267902e-06, + "loss": 1.1666, + "step": 19931 + }, + { + "epoch": 0.6, + "learning_rate": 1.8169190326006937e-06, + "loss": 1.1081, + "step": 19932 + }, + { + "epoch": 0.6, + "learning_rate": 1.816684397436087e-06, + "loss": 1.0461, + "step": 19933 + }, + { + "epoch": 0.6, + "learning_rate": 1.816449768776316e-06, + "loss": 1.0635, + "step": 19934 + }, + { + "epoch": 0.6, + "learning_rate": 1.8162151466236138e-06, + "loss": 1.0917, + "step": 19935 + }, + { + "epoch": 0.6, + "learning_rate": 1.815980530980215e-06, + "loss": 1.0925, + "step": 19936 + }, + { + "epoch": 0.6, + "learning_rate": 1.8157459218483514e-06, + "loss": 1.2339, + "step": 19937 + }, + { + "epoch": 0.6, + "learning_rate": 1.8155113192302571e-06, + "loss": 1.1699, + "step": 19938 + }, + { + "epoch": 0.6, + "learning_rate": 1.8152767231281654e-06, + "loss": 1.1711, + "step": 19939 + }, + { + "epoch": 0.6, + "learning_rate": 1.8150421335443106e-06, + "loss": 1.0911, + "step": 19940 + }, + { + "epoch": 0.6, + "learning_rate": 1.8148075504809238e-06, + "loss": 1.114, + "step": 19941 + }, + { + "epoch": 0.6, + "learning_rate": 1.814572973940239e-06, + "loss": 1.1096, + "step": 19942 + }, + { + "epoch": 0.6, + "learning_rate": 1.8143384039244892e-06, + "loss": 1.116, + "step": 19943 + }, + { + "epoch": 0.6, + "learning_rate": 1.814103840435909e-06, + "loss": 1.1222, + "step": 19944 + }, + { + "epoch": 0.6, + "learning_rate": 1.8138692834767285e-06, + "loss": 0.9872, + "step": 19945 + }, + { + "epoch": 0.6, + "learning_rate": 1.8136347330491821e-06, + "loss": 1.0497, + "step": 19946 + }, + { + "epoch": 0.6, + "learning_rate": 1.8134001891555026e-06, + "loss": 1.1102, + "step": 19947 + }, + { + "epoch": 0.6, + "learning_rate": 1.8131656517979223e-06, + "loss": 0.9819, + "step": 19948 + }, + { + "epoch": 0.6, + "learning_rate": 1.8129311209786748e-06, + "loss": 1.1503, + "step": 19949 + }, + { + "epoch": 0.6, + "learning_rate": 1.812696596699992e-06, + "loss": 1.0425, + "step": 19950 + }, + { + "epoch": 0.6, + "learning_rate": 1.8124620789641061e-06, + "loss": 1.1026, + "step": 19951 + }, + { + "epoch": 0.6, + "learning_rate": 1.812227567773251e-06, + "loss": 1.1876, + "step": 19952 + }, + { + "epoch": 0.6, + "learning_rate": 1.8119930631296582e-06, + "loss": 1.0204, + "step": 19953 + }, + { + "epoch": 0.6, + "learning_rate": 1.8117585650355594e-06, + "loss": 1.0471, + "step": 19954 + }, + { + "epoch": 0.6, + "learning_rate": 1.8115240734931874e-06, + "loss": 1.1448, + "step": 19955 + }, + { + "epoch": 0.6, + "learning_rate": 1.811289588504775e-06, + "loss": 0.9832, + "step": 19956 + }, + { + "epoch": 0.6, + "learning_rate": 1.8110551100725548e-06, + "loss": 1.1405, + "step": 19957 + }, + { + "epoch": 0.6, + "learning_rate": 1.8108206381987573e-06, + "loss": 1.15, + "step": 19958 + }, + { + "epoch": 0.6, + "learning_rate": 1.8105861728856152e-06, + "loss": 1.0006, + "step": 19959 + }, + { + "epoch": 0.6, + "learning_rate": 1.8103517141353608e-06, + "loss": 0.9826, + "step": 19960 + }, + { + "epoch": 0.6, + "learning_rate": 1.810117261950226e-06, + "loss": 1.2191, + "step": 19961 + }, + { + "epoch": 0.6, + "learning_rate": 1.809882816332443e-06, + "loss": 1.1671, + "step": 19962 + }, + { + "epoch": 0.6, + "learning_rate": 1.8096483772842433e-06, + "loss": 1.1222, + "step": 19963 + }, + { + "epoch": 0.6, + "learning_rate": 1.8094139448078578e-06, + "loss": 1.0743, + "step": 19964 + }, + { + "epoch": 0.6, + "learning_rate": 1.8091795189055195e-06, + "loss": 1.0598, + "step": 19965 + }, + { + "epoch": 0.6, + "learning_rate": 1.8089450995794594e-06, + "loss": 1.0972, + "step": 19966 + }, + { + "epoch": 0.6, + "learning_rate": 1.8087106868319091e-06, + "loss": 1.2065, + "step": 19967 + }, + { + "epoch": 0.6, + "learning_rate": 1.8084762806650999e-06, + "loss": 1.0562, + "step": 19968 + }, + { + "epoch": 0.6, + "learning_rate": 1.8082418810812636e-06, + "loss": 1.202, + "step": 19969 + }, + { + "epoch": 0.6, + "learning_rate": 1.808007488082632e-06, + "loss": 1.2052, + "step": 19970 + }, + { + "epoch": 0.6, + "learning_rate": 1.8077731016714354e-06, + "loss": 1.12, + "step": 19971 + }, + { + "epoch": 0.6, + "learning_rate": 1.8075387218499053e-06, + "loss": 1.1133, + "step": 19972 + }, + { + "epoch": 0.6, + "learning_rate": 1.8073043486202728e-06, + "loss": 1.0619, + "step": 19973 + }, + { + "epoch": 0.6, + "learning_rate": 1.8070699819847693e-06, + "loss": 1.0869, + "step": 19974 + }, + { + "epoch": 0.6, + "learning_rate": 1.8068356219456273e-06, + "loss": 1.2502, + "step": 19975 + }, + { + "epoch": 0.6, + "learning_rate": 1.8066012685050749e-06, + "loss": 1.1232, + "step": 19976 + }, + { + "epoch": 0.6, + "learning_rate": 1.8063669216653445e-06, + "loss": 1.0923, + "step": 19977 + }, + { + "epoch": 0.6, + "learning_rate": 1.8061325814286674e-06, + "loss": 1.0808, + "step": 19978 + }, + { + "epoch": 0.6, + "learning_rate": 1.8058982477972742e-06, + "loss": 1.1892, + "step": 19979 + }, + { + "epoch": 0.6, + "learning_rate": 1.8056639207733946e-06, + "loss": 1.0878, + "step": 19980 + }, + { + "epoch": 0.6, + "learning_rate": 1.8054296003592603e-06, + "loss": 1.1274, + "step": 19981 + }, + { + "epoch": 0.6, + "learning_rate": 1.8051952865571016e-06, + "loss": 1.1678, + "step": 19982 + }, + { + "epoch": 0.6, + "learning_rate": 1.8049609793691502e-06, + "loss": 1.0356, + "step": 19983 + }, + { + "epoch": 0.6, + "learning_rate": 1.8047266787976347e-06, + "loss": 0.9158, + "step": 19984 + }, + { + "epoch": 0.6, + "learning_rate": 1.804492384844786e-06, + "loss": 1.191, + "step": 19985 + }, + { + "epoch": 0.6, + "learning_rate": 1.8042580975128352e-06, + "loss": 1.0986, + "step": 19986 + }, + { + "epoch": 0.6, + "learning_rate": 1.804023816804012e-06, + "loss": 1.1691, + "step": 19987 + }, + { + "epoch": 0.6, + "learning_rate": 1.8037895427205478e-06, + "loss": 1.1005, + "step": 19988 + }, + { + "epoch": 0.6, + "learning_rate": 1.8035552752646712e-06, + "loss": 1.0938, + "step": 19989 + }, + { + "epoch": 0.6, + "learning_rate": 1.8033210144386127e-06, + "loss": 1.1456, + "step": 19990 + }, + { + "epoch": 0.6, + "learning_rate": 1.8030867602446026e-06, + "loss": 1.1761, + "step": 19991 + }, + { + "epoch": 0.6, + "learning_rate": 1.8028525126848715e-06, + "loss": 1.1002, + "step": 19992 + }, + { + "epoch": 0.6, + "learning_rate": 1.802618271761648e-06, + "loss": 1.1376, + "step": 19993 + }, + { + "epoch": 0.6, + "learning_rate": 1.8023840374771628e-06, + "loss": 1.1728, + "step": 19994 + }, + { + "epoch": 0.6, + "learning_rate": 1.802149809833646e-06, + "loss": 1.1602, + "step": 19995 + }, + { + "epoch": 0.6, + "learning_rate": 1.8019155888333274e-06, + "loss": 1.0687, + "step": 19996 + }, + { + "epoch": 0.6, + "learning_rate": 1.8016813744784354e-06, + "loss": 1.1523, + "step": 19997 + }, + { + "epoch": 0.6, + "learning_rate": 1.8014471667712002e-06, + "loss": 1.025, + "step": 19998 + }, + { + "epoch": 0.6, + "learning_rate": 1.8012129657138516e-06, + "loss": 1.2533, + "step": 19999 + }, + { + "epoch": 0.6, + "learning_rate": 1.8009787713086192e-06, + "loss": 1.1213, + "step": 20000 + }, + { + "epoch": 0.6, + "learning_rate": 1.800744583557733e-06, + "loss": 1.1194, + "step": 20001 + }, + { + "epoch": 0.6, + "learning_rate": 1.8005104024634206e-06, + "loss": 1.0847, + "step": 20002 + }, + { + "epoch": 0.6, + "learning_rate": 1.8002762280279126e-06, + "loss": 1.1537, + "step": 20003 + }, + { + "epoch": 0.6, + "learning_rate": 1.8000420602534378e-06, + "loss": 1.1457, + "step": 20004 + }, + { + "epoch": 0.6, + "learning_rate": 1.7998078991422258e-06, + "loss": 1.2397, + "step": 20005 + }, + { + "epoch": 0.6, + "learning_rate": 1.799573744696505e-06, + "loss": 1.147, + "step": 20006 + }, + { + "epoch": 0.6, + "learning_rate": 1.7993395969185047e-06, + "loss": 1.0157, + "step": 20007 + }, + { + "epoch": 0.6, + "learning_rate": 1.7991054558104539e-06, + "loss": 1.0848, + "step": 20008 + }, + { + "epoch": 0.6, + "learning_rate": 1.7988713213745828e-06, + "loss": 0.9249, + "step": 20009 + }, + { + "epoch": 0.6, + "learning_rate": 1.798637193613118e-06, + "loss": 1.3066, + "step": 20010 + }, + { + "epoch": 0.6, + "learning_rate": 1.7984030725282895e-06, + "loss": 1.0892, + "step": 20011 + }, + { + "epoch": 0.6, + "learning_rate": 1.7981689581223256e-06, + "loss": 1.1514, + "step": 20012 + }, + { + "epoch": 0.6, + "learning_rate": 1.7979348503974554e-06, + "loss": 1.1121, + "step": 20013 + }, + { + "epoch": 0.6, + "learning_rate": 1.7977007493559082e-06, + "loss": 1.1228, + "step": 20014 + }, + { + "epoch": 0.6, + "learning_rate": 1.7974666549999104e-06, + "loss": 1.0558, + "step": 20015 + }, + { + "epoch": 0.6, + "learning_rate": 1.797232567331692e-06, + "loss": 1.0118, + "step": 20016 + }, + { + "epoch": 0.6, + "learning_rate": 1.7969984863534812e-06, + "loss": 1.0948, + "step": 20017 + }, + { + "epoch": 0.6, + "learning_rate": 1.7967644120675066e-06, + "loss": 1.3743, + "step": 20018 + }, + { + "epoch": 0.6, + "learning_rate": 1.796530344475995e-06, + "loss": 1.0497, + "step": 20019 + }, + { + "epoch": 0.6, + "learning_rate": 1.7962962835811764e-06, + "loss": 1.1454, + "step": 20020 + }, + { + "epoch": 0.6, + "learning_rate": 1.7960622293852782e-06, + "loss": 1.1245, + "step": 20021 + }, + { + "epoch": 0.6, + "learning_rate": 1.7958281818905297e-06, + "loss": 1.0529, + "step": 20022 + }, + { + "epoch": 0.6, + "learning_rate": 1.7955941410991563e-06, + "loss": 1.2496, + "step": 20023 + }, + { + "epoch": 0.6, + "learning_rate": 1.7953601070133878e-06, + "loss": 1.2384, + "step": 20024 + }, + { + "epoch": 0.6, + "learning_rate": 1.7951260796354513e-06, + "loss": 0.9192, + "step": 20025 + }, + { + "epoch": 0.6, + "learning_rate": 1.7948920589675756e-06, + "loss": 1.0106, + "step": 20026 + }, + { + "epoch": 0.6, + "learning_rate": 1.7946580450119886e-06, + "loss": 1.2045, + "step": 20027 + }, + { + "epoch": 0.6, + "learning_rate": 1.7944240377709162e-06, + "loss": 1.2542, + "step": 20028 + }, + { + "epoch": 0.6, + "learning_rate": 1.7941900372465873e-06, + "loss": 1.1675, + "step": 20029 + }, + { + "epoch": 0.6, + "learning_rate": 1.7939560434412296e-06, + "loss": 1.0825, + "step": 20030 + }, + { + "epoch": 0.6, + "learning_rate": 1.7937220563570702e-06, + "loss": 0.9799, + "step": 20031 + }, + { + "epoch": 0.6, + "learning_rate": 1.7934880759963364e-06, + "loss": 1.1329, + "step": 20032 + }, + { + "epoch": 0.6, + "learning_rate": 1.793254102361256e-06, + "loss": 1.1906, + "step": 20033 + }, + { + "epoch": 0.6, + "learning_rate": 1.7930201354540566e-06, + "loss": 1.1116, + "step": 20034 + }, + { + "epoch": 0.6, + "learning_rate": 1.7927861752769651e-06, + "loss": 1.1352, + "step": 20035 + }, + { + "epoch": 0.6, + "learning_rate": 1.792552221832208e-06, + "loss": 1.1708, + "step": 20036 + }, + { + "epoch": 0.6, + "learning_rate": 1.792318275122013e-06, + "loss": 1.151, + "step": 20037 + }, + { + "epoch": 0.6, + "learning_rate": 1.7920843351486073e-06, + "loss": 1.0452, + "step": 20038 + }, + { + "epoch": 0.6, + "learning_rate": 1.7918504019142178e-06, + "loss": 1.1716, + "step": 20039 + }, + { + "epoch": 0.6, + "learning_rate": 1.7916164754210724e-06, + "loss": 1.0125, + "step": 20040 + }, + { + "epoch": 0.6, + "learning_rate": 1.791382555671396e-06, + "loss": 1.1174, + "step": 20041 + }, + { + "epoch": 0.6, + "learning_rate": 1.7911486426674164e-06, + "loss": 1.1636, + "step": 20042 + }, + { + "epoch": 0.6, + "learning_rate": 1.79091473641136e-06, + "loss": 1.1584, + "step": 20043 + }, + { + "epoch": 0.6, + "learning_rate": 1.7906808369054545e-06, + "loss": 1.1206, + "step": 20044 + }, + { + "epoch": 0.6, + "learning_rate": 1.790446944151926e-06, + "loss": 1.073, + "step": 20045 + }, + { + "epoch": 0.6, + "learning_rate": 1.7902130581530004e-06, + "loss": 1.0914, + "step": 20046 + }, + { + "epoch": 0.6, + "learning_rate": 1.7899791789109042e-06, + "loss": 1.0983, + "step": 20047 + }, + { + "epoch": 0.6, + "learning_rate": 1.789745306427865e-06, + "loss": 1.201, + "step": 20048 + }, + { + "epoch": 0.6, + "learning_rate": 1.7895114407061078e-06, + "loss": 1.1578, + "step": 20049 + }, + { + "epoch": 0.6, + "learning_rate": 1.7892775817478596e-06, + "loss": 0.9492, + "step": 20050 + }, + { + "epoch": 0.6, + "learning_rate": 1.7890437295553464e-06, + "loss": 1.2173, + "step": 20051 + }, + { + "epoch": 0.6, + "learning_rate": 1.788809884130796e-06, + "loss": 1.1174, + "step": 20052 + }, + { + "epoch": 0.6, + "learning_rate": 1.7885760454764316e-06, + "loss": 1.0229, + "step": 20053 + }, + { + "epoch": 0.6, + "learning_rate": 1.7883422135944806e-06, + "loss": 1.0797, + "step": 20054 + }, + { + "epoch": 0.6, + "learning_rate": 1.7881083884871691e-06, + "loss": 1.0804, + "step": 20055 + }, + { + "epoch": 0.6, + "learning_rate": 1.7878745701567226e-06, + "loss": 1.1874, + "step": 20056 + }, + { + "epoch": 0.6, + "learning_rate": 1.7876407586053684e-06, + "loss": 1.1908, + "step": 20057 + }, + { + "epoch": 0.6, + "learning_rate": 1.7874069538353303e-06, + "loss": 1.1255, + "step": 20058 + }, + { + "epoch": 0.6, + "learning_rate": 1.7871731558488345e-06, + "loss": 1.0368, + "step": 20059 + }, + { + "epoch": 0.6, + "learning_rate": 1.7869393646481071e-06, + "loss": 1.1204, + "step": 20060 + }, + { + "epoch": 0.6, + "learning_rate": 1.7867055802353738e-06, + "loss": 1.141, + "step": 20061 + }, + { + "epoch": 0.6, + "learning_rate": 1.7864718026128596e-06, + "loss": 1.1223, + "step": 20062 + }, + { + "epoch": 0.6, + "learning_rate": 1.7862380317827905e-06, + "loss": 1.1036, + "step": 20063 + }, + { + "epoch": 0.6, + "learning_rate": 1.786004267747391e-06, + "loss": 1.0153, + "step": 20064 + }, + { + "epoch": 0.6, + "learning_rate": 1.7857705105088882e-06, + "loss": 1.0723, + "step": 20065 + }, + { + "epoch": 0.6, + "learning_rate": 1.785536760069505e-06, + "loss": 1.0894, + "step": 20066 + }, + { + "epoch": 0.6, + "learning_rate": 1.785303016431468e-06, + "loss": 1.1023, + "step": 20067 + }, + { + "epoch": 0.6, + "learning_rate": 1.785069279597002e-06, + "loss": 1.0361, + "step": 20068 + }, + { + "epoch": 0.6, + "learning_rate": 1.7848355495683324e-06, + "loss": 1.0189, + "step": 20069 + }, + { + "epoch": 0.6, + "learning_rate": 1.7846018263476845e-06, + "loss": 1.2271, + "step": 20070 + }, + { + "epoch": 0.6, + "learning_rate": 1.7843681099372816e-06, + "loss": 1.1506, + "step": 20071 + }, + { + "epoch": 0.6, + "learning_rate": 1.7841344003393503e-06, + "loss": 1.1088, + "step": 20072 + }, + { + "epoch": 0.6, + "learning_rate": 1.783900697556114e-06, + "loss": 1.1296, + "step": 20073 + }, + { + "epoch": 0.6, + "learning_rate": 1.7836670015897988e-06, + "loss": 1.0932, + "step": 20074 + }, + { + "epoch": 0.6, + "learning_rate": 1.7834333124426284e-06, + "loss": 1.0684, + "step": 20075 + }, + { + "epoch": 0.6, + "learning_rate": 1.7831996301168277e-06, + "loss": 1.181, + "step": 20076 + }, + { + "epoch": 0.6, + "learning_rate": 1.7829659546146216e-06, + "loss": 1.0178, + "step": 20077 + }, + { + "epoch": 0.6, + "learning_rate": 1.7827322859382351e-06, + "loss": 1.0263, + "step": 20078 + }, + { + "epoch": 0.6, + "learning_rate": 1.7824986240898907e-06, + "loss": 1.1072, + "step": 20079 + }, + { + "epoch": 0.6, + "learning_rate": 1.7822649690718135e-06, + "loss": 1.2153, + "step": 20080 + }, + { + "epoch": 0.6, + "learning_rate": 1.782031320886229e-06, + "loss": 1.2266, + "step": 20081 + }, + { + "epoch": 0.6, + "learning_rate": 1.7817976795353597e-06, + "loss": 1.0706, + "step": 20082 + }, + { + "epoch": 0.61, + "learning_rate": 1.781564045021432e-06, + "loss": 1.149, + "step": 20083 + }, + { + "epoch": 0.61, + "learning_rate": 1.7813304173466674e-06, + "loss": 1.0936, + "step": 20084 + }, + { + "epoch": 0.61, + "learning_rate": 1.7810967965132914e-06, + "loss": 1.0762, + "step": 20085 + }, + { + "epoch": 0.61, + "learning_rate": 1.7808631825235274e-06, + "loss": 1.0901, + "step": 20086 + }, + { + "epoch": 0.61, + "learning_rate": 1.7806295753796e-06, + "loss": 1.2012, + "step": 20087 + }, + { + "epoch": 0.61, + "learning_rate": 1.7803959750837324e-06, + "loss": 1.077, + "step": 20088 + }, + { + "epoch": 0.61, + "learning_rate": 1.780162381638148e-06, + "loss": 1.1071, + "step": 20089 + }, + { + "epoch": 0.61, + "learning_rate": 1.7799287950450717e-06, + "loss": 1.1374, + "step": 20090 + }, + { + "epoch": 0.61, + "learning_rate": 1.7796952153067271e-06, + "loss": 0.9744, + "step": 20091 + }, + { + "epoch": 0.61, + "learning_rate": 1.7794616424253362e-06, + "loss": 1.1335, + "step": 20092 + }, + { + "epoch": 0.61, + "learning_rate": 1.7792280764031233e-06, + "loss": 1.0871, + "step": 20093 + }, + { + "epoch": 0.61, + "learning_rate": 1.7789945172423124e-06, + "loss": 1.0684, + "step": 20094 + }, + { + "epoch": 0.61, + "learning_rate": 1.778760964945126e-06, + "loss": 1.1111, + "step": 20095 + }, + { + "epoch": 0.61, + "learning_rate": 1.7785274195137893e-06, + "loss": 1.1359, + "step": 20096 + }, + { + "epoch": 0.61, + "learning_rate": 1.7782938809505224e-06, + "loss": 1.1425, + "step": 20097 + }, + { + "epoch": 0.61, + "learning_rate": 1.7780603492575503e-06, + "loss": 1.1142, + "step": 20098 + }, + { + "epoch": 0.61, + "learning_rate": 1.7778268244370966e-06, + "loss": 1.0266, + "step": 20099 + }, + { + "epoch": 0.61, + "learning_rate": 1.777593306491384e-06, + "loss": 1.1685, + "step": 20100 + }, + { + "epoch": 0.61, + "learning_rate": 1.7773597954226346e-06, + "loss": 1.0294, + "step": 20101 + }, + { + "epoch": 0.61, + "learning_rate": 1.7771262912330718e-06, + "loss": 1.1239, + "step": 20102 + }, + { + "epoch": 0.61, + "learning_rate": 1.7768927939249186e-06, + "loss": 1.0851, + "step": 20103 + }, + { + "epoch": 0.61, + "learning_rate": 1.7766593035003986e-06, + "loss": 1.1198, + "step": 20104 + }, + { + "epoch": 0.61, + "learning_rate": 1.7764258199617329e-06, + "loss": 1.1829, + "step": 20105 + }, + { + "epoch": 0.61, + "learning_rate": 1.776192343311145e-06, + "loss": 1.2559, + "step": 20106 + }, + { + "epoch": 0.61, + "learning_rate": 1.775958873550857e-06, + "loss": 1.0566, + "step": 20107 + }, + { + "epoch": 0.61, + "learning_rate": 1.7757254106830923e-06, + "loss": 1.1425, + "step": 20108 + }, + { + "epoch": 0.61, + "learning_rate": 1.7754919547100735e-06, + "loss": 0.9457, + "step": 20109 + }, + { + "epoch": 0.61, + "learning_rate": 1.7752585056340216e-06, + "loss": 1.1156, + "step": 20110 + }, + { + "epoch": 0.61, + "learning_rate": 1.7750250634571595e-06, + "loss": 1.1622, + "step": 20111 + }, + { + "epoch": 0.61, + "learning_rate": 1.7747916281817096e-06, + "loss": 0.9607, + "step": 20112 + }, + { + "epoch": 0.61, + "learning_rate": 1.7745581998098948e-06, + "loss": 1.0823, + "step": 20113 + }, + { + "epoch": 0.61, + "learning_rate": 1.774324778343936e-06, + "loss": 1.1738, + "step": 20114 + }, + { + "epoch": 0.61, + "learning_rate": 1.7740913637860557e-06, + "loss": 1.0475, + "step": 20115 + }, + { + "epoch": 0.61, + "learning_rate": 1.7738579561384761e-06, + "loss": 1.1296, + "step": 20116 + }, + { + "epoch": 0.61, + "learning_rate": 1.77362455540342e-06, + "loss": 1.0861, + "step": 20117 + }, + { + "epoch": 0.61, + "learning_rate": 1.7733911615831073e-06, + "loss": 1.2208, + "step": 20118 + }, + { + "epoch": 0.61, + "learning_rate": 1.773157774679761e-06, + "loss": 1.064, + "step": 20119 + }, + { + "epoch": 0.61, + "learning_rate": 1.7729243946956027e-06, + "loss": 1.1283, + "step": 20120 + }, + { + "epoch": 0.61, + "learning_rate": 1.7726910216328536e-06, + "loss": 1.12, + "step": 20121 + }, + { + "epoch": 0.61, + "learning_rate": 1.7724576554937368e-06, + "loss": 0.9951, + "step": 20122 + }, + { + "epoch": 0.61, + "learning_rate": 1.7722242962804717e-06, + "loss": 1.2339, + "step": 20123 + }, + { + "epoch": 0.61, + "learning_rate": 1.7719909439952809e-06, + "loss": 1.0972, + "step": 20124 + }, + { + "epoch": 0.61, + "learning_rate": 1.7717575986403858e-06, + "loss": 1.0711, + "step": 20125 + }, + { + "epoch": 0.61, + "learning_rate": 1.7715242602180077e-06, + "loss": 1.0701, + "step": 20126 + }, + { + "epoch": 0.61, + "learning_rate": 1.7712909287303675e-06, + "loss": 1.063, + "step": 20127 + }, + { + "epoch": 0.61, + "learning_rate": 1.7710576041796873e-06, + "loss": 1.0916, + "step": 20128 + }, + { + "epoch": 0.61, + "learning_rate": 1.7708242865681874e-06, + "loss": 1.0329, + "step": 20129 + }, + { + "epoch": 0.61, + "learning_rate": 1.7705909758980891e-06, + "loss": 1.1337, + "step": 20130 + }, + { + "epoch": 0.61, + "learning_rate": 1.7703576721716131e-06, + "loss": 1.2198, + "step": 20131 + }, + { + "epoch": 0.61, + "learning_rate": 1.7701243753909809e-06, + "loss": 1.0698, + "step": 20132 + }, + { + "epoch": 0.61, + "learning_rate": 1.7698910855584128e-06, + "loss": 1.1767, + "step": 20133 + }, + { + "epoch": 0.61, + "learning_rate": 1.7696578026761299e-06, + "loss": 1.1614, + "step": 20134 + }, + { + "epoch": 0.61, + "learning_rate": 1.7694245267463542e-06, + "loss": 0.9735, + "step": 20135 + }, + { + "epoch": 0.61, + "learning_rate": 1.7691912577713038e-06, + "loss": 1.1478, + "step": 20136 + }, + { + "epoch": 0.61, + "learning_rate": 1.768957995753201e-06, + "loss": 1.1613, + "step": 20137 + }, + { + "epoch": 0.61, + "learning_rate": 1.768724740694266e-06, + "loss": 1.1635, + "step": 20138 + }, + { + "epoch": 0.61, + "learning_rate": 1.7684914925967202e-06, + "loss": 1.0972, + "step": 20139 + }, + { + "epoch": 0.61, + "learning_rate": 1.768258251462782e-06, + "loss": 1.0757, + "step": 20140 + }, + { + "epoch": 0.61, + "learning_rate": 1.768025017294673e-06, + "loss": 1.0436, + "step": 20141 + }, + { + "epoch": 0.61, + "learning_rate": 1.767791790094613e-06, + "loss": 1.1481, + "step": 20142 + }, + { + "epoch": 0.61, + "learning_rate": 1.7675585698648234e-06, + "loss": 1.17, + "step": 20143 + }, + { + "epoch": 0.61, + "learning_rate": 1.7673253566075226e-06, + "loss": 1.0524, + "step": 20144 + }, + { + "epoch": 0.61, + "learning_rate": 1.7670921503249319e-06, + "loss": 1.0195, + "step": 20145 + }, + { + "epoch": 0.61, + "learning_rate": 1.7668589510192707e-06, + "loss": 1.0595, + "step": 20146 + }, + { + "epoch": 0.61, + "learning_rate": 1.7666257586927592e-06, + "loss": 1.119, + "step": 20147 + }, + { + "epoch": 0.61, + "learning_rate": 1.7663925733476183e-06, + "loss": 1.2543, + "step": 20148 + }, + { + "epoch": 0.61, + "learning_rate": 1.7661593949860662e-06, + "loss": 1.2253, + "step": 20149 + }, + { + "epoch": 0.61, + "learning_rate": 1.7659262236103224e-06, + "loss": 1.1647, + "step": 20150 + }, + { + "epoch": 0.61, + "learning_rate": 1.7656930592226079e-06, + "loss": 1.0472, + "step": 20151 + }, + { + "epoch": 0.61, + "learning_rate": 1.7654599018251429e-06, + "loss": 1.1239, + "step": 20152 + }, + { + "epoch": 0.61, + "learning_rate": 1.7652267514201449e-06, + "loss": 1.1552, + "step": 20153 + }, + { + "epoch": 0.61, + "learning_rate": 1.764993608009834e-06, + "loss": 1.1569, + "step": 20154 + }, + { + "epoch": 0.61, + "learning_rate": 1.76476047159643e-06, + "loss": 1.1062, + "step": 20155 + }, + { + "epoch": 0.61, + "learning_rate": 1.764527342182153e-06, + "loss": 1.1861, + "step": 20156 + }, + { + "epoch": 0.61, + "learning_rate": 1.764294219769221e-06, + "loss": 1.1324, + "step": 20157 + }, + { + "epoch": 0.61, + "learning_rate": 1.7640611043598536e-06, + "loss": 1.0588, + "step": 20158 + }, + { + "epoch": 0.61, + "learning_rate": 1.7638279959562699e-06, + "loss": 1.1172, + "step": 20159 + }, + { + "epoch": 0.61, + "learning_rate": 1.763594894560689e-06, + "loss": 0.9903, + "step": 20160 + }, + { + "epoch": 0.61, + "learning_rate": 1.7633618001753314e-06, + "loss": 1.2153, + "step": 20161 + }, + { + "epoch": 0.61, + "learning_rate": 1.7631287128024134e-06, + "loss": 1.079, + "step": 20162 + }, + { + "epoch": 0.61, + "learning_rate": 1.7628956324441554e-06, + "loss": 1.1052, + "step": 20163 + }, + { + "epoch": 0.61, + "learning_rate": 1.7626625591027757e-06, + "loss": 1.0496, + "step": 20164 + }, + { + "epoch": 0.61, + "learning_rate": 1.7624294927804946e-06, + "loss": 1.0941, + "step": 20165 + }, + { + "epoch": 0.61, + "learning_rate": 1.7621964334795286e-06, + "loss": 1.1921, + "step": 20166 + }, + { + "epoch": 0.61, + "learning_rate": 1.761963381202097e-06, + "loss": 1.1358, + "step": 20167 + }, + { + "epoch": 0.61, + "learning_rate": 1.7617303359504184e-06, + "loss": 1.0264, + "step": 20168 + }, + { + "epoch": 0.61, + "learning_rate": 1.7614972977267122e-06, + "loss": 1.0682, + "step": 20169 + }, + { + "epoch": 0.61, + "learning_rate": 1.7612642665331955e-06, + "loss": 1.1167, + "step": 20170 + }, + { + "epoch": 0.61, + "learning_rate": 1.7610312423720872e-06, + "loss": 1.1274, + "step": 20171 + }, + { + "epoch": 0.61, + "learning_rate": 1.7607982252456056e-06, + "loss": 1.0452, + "step": 20172 + }, + { + "epoch": 0.61, + "learning_rate": 1.7605652151559689e-06, + "loss": 1.1003, + "step": 20173 + }, + { + "epoch": 0.61, + "learning_rate": 1.7603322121053962e-06, + "loss": 1.046, + "step": 20174 + }, + { + "epoch": 0.61, + "learning_rate": 1.7600992160961033e-06, + "loss": 1.0183, + "step": 20175 + }, + { + "epoch": 0.61, + "learning_rate": 1.75986622713031e-06, + "loss": 1.1202, + "step": 20176 + }, + { + "epoch": 0.61, + "learning_rate": 1.7596332452102332e-06, + "loss": 1.0506, + "step": 20177 + }, + { + "epoch": 0.61, + "learning_rate": 1.759400270338093e-06, + "loss": 1.1081, + "step": 20178 + }, + { + "epoch": 0.61, + "learning_rate": 1.7591673025161042e-06, + "loss": 1.1375, + "step": 20179 + }, + { + "epoch": 0.61, + "learning_rate": 1.7589343417464856e-06, + "loss": 1.0924, + "step": 20180 + }, + { + "epoch": 0.61, + "learning_rate": 1.7587013880314558e-06, + "loss": 1.1103, + "step": 20181 + }, + { + "epoch": 0.61, + "learning_rate": 1.7584684413732317e-06, + "loss": 1.1449, + "step": 20182 + }, + { + "epoch": 0.61, + "learning_rate": 1.7582355017740304e-06, + "loss": 1.0456, + "step": 20183 + }, + { + "epoch": 0.61, + "learning_rate": 1.7580025692360702e-06, + "loss": 1.0999, + "step": 20184 + }, + { + "epoch": 0.61, + "learning_rate": 1.7577696437615682e-06, + "loss": 1.0911, + "step": 20185 + }, + { + "epoch": 0.61, + "learning_rate": 1.7575367253527414e-06, + "loss": 1.1414, + "step": 20186 + }, + { + "epoch": 0.61, + "learning_rate": 1.7573038140118087e-06, + "loss": 1.2897, + "step": 20187 + }, + { + "epoch": 0.61, + "learning_rate": 1.757070909740985e-06, + "loss": 1.107, + "step": 20188 + }, + { + "epoch": 0.61, + "learning_rate": 1.7568380125424883e-06, + "loss": 1.2739, + "step": 20189 + }, + { + "epoch": 0.61, + "learning_rate": 1.7566051224185357e-06, + "loss": 1.0771, + "step": 20190 + }, + { + "epoch": 0.61, + "learning_rate": 1.7563722393713456e-06, + "loss": 1.2247, + "step": 20191 + }, + { + "epoch": 0.61, + "learning_rate": 1.7561393634031324e-06, + "loss": 1.1463, + "step": 20192 + }, + { + "epoch": 0.61, + "learning_rate": 1.7559064945161142e-06, + "loss": 1.0013, + "step": 20193 + }, + { + "epoch": 0.61, + "learning_rate": 1.7556736327125079e-06, + "loss": 1.2675, + "step": 20194 + }, + { + "epoch": 0.61, + "learning_rate": 1.7554407779945304e-06, + "loss": 1.0573, + "step": 20195 + }, + { + "epoch": 0.61, + "learning_rate": 1.755207930364398e-06, + "loss": 1.0101, + "step": 20196 + }, + { + "epoch": 0.61, + "learning_rate": 1.7549750898243273e-06, + "loss": 1.1189, + "step": 20197 + }, + { + "epoch": 0.61, + "learning_rate": 1.7547422563765346e-06, + "loss": 1.1104, + "step": 20198 + }, + { + "epoch": 0.61, + "learning_rate": 1.7545094300232373e-06, + "loss": 1.1859, + "step": 20199 + }, + { + "epoch": 0.61, + "learning_rate": 1.7542766107666514e-06, + "loss": 1.0421, + "step": 20200 + }, + { + "epoch": 0.61, + "learning_rate": 1.7540437986089925e-06, + "loss": 1.1125, + "step": 20201 + }, + { + "epoch": 0.61, + "learning_rate": 1.7538109935524772e-06, + "loss": 1.0606, + "step": 20202 + }, + { + "epoch": 0.61, + "learning_rate": 1.753578195599322e-06, + "loss": 1.0841, + "step": 20203 + }, + { + "epoch": 0.61, + "learning_rate": 1.753345404751744e-06, + "loss": 0.9877, + "step": 20204 + }, + { + "epoch": 0.61, + "learning_rate": 1.753112621011957e-06, + "loss": 1.1541, + "step": 20205 + }, + { + "epoch": 0.61, + "learning_rate": 1.7528798443821782e-06, + "loss": 1.1722, + "step": 20206 + }, + { + "epoch": 0.61, + "learning_rate": 1.7526470748646231e-06, + "loss": 1.1609, + "step": 20207 + }, + { + "epoch": 0.61, + "learning_rate": 1.7524143124615088e-06, + "loss": 1.1108, + "step": 20208 + }, + { + "epoch": 0.61, + "learning_rate": 1.7521815571750494e-06, + "loss": 1.0745, + "step": 20209 + }, + { + "epoch": 0.61, + "learning_rate": 1.7519488090074622e-06, + "loss": 1.2244, + "step": 20210 + }, + { + "epoch": 0.61, + "learning_rate": 1.7517160679609615e-06, + "loss": 1.0923, + "step": 20211 + }, + { + "epoch": 0.61, + "learning_rate": 1.7514833340377635e-06, + "loss": 1.2546, + "step": 20212 + }, + { + "epoch": 0.61, + "learning_rate": 1.751250607240084e-06, + "loss": 1.134, + "step": 20213 + }, + { + "epoch": 0.61, + "learning_rate": 1.7510178875701377e-06, + "loss": 1.109, + "step": 20214 + }, + { + "epoch": 0.61, + "learning_rate": 1.7507851750301401e-06, + "loss": 1.1544, + "step": 20215 + }, + { + "epoch": 0.61, + "learning_rate": 1.7505524696223071e-06, + "loss": 1.1405, + "step": 20216 + }, + { + "epoch": 0.61, + "learning_rate": 1.7503197713488548e-06, + "loss": 1.2814, + "step": 20217 + }, + { + "epoch": 0.61, + "learning_rate": 1.7500870802119962e-06, + "loss": 1.0562, + "step": 20218 + }, + { + "epoch": 0.61, + "learning_rate": 1.7498543962139469e-06, + "loss": 1.0485, + "step": 20219 + }, + { + "epoch": 0.61, + "learning_rate": 1.7496217193569232e-06, + "loss": 1.1251, + "step": 20220 + }, + { + "epoch": 0.61, + "learning_rate": 1.7493890496431397e-06, + "loss": 1.195, + "step": 20221 + }, + { + "epoch": 0.61, + "learning_rate": 1.7491563870748102e-06, + "loss": 1.0358, + "step": 20222 + }, + { + "epoch": 0.61, + "learning_rate": 1.74892373165415e-06, + "loss": 1.0673, + "step": 20223 + }, + { + "epoch": 0.61, + "learning_rate": 1.7486910833833748e-06, + "loss": 1.1752, + "step": 20224 + }, + { + "epoch": 0.61, + "learning_rate": 1.748458442264699e-06, + "loss": 1.0399, + "step": 20225 + }, + { + "epoch": 0.61, + "learning_rate": 1.748225808300336e-06, + "loss": 1.1281, + "step": 20226 + }, + { + "epoch": 0.61, + "learning_rate": 1.7479931814925011e-06, + "loss": 1.2013, + "step": 20227 + }, + { + "epoch": 0.61, + "learning_rate": 1.7477605618434093e-06, + "loss": 1.1215, + "step": 20228 + }, + { + "epoch": 0.61, + "learning_rate": 1.7475279493552747e-06, + "loss": 1.1946, + "step": 20229 + }, + { + "epoch": 0.61, + "learning_rate": 1.7472953440303126e-06, + "loss": 1.0787, + "step": 20230 + }, + { + "epoch": 0.61, + "learning_rate": 1.747062745870735e-06, + "loss": 1.2128, + "step": 20231 + }, + { + "epoch": 0.61, + "learning_rate": 1.7468301548787576e-06, + "loss": 1.0733, + "step": 20232 + }, + { + "epoch": 0.61, + "learning_rate": 1.7465975710565946e-06, + "loss": 1.1057, + "step": 20233 + }, + { + "epoch": 0.61, + "learning_rate": 1.7463649944064606e-06, + "loss": 1.1359, + "step": 20234 + }, + { + "epoch": 0.61, + "learning_rate": 1.7461324249305677e-06, + "loss": 1.0006, + "step": 20235 + }, + { + "epoch": 0.61, + "learning_rate": 1.7458998626311317e-06, + "loss": 1.2484, + "step": 20236 + }, + { + "epoch": 0.61, + "learning_rate": 1.7456673075103653e-06, + "loss": 0.9534, + "step": 20237 + }, + { + "epoch": 0.61, + "learning_rate": 1.7454347595704835e-06, + "loss": 1.0474, + "step": 20238 + }, + { + "epoch": 0.61, + "learning_rate": 1.7452022188136988e-06, + "loss": 1.2321, + "step": 20239 + }, + { + "epoch": 0.61, + "learning_rate": 1.7449696852422254e-06, + "loss": 1.0316, + "step": 20240 + }, + { + "epoch": 0.61, + "learning_rate": 1.7447371588582774e-06, + "loss": 1.1091, + "step": 20241 + }, + { + "epoch": 0.61, + "learning_rate": 1.7445046396640675e-06, + "loss": 1.0366, + "step": 20242 + }, + { + "epoch": 0.61, + "learning_rate": 1.7442721276618105e-06, + "loss": 1.1499, + "step": 20243 + }, + { + "epoch": 0.61, + "learning_rate": 1.7440396228537183e-06, + "loss": 1.1652, + "step": 20244 + }, + { + "epoch": 0.61, + "learning_rate": 1.7438071252420041e-06, + "loss": 1.1909, + "step": 20245 + }, + { + "epoch": 0.61, + "learning_rate": 1.7435746348288823e-06, + "loss": 1.0298, + "step": 20246 + }, + { + "epoch": 0.61, + "learning_rate": 1.743342151616567e-06, + "loss": 1.0809, + "step": 20247 + }, + { + "epoch": 0.61, + "learning_rate": 1.7431096756072686e-06, + "loss": 1.1656, + "step": 20248 + }, + { + "epoch": 0.61, + "learning_rate": 1.7428772068032015e-06, + "loss": 1.1534, + "step": 20249 + }, + { + "epoch": 0.61, + "learning_rate": 1.7426447452065787e-06, + "loss": 1.1778, + "step": 20250 + }, + { + "epoch": 0.61, + "learning_rate": 1.742412290819614e-06, + "loss": 1.1065, + "step": 20251 + }, + { + "epoch": 0.61, + "learning_rate": 1.7421798436445187e-06, + "loss": 1.2784, + "step": 20252 + }, + { + "epoch": 0.61, + "learning_rate": 1.7419474036835066e-06, + "loss": 1.1086, + "step": 20253 + }, + { + "epoch": 0.61, + "learning_rate": 1.7417149709387898e-06, + "loss": 1.1354, + "step": 20254 + }, + { + "epoch": 0.61, + "learning_rate": 1.7414825454125811e-06, + "loss": 1.1271, + "step": 20255 + }, + { + "epoch": 0.61, + "learning_rate": 1.7412501271070948e-06, + "loss": 1.2703, + "step": 20256 + }, + { + "epoch": 0.61, + "learning_rate": 1.7410177160245407e-06, + "loss": 1.072, + "step": 20257 + }, + { + "epoch": 0.61, + "learning_rate": 1.7407853121671319e-06, + "loss": 1.0333, + "step": 20258 + }, + { + "epoch": 0.61, + "learning_rate": 1.740552915537082e-06, + "loss": 1.0751, + "step": 20259 + }, + { + "epoch": 0.61, + "learning_rate": 1.740320526136603e-06, + "loss": 1.1567, + "step": 20260 + }, + { + "epoch": 0.61, + "learning_rate": 1.7400881439679062e-06, + "loss": 1.1755, + "step": 20261 + }, + { + "epoch": 0.61, + "learning_rate": 1.7398557690332041e-06, + "loss": 1.1356, + "step": 20262 + }, + { + "epoch": 0.61, + "learning_rate": 1.7396234013347088e-06, + "loss": 1.0747, + "step": 20263 + }, + { + "epoch": 0.61, + "learning_rate": 1.739391040874633e-06, + "loss": 1.0604, + "step": 20264 + }, + { + "epoch": 0.61, + "learning_rate": 1.739158687655188e-06, + "loss": 1.0441, + "step": 20265 + }, + { + "epoch": 0.61, + "learning_rate": 1.7389263416785856e-06, + "loss": 1.0993, + "step": 20266 + }, + { + "epoch": 0.61, + "learning_rate": 1.738694002947038e-06, + "loss": 1.0006, + "step": 20267 + }, + { + "epoch": 0.61, + "learning_rate": 1.7384616714627567e-06, + "loss": 1.1021, + "step": 20268 + }, + { + "epoch": 0.61, + "learning_rate": 1.7382293472279545e-06, + "loss": 1.0762, + "step": 20269 + }, + { + "epoch": 0.61, + "learning_rate": 1.7379970302448412e-06, + "loss": 1.0817, + "step": 20270 + }, + { + "epoch": 0.61, + "learning_rate": 1.7377647205156292e-06, + "loss": 1.0563, + "step": 20271 + }, + { + "epoch": 0.61, + "learning_rate": 1.73753241804253e-06, + "loss": 1.0995, + "step": 20272 + }, + { + "epoch": 0.61, + "learning_rate": 1.7373001228277558e-06, + "loss": 1.2306, + "step": 20273 + }, + { + "epoch": 0.61, + "learning_rate": 1.737067834873516e-06, + "loss": 1.2653, + "step": 20274 + }, + { + "epoch": 0.61, + "learning_rate": 1.7368355541820232e-06, + "loss": 1.0119, + "step": 20275 + }, + { + "epoch": 0.61, + "learning_rate": 1.7366032807554884e-06, + "loss": 1.1311, + "step": 20276 + }, + { + "epoch": 0.61, + "learning_rate": 1.736371014596123e-06, + "loss": 1.1301, + "step": 20277 + }, + { + "epoch": 0.61, + "learning_rate": 1.7361387557061371e-06, + "loss": 1.0955, + "step": 20278 + }, + { + "epoch": 0.61, + "learning_rate": 1.7359065040877427e-06, + "loss": 1.1589, + "step": 20279 + }, + { + "epoch": 0.61, + "learning_rate": 1.7356742597431504e-06, + "loss": 1.2642, + "step": 20280 + }, + { + "epoch": 0.61, + "learning_rate": 1.7354420226745714e-06, + "loss": 1.1, + "step": 20281 + }, + { + "epoch": 0.61, + "learning_rate": 1.735209792884216e-06, + "loss": 1.1569, + "step": 20282 + }, + { + "epoch": 0.61, + "learning_rate": 1.734977570374295e-06, + "loss": 1.0859, + "step": 20283 + }, + { + "epoch": 0.61, + "learning_rate": 1.7347453551470186e-06, + "loss": 1.112, + "step": 20284 + }, + { + "epoch": 0.61, + "learning_rate": 1.7345131472045979e-06, + "loss": 1.158, + "step": 20285 + }, + { + "epoch": 0.61, + "learning_rate": 1.7342809465492447e-06, + "loss": 1.1807, + "step": 20286 + }, + { + "epoch": 0.61, + "learning_rate": 1.7340487531831668e-06, + "loss": 1.1459, + "step": 20287 + }, + { + "epoch": 0.61, + "learning_rate": 1.733816567108576e-06, + "loss": 1.0859, + "step": 20288 + }, + { + "epoch": 0.61, + "learning_rate": 1.7335843883276827e-06, + "loss": 1.2144, + "step": 20289 + }, + { + "epoch": 0.61, + "learning_rate": 1.7333522168426969e-06, + "loss": 1.0435, + "step": 20290 + }, + { + "epoch": 0.61, + "learning_rate": 1.7331200526558285e-06, + "loss": 1.0164, + "step": 20291 + }, + { + "epoch": 0.61, + "learning_rate": 1.7328878957692884e-06, + "loss": 1.1898, + "step": 20292 + }, + { + "epoch": 0.61, + "learning_rate": 1.7326557461852856e-06, + "loss": 1.123, + "step": 20293 + }, + { + "epoch": 0.61, + "learning_rate": 1.7324236039060306e-06, + "loss": 1.1381, + "step": 20294 + }, + { + "epoch": 0.61, + "learning_rate": 1.7321914689337332e-06, + "loss": 1.1229, + "step": 20295 + }, + { + "epoch": 0.61, + "learning_rate": 1.7319593412706032e-06, + "loss": 1.1104, + "step": 20296 + }, + { + "epoch": 0.61, + "learning_rate": 1.7317272209188505e-06, + "loss": 1.1221, + "step": 20297 + }, + { + "epoch": 0.61, + "learning_rate": 1.731495107880684e-06, + "loss": 1.1022, + "step": 20298 + }, + { + "epoch": 0.61, + "learning_rate": 1.7312630021583156e-06, + "loss": 1.1568, + "step": 20299 + }, + { + "epoch": 0.61, + "learning_rate": 1.7310309037539519e-06, + "loss": 0.9467, + "step": 20300 + }, + { + "epoch": 0.61, + "learning_rate": 1.730798812669804e-06, + "loss": 1.1472, + "step": 20301 + }, + { + "epoch": 0.61, + "learning_rate": 1.7305667289080805e-06, + "loss": 1.0687, + "step": 20302 + }, + { + "epoch": 0.61, + "learning_rate": 1.7303346524709924e-06, + "loss": 1.069, + "step": 20303 + }, + { + "epoch": 0.61, + "learning_rate": 1.7301025833607466e-06, + "loss": 1.0685, + "step": 20304 + }, + { + "epoch": 0.61, + "learning_rate": 1.7298705215795535e-06, + "loss": 1.1619, + "step": 20305 + }, + { + "epoch": 0.61, + "learning_rate": 1.7296384671296221e-06, + "loss": 1.1852, + "step": 20306 + }, + { + "epoch": 0.61, + "learning_rate": 1.7294064200131615e-06, + "loss": 1.1224, + "step": 20307 + }, + { + "epoch": 0.61, + "learning_rate": 1.729174380232381e-06, + "loss": 1.2053, + "step": 20308 + }, + { + "epoch": 0.61, + "learning_rate": 1.728942347789489e-06, + "loss": 1.207, + "step": 20309 + }, + { + "epoch": 0.61, + "learning_rate": 1.728710322686694e-06, + "loss": 1.2074, + "step": 20310 + }, + { + "epoch": 0.61, + "learning_rate": 1.7284783049262055e-06, + "loss": 1.0844, + "step": 20311 + }, + { + "epoch": 0.61, + "learning_rate": 1.728246294510233e-06, + "loss": 1.0509, + "step": 20312 + }, + { + "epoch": 0.61, + "learning_rate": 1.728014291440983e-06, + "loss": 1.0944, + "step": 20313 + }, + { + "epoch": 0.61, + "learning_rate": 1.7277822957206652e-06, + "loss": 1.1445, + "step": 20314 + }, + { + "epoch": 0.61, + "learning_rate": 1.7275503073514882e-06, + "loss": 1.1318, + "step": 20315 + }, + { + "epoch": 0.61, + "learning_rate": 1.7273183263356613e-06, + "loss": 1.0712, + "step": 20316 + }, + { + "epoch": 0.61, + "learning_rate": 1.7270863526753906e-06, + "loss": 1.3031, + "step": 20317 + }, + { + "epoch": 0.61, + "learning_rate": 1.7268543863728854e-06, + "loss": 1.0551, + "step": 20318 + }, + { + "epoch": 0.61, + "learning_rate": 1.7266224274303544e-06, + "loss": 1.0959, + "step": 20319 + }, + { + "epoch": 0.61, + "learning_rate": 1.726390475850005e-06, + "loss": 1.11, + "step": 20320 + }, + { + "epoch": 0.61, + "learning_rate": 1.7261585316340468e-06, + "loss": 1.2643, + "step": 20321 + }, + { + "epoch": 0.61, + "learning_rate": 1.7259265947846856e-06, + "loss": 1.0574, + "step": 20322 + }, + { + "epoch": 0.61, + "learning_rate": 1.7256946653041306e-06, + "loss": 1.2032, + "step": 20323 + }, + { + "epoch": 0.61, + "learning_rate": 1.7254627431945898e-06, + "loss": 1.1876, + "step": 20324 + }, + { + "epoch": 0.61, + "learning_rate": 1.7252308284582713e-06, + "loss": 1.1813, + "step": 20325 + }, + { + "epoch": 0.61, + "learning_rate": 1.724998921097381e-06, + "loss": 1.0862, + "step": 20326 + }, + { + "epoch": 0.61, + "learning_rate": 1.7247670211141283e-06, + "loss": 1.124, + "step": 20327 + }, + { + "epoch": 0.61, + "learning_rate": 1.7245351285107197e-06, + "loss": 1.0413, + "step": 20328 + }, + { + "epoch": 0.61, + "learning_rate": 1.7243032432893644e-06, + "loss": 1.1553, + "step": 20329 + }, + { + "epoch": 0.61, + "learning_rate": 1.7240713654522675e-06, + "loss": 1.0948, + "step": 20330 + }, + { + "epoch": 0.61, + "learning_rate": 1.7238394950016377e-06, + "loss": 1.3054, + "step": 20331 + }, + { + "epoch": 0.61, + "learning_rate": 1.723607631939682e-06, + "loss": 1.1418, + "step": 20332 + }, + { + "epoch": 0.61, + "learning_rate": 1.7233757762686076e-06, + "loss": 1.0972, + "step": 20333 + }, + { + "epoch": 0.61, + "learning_rate": 1.7231439279906227e-06, + "loss": 1.0348, + "step": 20334 + }, + { + "epoch": 0.61, + "learning_rate": 1.7229120871079325e-06, + "loss": 1.1414, + "step": 20335 + }, + { + "epoch": 0.61, + "learning_rate": 1.7226802536227449e-06, + "loss": 1.0862, + "step": 20336 + }, + { + "epoch": 0.61, + "learning_rate": 1.722448427537267e-06, + "loss": 1.1132, + "step": 20337 + }, + { + "epoch": 0.61, + "learning_rate": 1.722216608853707e-06, + "loss": 1.0273, + "step": 20338 + }, + { + "epoch": 0.61, + "learning_rate": 1.721984797574269e-06, + "loss": 1.0498, + "step": 20339 + }, + { + "epoch": 0.61, + "learning_rate": 1.7217529937011612e-06, + "loss": 1.1033, + "step": 20340 + }, + { + "epoch": 0.61, + "learning_rate": 1.7215211972365897e-06, + "loss": 1.1017, + "step": 20341 + }, + { + "epoch": 0.61, + "learning_rate": 1.7212894081827627e-06, + "loss": 1.1797, + "step": 20342 + }, + { + "epoch": 0.61, + "learning_rate": 1.7210576265418846e-06, + "loss": 1.2015, + "step": 20343 + }, + { + "epoch": 0.61, + "learning_rate": 1.7208258523161625e-06, + "loss": 1.1046, + "step": 20344 + }, + { + "epoch": 0.61, + "learning_rate": 1.7205940855078032e-06, + "loss": 1.1667, + "step": 20345 + }, + { + "epoch": 0.61, + "learning_rate": 1.7203623261190128e-06, + "loss": 1.1823, + "step": 20346 + }, + { + "epoch": 0.61, + "learning_rate": 1.720130574151998e-06, + "loss": 1.248, + "step": 20347 + }, + { + "epoch": 0.61, + "learning_rate": 1.719898829608964e-06, + "loss": 1.0759, + "step": 20348 + }, + { + "epoch": 0.61, + "learning_rate": 1.7196670924921178e-06, + "loss": 1.1426, + "step": 20349 + }, + { + "epoch": 0.61, + "learning_rate": 1.7194353628036648e-06, + "loss": 1.1287, + "step": 20350 + }, + { + "epoch": 0.61, + "learning_rate": 1.719203640545812e-06, + "loss": 1.2123, + "step": 20351 + }, + { + "epoch": 0.61, + "learning_rate": 1.7189719257207637e-06, + "loss": 1.1437, + "step": 20352 + }, + { + "epoch": 0.61, + "learning_rate": 1.7187402183307267e-06, + "loss": 1.1059, + "step": 20353 + }, + { + "epoch": 0.61, + "learning_rate": 1.7185085183779062e-06, + "loss": 1.1215, + "step": 20354 + }, + { + "epoch": 0.61, + "learning_rate": 1.7182768258645094e-06, + "loss": 1.0715, + "step": 20355 + }, + { + "epoch": 0.61, + "learning_rate": 1.7180451407927398e-06, + "loss": 1.2017, + "step": 20356 + }, + { + "epoch": 0.61, + "learning_rate": 1.7178134631648035e-06, + "loss": 1.0624, + "step": 20357 + }, + { + "epoch": 0.61, + "learning_rate": 1.7175817929829069e-06, + "loss": 1.1011, + "step": 20358 + }, + { + "epoch": 0.61, + "learning_rate": 1.7173501302492545e-06, + "loss": 1.0983, + "step": 20359 + }, + { + "epoch": 0.61, + "learning_rate": 1.7171184749660524e-06, + "loss": 1.0333, + "step": 20360 + }, + { + "epoch": 0.61, + "learning_rate": 1.716886827135505e-06, + "loss": 1.1681, + "step": 20361 + }, + { + "epoch": 0.61, + "learning_rate": 1.7166551867598174e-06, + "loss": 1.2614, + "step": 20362 + }, + { + "epoch": 0.61, + "learning_rate": 1.7164235538411956e-06, + "loss": 1.1542, + "step": 20363 + }, + { + "epoch": 0.61, + "learning_rate": 1.7161919283818451e-06, + "loss": 0.9973, + "step": 20364 + }, + { + "epoch": 0.61, + "learning_rate": 1.715960310383969e-06, + "loss": 1.0278, + "step": 20365 + }, + { + "epoch": 0.61, + "learning_rate": 1.715728699849773e-06, + "loss": 1.035, + "step": 20366 + }, + { + "epoch": 0.61, + "learning_rate": 1.7154970967814622e-06, + "loss": 1.1454, + "step": 20367 + }, + { + "epoch": 0.61, + "learning_rate": 1.715265501181242e-06, + "loss": 1.1696, + "step": 20368 + }, + { + "epoch": 0.61, + "learning_rate": 1.7150339130513156e-06, + "loss": 1.159, + "step": 20369 + }, + { + "epoch": 0.61, + "learning_rate": 1.7148023323938878e-06, + "loss": 1.0424, + "step": 20370 + }, + { + "epoch": 0.61, + "learning_rate": 1.7145707592111638e-06, + "loss": 1.094, + "step": 20371 + }, + { + "epoch": 0.61, + "learning_rate": 1.7143391935053483e-06, + "loss": 1.0916, + "step": 20372 + }, + { + "epoch": 0.61, + "learning_rate": 1.7141076352786453e-06, + "loss": 1.039, + "step": 20373 + }, + { + "epoch": 0.61, + "learning_rate": 1.7138760845332588e-06, + "loss": 1.0764, + "step": 20374 + }, + { + "epoch": 0.61, + "learning_rate": 1.7136445412713943e-06, + "loss": 1.1531, + "step": 20375 + }, + { + "epoch": 0.61, + "learning_rate": 1.7134130054952538e-06, + "loss": 1.0704, + "step": 20376 + }, + { + "epoch": 0.61, + "learning_rate": 1.7131814772070437e-06, + "loss": 1.2103, + "step": 20377 + }, + { + "epoch": 0.61, + "learning_rate": 1.7129499564089662e-06, + "loss": 1.2084, + "step": 20378 + }, + { + "epoch": 0.61, + "learning_rate": 1.7127184431032262e-06, + "loss": 1.1597, + "step": 20379 + }, + { + "epoch": 0.61, + "learning_rate": 1.7124869372920272e-06, + "loss": 1.0678, + "step": 20380 + }, + { + "epoch": 0.61, + "learning_rate": 1.7122554389775747e-06, + "loss": 1.0387, + "step": 20381 + }, + { + "epoch": 0.61, + "learning_rate": 1.71202394816207e-06, + "loss": 1.0276, + "step": 20382 + }, + { + "epoch": 0.61, + "learning_rate": 1.7117924648477174e-06, + "loss": 1.1099, + "step": 20383 + }, + { + "epoch": 0.61, + "learning_rate": 1.711560989036721e-06, + "loss": 1.1646, + "step": 20384 + }, + { + "epoch": 0.61, + "learning_rate": 1.7113295207312844e-06, + "loss": 1.129, + "step": 20385 + }, + { + "epoch": 0.61, + "learning_rate": 1.7110980599336119e-06, + "loss": 1.2493, + "step": 20386 + }, + { + "epoch": 0.61, + "learning_rate": 1.7108666066459052e-06, + "loss": 1.1077, + "step": 20387 + }, + { + "epoch": 0.61, + "learning_rate": 1.7106351608703681e-06, + "loss": 1.0812, + "step": 20388 + }, + { + "epoch": 0.61, + "learning_rate": 1.710403722609204e-06, + "loss": 1.0593, + "step": 20389 + }, + { + "epoch": 0.61, + "learning_rate": 1.7101722918646168e-06, + "loss": 1.1075, + "step": 20390 + }, + { + "epoch": 0.61, + "learning_rate": 1.7099408686388083e-06, + "loss": 1.1764, + "step": 20391 + }, + { + "epoch": 0.61, + "learning_rate": 1.7097094529339825e-06, + "loss": 1.1014, + "step": 20392 + }, + { + "epoch": 0.61, + "learning_rate": 1.7094780447523417e-06, + "loss": 1.1923, + "step": 20393 + }, + { + "epoch": 0.61, + "learning_rate": 1.709246644096091e-06, + "loss": 1.1036, + "step": 20394 + }, + { + "epoch": 0.61, + "learning_rate": 1.7090152509674297e-06, + "loss": 1.1027, + "step": 20395 + }, + { + "epoch": 0.61, + "learning_rate": 1.7087838653685623e-06, + "loss": 1.1488, + "step": 20396 + }, + { + "epoch": 0.61, + "learning_rate": 1.7085524873016915e-06, + "loss": 0.981, + "step": 20397 + }, + { + "epoch": 0.61, + "learning_rate": 1.7083211167690201e-06, + "loss": 1.0996, + "step": 20398 + }, + { + "epoch": 0.61, + "learning_rate": 1.708089753772751e-06, + "loss": 1.118, + "step": 20399 + }, + { + "epoch": 0.61, + "learning_rate": 1.7078583983150853e-06, + "loss": 1.3065, + "step": 20400 + }, + { + "epoch": 0.61, + "learning_rate": 1.7076270503982262e-06, + "loss": 1.1934, + "step": 20401 + }, + { + "epoch": 0.61, + "learning_rate": 1.7073957100243758e-06, + "loss": 1.0828, + "step": 20402 + }, + { + "epoch": 0.61, + "learning_rate": 1.7071643771957368e-06, + "loss": 1.0986, + "step": 20403 + }, + { + "epoch": 0.61, + "learning_rate": 1.706933051914511e-06, + "loss": 1.1548, + "step": 20404 + }, + { + "epoch": 0.61, + "learning_rate": 1.7067017341829003e-06, + "loss": 1.1533, + "step": 20405 + }, + { + "epoch": 0.61, + "learning_rate": 1.706470424003107e-06, + "loss": 1.3866, + "step": 20406 + }, + { + "epoch": 0.61, + "learning_rate": 1.7062391213773343e-06, + "loss": 1.0438, + "step": 20407 + }, + { + "epoch": 0.61, + "learning_rate": 1.706007826307782e-06, + "loss": 1.063, + "step": 20408 + }, + { + "epoch": 0.61, + "learning_rate": 1.7057765387966528e-06, + "loss": 1.1021, + "step": 20409 + }, + { + "epoch": 0.61, + "learning_rate": 1.7055452588461479e-06, + "loss": 1.1143, + "step": 20410 + }, + { + "epoch": 0.61, + "learning_rate": 1.7053139864584711e-06, + "loss": 1.0845, + "step": 20411 + }, + { + "epoch": 0.61, + "learning_rate": 1.7050827216358211e-06, + "loss": 1.2781, + "step": 20412 + }, + { + "epoch": 0.61, + "learning_rate": 1.704851464380401e-06, + "loss": 1.0727, + "step": 20413 + }, + { + "epoch": 0.61, + "learning_rate": 1.7046202146944116e-06, + "loss": 1.0361, + "step": 20414 + }, + { + "epoch": 0.62, + "learning_rate": 1.7043889725800549e-06, + "loss": 1.0052, + "step": 20415 + }, + { + "epoch": 0.62, + "learning_rate": 1.7041577380395324e-06, + "loss": 1.0577, + "step": 20416 + }, + { + "epoch": 0.62, + "learning_rate": 1.7039265110750446e-06, + "loss": 1.1254, + "step": 20417 + }, + { + "epoch": 0.62, + "learning_rate": 1.703695291688793e-06, + "loss": 1.0786, + "step": 20418 + }, + { + "epoch": 0.62, + "learning_rate": 1.7034640798829788e-06, + "loss": 1.0232, + "step": 20419 + }, + { + "epoch": 0.62, + "learning_rate": 1.7032328756598037e-06, + "loss": 1.0247, + "step": 20420 + }, + { + "epoch": 0.62, + "learning_rate": 1.703001679021467e-06, + "loss": 1.0344, + "step": 20421 + }, + { + "epoch": 0.62, + "learning_rate": 1.7027704899701706e-06, + "loss": 1.0483, + "step": 20422 + }, + { + "epoch": 0.62, + "learning_rate": 1.7025393085081148e-06, + "loss": 1.1572, + "step": 20423 + }, + { + "epoch": 0.62, + "learning_rate": 1.702308134637502e-06, + "loss": 1.1984, + "step": 20424 + }, + { + "epoch": 0.62, + "learning_rate": 1.7020769683605308e-06, + "loss": 1.1572, + "step": 20425 + }, + { + "epoch": 0.62, + "learning_rate": 1.7018458096794022e-06, + "loss": 1.104, + "step": 20426 + }, + { + "epoch": 0.62, + "learning_rate": 1.7016146585963173e-06, + "loss": 1.1666, + "step": 20427 + }, + { + "epoch": 0.62, + "learning_rate": 1.701383515113476e-06, + "loss": 1.154, + "step": 20428 + }, + { + "epoch": 0.62, + "learning_rate": 1.7011523792330798e-06, + "loss": 1.008, + "step": 20429 + }, + { + "epoch": 0.62, + "learning_rate": 1.7009212509573275e-06, + "loss": 1.1021, + "step": 20430 + }, + { + "epoch": 0.62, + "learning_rate": 1.7006901302884205e-06, + "loss": 1.0676, + "step": 20431 + }, + { + "epoch": 0.62, + "learning_rate": 1.7004590172285578e-06, + "loss": 1.0624, + "step": 20432 + }, + { + "epoch": 0.62, + "learning_rate": 1.700227911779942e-06, + "loss": 1.2388, + "step": 20433 + }, + { + "epoch": 0.62, + "learning_rate": 1.6999968139447698e-06, + "loss": 1.1608, + "step": 20434 + }, + { + "epoch": 0.62, + "learning_rate": 1.6997657237252424e-06, + "loss": 1.1814, + "step": 20435 + }, + { + "epoch": 0.62, + "learning_rate": 1.6995346411235603e-06, + "loss": 1.1113, + "step": 20436 + }, + { + "epoch": 0.62, + "learning_rate": 1.6993035661419238e-06, + "loss": 1.1113, + "step": 20437 + }, + { + "epoch": 0.62, + "learning_rate": 1.6990724987825307e-06, + "loss": 1.1016, + "step": 20438 + }, + { + "epoch": 0.62, + "learning_rate": 1.6988414390475819e-06, + "loss": 1.1586, + "step": 20439 + }, + { + "epoch": 0.62, + "learning_rate": 1.6986103869392764e-06, + "loss": 1.058, + "step": 20440 + }, + { + "epoch": 0.62, + "learning_rate": 1.6983793424598143e-06, + "loss": 1.0963, + "step": 20441 + }, + { + "epoch": 0.62, + "learning_rate": 1.698148305611395e-06, + "loss": 1.1208, + "step": 20442 + }, + { + "epoch": 0.62, + "learning_rate": 1.6979172763962175e-06, + "loss": 1.2195, + "step": 20443 + }, + { + "epoch": 0.62, + "learning_rate": 1.697686254816481e-06, + "loss": 1.1544, + "step": 20444 + }, + { + "epoch": 0.62, + "learning_rate": 1.697455240874385e-06, + "loss": 1.0601, + "step": 20445 + }, + { + "epoch": 0.62, + "learning_rate": 1.6972242345721295e-06, + "loss": 1.1862, + "step": 20446 + }, + { + "epoch": 0.62, + "learning_rate": 1.6969932359119118e-06, + "loss": 1.1526, + "step": 20447 + }, + { + "epoch": 0.62, + "learning_rate": 1.696762244895932e-06, + "loss": 1.1654, + "step": 20448 + }, + { + "epoch": 0.62, + "learning_rate": 1.6965312615263884e-06, + "loss": 1.0229, + "step": 20449 + }, + { + "epoch": 0.62, + "learning_rate": 1.6963002858054812e-06, + "loss": 1.1012, + "step": 20450 + }, + { + "epoch": 0.62, + "learning_rate": 1.6960693177354073e-06, + "loss": 1.1776, + "step": 20451 + }, + { + "epoch": 0.62, + "learning_rate": 1.6958383573183663e-06, + "loss": 1.115, + "step": 20452 + }, + { + "epoch": 0.62, + "learning_rate": 1.6956074045565568e-06, + "loss": 1.161, + "step": 20453 + }, + { + "epoch": 0.62, + "learning_rate": 1.6953764594521777e-06, + "loss": 1.1755, + "step": 20454 + }, + { + "epoch": 0.62, + "learning_rate": 1.6951455220074275e-06, + "loss": 1.1993, + "step": 20455 + }, + { + "epoch": 0.62, + "learning_rate": 1.6949145922245036e-06, + "loss": 1.1143, + "step": 20456 + }, + { + "epoch": 0.62, + "learning_rate": 1.6946836701056058e-06, + "loss": 1.1473, + "step": 20457 + }, + { + "epoch": 0.62, + "learning_rate": 1.6944527556529312e-06, + "loss": 1.1415, + "step": 20458 + }, + { + "epoch": 0.62, + "learning_rate": 1.6942218488686785e-06, + "loss": 1.1984, + "step": 20459 + }, + { + "epoch": 0.62, + "learning_rate": 1.6939909497550455e-06, + "loss": 1.1697, + "step": 20460 + }, + { + "epoch": 0.62, + "learning_rate": 1.6937600583142303e-06, + "loss": 1.1544, + "step": 20461 + }, + { + "epoch": 0.62, + "learning_rate": 1.693529174548431e-06, + "loss": 1.0541, + "step": 20462 + }, + { + "epoch": 0.62, + "learning_rate": 1.6932982984598467e-06, + "loss": 1.1233, + "step": 20463 + }, + { + "epoch": 0.62, + "learning_rate": 1.6930674300506733e-06, + "loss": 1.17, + "step": 20464 + }, + { + "epoch": 0.62, + "learning_rate": 1.692836569323109e-06, + "loss": 1.1216, + "step": 20465 + }, + { + "epoch": 0.62, + "learning_rate": 1.692605716279352e-06, + "loss": 1.1564, + "step": 20466 + }, + { + "epoch": 0.62, + "learning_rate": 1.6923748709215996e-06, + "loss": 1.1007, + "step": 20467 + }, + { + "epoch": 0.62, + "learning_rate": 1.6921440332520506e-06, + "loss": 1.109, + "step": 20468 + }, + { + "epoch": 0.62, + "learning_rate": 1.6919132032729002e-06, + "loss": 1.0897, + "step": 20469 + }, + { + "epoch": 0.62, + "learning_rate": 1.6916823809863469e-06, + "loss": 1.1644, + "step": 20470 + }, + { + "epoch": 0.62, + "learning_rate": 1.691451566394588e-06, + "loss": 1.0249, + "step": 20471 + }, + { + "epoch": 0.62, + "learning_rate": 1.6912207594998215e-06, + "loss": 1.0345, + "step": 20472 + }, + { + "epoch": 0.62, + "learning_rate": 1.6909899603042428e-06, + "loss": 1.1662, + "step": 20473 + }, + { + "epoch": 0.62, + "learning_rate": 1.6907591688100505e-06, + "loss": 1.1042, + "step": 20474 + }, + { + "epoch": 0.62, + "learning_rate": 1.6905283850194414e-06, + "loss": 1.0588, + "step": 20475 + }, + { + "epoch": 0.62, + "learning_rate": 1.690297608934613e-06, + "loss": 1.1536, + "step": 20476 + }, + { + "epoch": 0.62, + "learning_rate": 1.6900668405577603e-06, + "loss": 1.0732, + "step": 20477 + }, + { + "epoch": 0.62, + "learning_rate": 1.6898360798910812e-06, + "loss": 1.0789, + "step": 20478 + }, + { + "epoch": 0.62, + "learning_rate": 1.6896053269367724e-06, + "loss": 1.2347, + "step": 20479 + }, + { + "epoch": 0.62, + "learning_rate": 1.689374581697031e-06, + "loss": 1.2316, + "step": 20480 + }, + { + "epoch": 0.62, + "learning_rate": 1.6891438441740537e-06, + "loss": 1.036, + "step": 20481 + }, + { + "epoch": 0.62, + "learning_rate": 1.6889131143700354e-06, + "loss": 1.1569, + "step": 20482 + }, + { + "epoch": 0.62, + "learning_rate": 1.6886823922871737e-06, + "loss": 1.1392, + "step": 20483 + }, + { + "epoch": 0.62, + "learning_rate": 1.6884516779276651e-06, + "loss": 1.1107, + "step": 20484 + }, + { + "epoch": 0.62, + "learning_rate": 1.688220971293706e-06, + "loss": 1.0583, + "step": 20485 + }, + { + "epoch": 0.62, + "learning_rate": 1.687990272387492e-06, + "loss": 1.1496, + "step": 20486 + }, + { + "epoch": 0.62, + "learning_rate": 1.6877595812112197e-06, + "loss": 1.171, + "step": 20487 + }, + { + "epoch": 0.62, + "learning_rate": 1.6875288977670845e-06, + "loss": 1.2709, + "step": 20488 + }, + { + "epoch": 0.62, + "learning_rate": 1.6872982220572842e-06, + "loss": 1.0862, + "step": 20489 + }, + { + "epoch": 0.62, + "learning_rate": 1.687067554084012e-06, + "loss": 1.0618, + "step": 20490 + }, + { + "epoch": 0.62, + "learning_rate": 1.6868368938494656e-06, + "loss": 1.1508, + "step": 20491 + }, + { + "epoch": 0.62, + "learning_rate": 1.6866062413558404e-06, + "loss": 1.1927, + "step": 20492 + }, + { + "epoch": 0.62, + "learning_rate": 1.6863755966053315e-06, + "loss": 1.1035, + "step": 20493 + }, + { + "epoch": 0.62, + "learning_rate": 1.6861449596001368e-06, + "loss": 1.0994, + "step": 20494 + }, + { + "epoch": 0.62, + "learning_rate": 1.6859143303424486e-06, + "loss": 1.1191, + "step": 20495 + }, + { + "epoch": 0.62, + "learning_rate": 1.685683708834464e-06, + "loss": 1.0157, + "step": 20496 + }, + { + "epoch": 0.62, + "learning_rate": 1.685453095078378e-06, + "loss": 1.1529, + "step": 20497 + }, + { + "epoch": 0.62, + "learning_rate": 1.6852224890763875e-06, + "loss": 1.1559, + "step": 20498 + }, + { + "epoch": 0.62, + "learning_rate": 1.6849918908306856e-06, + "loss": 1.0327, + "step": 20499 + }, + { + "epoch": 0.62, + "learning_rate": 1.6847613003434682e-06, + "loss": 1.0403, + "step": 20500 + }, + { + "epoch": 0.62, + "learning_rate": 1.6845307176169306e-06, + "loss": 1.0503, + "step": 20501 + }, + { + "epoch": 0.62, + "learning_rate": 1.684300142653269e-06, + "loss": 1.0583, + "step": 20502 + }, + { + "epoch": 0.62, + "learning_rate": 1.6840695754546762e-06, + "loss": 1.1115, + "step": 20503 + }, + { + "epoch": 0.62, + "learning_rate": 1.6838390160233482e-06, + "loss": 1.1606, + "step": 20504 + }, + { + "epoch": 0.62, + "learning_rate": 1.6836084643614792e-06, + "loss": 1.0912, + "step": 20505 + }, + { + "epoch": 0.62, + "learning_rate": 1.6833779204712648e-06, + "loss": 1.1819, + "step": 20506 + }, + { + "epoch": 0.62, + "learning_rate": 1.6831473843549004e-06, + "loss": 1.1701, + "step": 20507 + }, + { + "epoch": 0.62, + "learning_rate": 1.682916856014578e-06, + "loss": 1.1086, + "step": 20508 + }, + { + "epoch": 0.62, + "learning_rate": 1.6826863354524942e-06, + "loss": 1.0965, + "step": 20509 + }, + { + "epoch": 0.62, + "learning_rate": 1.6824558226708427e-06, + "loss": 1.1295, + "step": 20510 + }, + { + "epoch": 0.62, + "learning_rate": 1.6822253176718185e-06, + "loss": 1.1428, + "step": 20511 + }, + { + "epoch": 0.62, + "learning_rate": 1.6819948204576148e-06, + "loss": 1.1672, + "step": 20512 + }, + { + "epoch": 0.62, + "learning_rate": 1.6817643310304263e-06, + "loss": 1.2443, + "step": 20513 + }, + { + "epoch": 0.62, + "learning_rate": 1.6815338493924477e-06, + "loss": 1.1054, + "step": 20514 + }, + { + "epoch": 0.62, + "learning_rate": 1.6813033755458733e-06, + "loss": 1.1649, + "step": 20515 + }, + { + "epoch": 0.62, + "learning_rate": 1.6810729094928956e-06, + "loss": 1.0629, + "step": 20516 + }, + { + "epoch": 0.62, + "learning_rate": 1.6808424512357094e-06, + "loss": 1.084, + "step": 20517 + }, + { + "epoch": 0.62, + "learning_rate": 1.6806120007765087e-06, + "loss": 1.0858, + "step": 20518 + }, + { + "epoch": 0.62, + "learning_rate": 1.6803815581174867e-06, + "loss": 1.0759, + "step": 20519 + }, + { + "epoch": 0.62, + "learning_rate": 1.680151123260839e-06, + "loss": 1.1282, + "step": 20520 + }, + { + "epoch": 0.62, + "learning_rate": 1.6799206962087567e-06, + "loss": 1.0757, + "step": 20521 + }, + { + "epoch": 0.62, + "learning_rate": 1.679690276963434e-06, + "loss": 1.1407, + "step": 20522 + }, + { + "epoch": 0.62, + "learning_rate": 1.679459865527065e-06, + "loss": 1.0677, + "step": 20523 + }, + { + "epoch": 0.62, + "learning_rate": 1.6792294619018434e-06, + "loss": 1.2825, + "step": 20524 + }, + { + "epoch": 0.62, + "learning_rate": 1.6789990660899616e-06, + "loss": 1.0065, + "step": 20525 + }, + { + "epoch": 0.62, + "learning_rate": 1.6787686780936132e-06, + "loss": 1.1272, + "step": 20526 + }, + { + "epoch": 0.62, + "learning_rate": 1.6785382979149917e-06, + "loss": 1.1388, + "step": 20527 + }, + { + "epoch": 0.62, + "learning_rate": 1.6783079255562907e-06, + "loss": 1.1566, + "step": 20528 + }, + { + "epoch": 0.62, + "learning_rate": 1.6780775610197017e-06, + "loss": 1.1521, + "step": 20529 + }, + { + "epoch": 0.62, + "learning_rate": 1.6778472043074185e-06, + "loss": 1.1672, + "step": 20530 + }, + { + "epoch": 0.62, + "learning_rate": 1.6776168554216338e-06, + "loss": 1.0753, + "step": 20531 + }, + { + "epoch": 0.62, + "learning_rate": 1.6773865143645403e-06, + "loss": 1.0811, + "step": 20532 + }, + { + "epoch": 0.62, + "learning_rate": 1.6771561811383325e-06, + "loss": 1.0716, + "step": 20533 + }, + { + "epoch": 0.62, + "learning_rate": 1.6769258557452e-06, + "loss": 1.0538, + "step": 20534 + }, + { + "epoch": 0.62, + "learning_rate": 1.6766955381873373e-06, + "loss": 1.1553, + "step": 20535 + }, + { + "epoch": 0.62, + "learning_rate": 1.676465228466937e-06, + "loss": 1.1518, + "step": 20536 + }, + { + "epoch": 0.62, + "learning_rate": 1.676234926586191e-06, + "loss": 1.1971, + "step": 20537 + }, + { + "epoch": 0.62, + "learning_rate": 1.6760046325472913e-06, + "loss": 1.1445, + "step": 20538 + }, + { + "epoch": 0.62, + "learning_rate": 1.6757743463524312e-06, + "loss": 1.1918, + "step": 20539 + }, + { + "epoch": 0.62, + "learning_rate": 1.6755440680038022e-06, + "loss": 1.1251, + "step": 20540 + }, + { + "epoch": 0.62, + "learning_rate": 1.6753137975035965e-06, + "loss": 1.2048, + "step": 20541 + }, + { + "epoch": 0.62, + "learning_rate": 1.6750835348540062e-06, + "loss": 1.098, + "step": 20542 + }, + { + "epoch": 0.62, + "learning_rate": 1.6748532800572232e-06, + "loss": 1.2518, + "step": 20543 + }, + { + "epoch": 0.62, + "learning_rate": 1.6746230331154394e-06, + "loss": 1.3361, + "step": 20544 + }, + { + "epoch": 0.62, + "learning_rate": 1.6743927940308474e-06, + "loss": 1.1293, + "step": 20545 + }, + { + "epoch": 0.62, + "learning_rate": 1.674162562805639e-06, + "loss": 1.0649, + "step": 20546 + }, + { + "epoch": 0.62, + "learning_rate": 1.6739323394420043e-06, + "loss": 1.146, + "step": 20547 + }, + { + "epoch": 0.62, + "learning_rate": 1.6737021239421358e-06, + "loss": 1.2328, + "step": 20548 + }, + { + "epoch": 0.62, + "learning_rate": 1.673471916308225e-06, + "loss": 1.105, + "step": 20549 + }, + { + "epoch": 0.62, + "learning_rate": 1.6732417165424647e-06, + "loss": 1.1097, + "step": 20550 + }, + { + "epoch": 0.62, + "learning_rate": 1.673011524647044e-06, + "loss": 1.0689, + "step": 20551 + }, + { + "epoch": 0.62, + "learning_rate": 1.6727813406241553e-06, + "loss": 1.0952, + "step": 20552 + }, + { + "epoch": 0.62, + "learning_rate": 1.6725511644759897e-06, + "loss": 1.0759, + "step": 20553 + }, + { + "epoch": 0.62, + "learning_rate": 1.6723209962047393e-06, + "loss": 1.0579, + "step": 20554 + }, + { + "epoch": 0.62, + "learning_rate": 1.6720908358125936e-06, + "loss": 1.1349, + "step": 20555 + }, + { + "epoch": 0.62, + "learning_rate": 1.6718606833017447e-06, + "loss": 1.0997, + "step": 20556 + }, + { + "epoch": 0.62, + "learning_rate": 1.6716305386743831e-06, + "loss": 1.1769, + "step": 20557 + }, + { + "epoch": 0.62, + "learning_rate": 1.6714004019326998e-06, + "loss": 1.2271, + "step": 20558 + }, + { + "epoch": 0.62, + "learning_rate": 1.6711702730788868e-06, + "loss": 1.1113, + "step": 20559 + }, + { + "epoch": 0.62, + "learning_rate": 1.6709401521151325e-06, + "loss": 1.0232, + "step": 20560 + }, + { + "epoch": 0.62, + "learning_rate": 1.6707100390436284e-06, + "loss": 1.0388, + "step": 20561 + }, + { + "epoch": 0.62, + "learning_rate": 1.6704799338665656e-06, + "loss": 1.2393, + "step": 20562 + }, + { + "epoch": 0.62, + "learning_rate": 1.6702498365861352e-06, + "loss": 1.0532, + "step": 20563 + }, + { + "epoch": 0.62, + "learning_rate": 1.670019747204526e-06, + "loss": 1.0727, + "step": 20564 + }, + { + "epoch": 0.62, + "learning_rate": 1.6697896657239288e-06, + "loss": 1.1329, + "step": 20565 + }, + { + "epoch": 0.62, + "learning_rate": 1.669559592146534e-06, + "loss": 1.0591, + "step": 20566 + }, + { + "epoch": 0.62, + "learning_rate": 1.6693295264745329e-06, + "loss": 1.1382, + "step": 20567 + }, + { + "epoch": 0.62, + "learning_rate": 1.6690994687101137e-06, + "loss": 1.1035, + "step": 20568 + }, + { + "epoch": 0.62, + "learning_rate": 1.6688694188554677e-06, + "loss": 1.0614, + "step": 20569 + }, + { + "epoch": 0.62, + "learning_rate": 1.6686393769127842e-06, + "loss": 1.0829, + "step": 20570 + }, + { + "epoch": 0.62, + "learning_rate": 1.6684093428842537e-06, + "loss": 1.1363, + "step": 20571 + }, + { + "epoch": 0.62, + "learning_rate": 1.6681793167720666e-06, + "loss": 1.1783, + "step": 20572 + }, + { + "epoch": 0.62, + "learning_rate": 1.667949298578411e-06, + "loss": 1.1328, + "step": 20573 + }, + { + "epoch": 0.62, + "learning_rate": 1.6677192883054772e-06, + "loss": 1.174, + "step": 20574 + }, + { + "epoch": 0.62, + "learning_rate": 1.667489285955455e-06, + "loss": 1.1145, + "step": 20575 + }, + { + "epoch": 0.62, + "learning_rate": 1.6672592915305346e-06, + "loss": 1.1407, + "step": 20576 + }, + { + "epoch": 0.62, + "learning_rate": 1.667029305032904e-06, + "loss": 1.0022, + "step": 20577 + }, + { + "epoch": 0.62, + "learning_rate": 1.666799326464753e-06, + "loss": 1.0821, + "step": 20578 + }, + { + "epoch": 0.62, + "learning_rate": 1.6665693558282713e-06, + "loss": 1.0085, + "step": 20579 + }, + { + "epoch": 0.62, + "learning_rate": 1.6663393931256485e-06, + "loss": 1.1294, + "step": 20580 + }, + { + "epoch": 0.62, + "learning_rate": 1.6661094383590725e-06, + "loss": 1.3506, + "step": 20581 + }, + { + "epoch": 0.62, + "learning_rate": 1.6658794915307333e-06, + "loss": 1.0543, + "step": 20582 + }, + { + "epoch": 0.62, + "learning_rate": 1.6656495526428196e-06, + "loss": 1.1542, + "step": 20583 + }, + { + "epoch": 0.62, + "learning_rate": 1.6654196216975199e-06, + "loss": 1.1168, + "step": 20584 + }, + { + "epoch": 0.62, + "learning_rate": 1.6651896986970247e-06, + "loss": 1.0868, + "step": 20585 + }, + { + "epoch": 0.62, + "learning_rate": 1.6649597836435204e-06, + "loss": 1.1641, + "step": 20586 + }, + { + "epoch": 0.62, + "learning_rate": 1.664729876539197e-06, + "loss": 1.1887, + "step": 20587 + }, + { + "epoch": 0.62, + "learning_rate": 1.6644999773862427e-06, + "loss": 1.1566, + "step": 20588 + }, + { + "epoch": 0.62, + "learning_rate": 1.6642700861868474e-06, + "loss": 1.1129, + "step": 20589 + }, + { + "epoch": 0.62, + "learning_rate": 1.6640402029431972e-06, + "loss": 1.1251, + "step": 20590 + }, + { + "epoch": 0.62, + "learning_rate": 1.663810327657482e-06, + "loss": 1.2083, + "step": 20591 + }, + { + "epoch": 0.62, + "learning_rate": 1.6635804603318894e-06, + "loss": 1.1613, + "step": 20592 + }, + { + "epoch": 0.62, + "learning_rate": 1.6633506009686084e-06, + "loss": 1.2306, + "step": 20593 + }, + { + "epoch": 0.62, + "learning_rate": 1.6631207495698266e-06, + "loss": 1.2046, + "step": 20594 + }, + { + "epoch": 0.62, + "learning_rate": 1.6628909061377318e-06, + "loss": 1.0706, + "step": 20595 + }, + { + "epoch": 0.62, + "learning_rate": 1.6626610706745127e-06, + "loss": 1.153, + "step": 20596 + }, + { + "epoch": 0.62, + "learning_rate": 1.662431243182358e-06, + "loss": 1.1036, + "step": 20597 + }, + { + "epoch": 0.62, + "learning_rate": 1.6622014236634535e-06, + "loss": 1.1254, + "step": 20598 + }, + { + "epoch": 0.62, + "learning_rate": 1.6619716121199878e-06, + "loss": 1.0309, + "step": 20599 + }, + { + "epoch": 0.62, + "learning_rate": 1.6617418085541486e-06, + "loss": 1.2561, + "step": 20600 + }, + { + "epoch": 0.62, + "learning_rate": 1.661512012968124e-06, + "loss": 1.1832, + "step": 20601 + }, + { + "epoch": 0.62, + "learning_rate": 1.661282225364102e-06, + "loss": 1.1546, + "step": 20602 + }, + { + "epoch": 0.62, + "learning_rate": 1.6610524457442684e-06, + "loss": 1.1491, + "step": 20603 + }, + { + "epoch": 0.62, + "learning_rate": 1.6608226741108113e-06, + "loss": 1.1546, + "step": 20604 + }, + { + "epoch": 0.62, + "learning_rate": 1.660592910465918e-06, + "loss": 1.1765, + "step": 20605 + }, + { + "epoch": 0.62, + "learning_rate": 1.6603631548117767e-06, + "loss": 1.321, + "step": 20606 + }, + { + "epoch": 0.62, + "learning_rate": 1.6601334071505732e-06, + "loss": 1.0618, + "step": 20607 + }, + { + "epoch": 0.62, + "learning_rate": 1.6599036674844955e-06, + "loss": 1.0745, + "step": 20608 + }, + { + "epoch": 0.62, + "learning_rate": 1.65967393581573e-06, + "loss": 1.0245, + "step": 20609 + }, + { + "epoch": 0.62, + "learning_rate": 1.659444212146465e-06, + "loss": 1.1068, + "step": 20610 + }, + { + "epoch": 0.62, + "learning_rate": 1.6592144964788847e-06, + "loss": 1.2224, + "step": 20611 + }, + { + "epoch": 0.62, + "learning_rate": 1.6589847888151784e-06, + "loss": 1.0288, + "step": 20612 + }, + { + "epoch": 0.62, + "learning_rate": 1.6587550891575311e-06, + "loss": 1.0158, + "step": 20613 + }, + { + "epoch": 0.62, + "learning_rate": 1.6585253975081306e-06, + "loss": 1.1963, + "step": 20614 + }, + { + "epoch": 0.62, + "learning_rate": 1.6582957138691639e-06, + "loss": 1.0624, + "step": 20615 + }, + { + "epoch": 0.62, + "learning_rate": 1.6580660382428157e-06, + "loss": 1.1561, + "step": 20616 + }, + { + "epoch": 0.62, + "learning_rate": 1.6578363706312734e-06, + "loss": 1.0811, + "step": 20617 + }, + { + "epoch": 0.62, + "learning_rate": 1.657606711036723e-06, + "loss": 1.2802, + "step": 20618 + }, + { + "epoch": 0.62, + "learning_rate": 1.6573770594613516e-06, + "loss": 1.0156, + "step": 20619 + }, + { + "epoch": 0.62, + "learning_rate": 1.6571474159073442e-06, + "loss": 1.1706, + "step": 20620 + }, + { + "epoch": 0.62, + "learning_rate": 1.6569177803768876e-06, + "loss": 1.1688, + "step": 20621 + }, + { + "epoch": 0.62, + "learning_rate": 1.6566881528721684e-06, + "loss": 1.1142, + "step": 20622 + }, + { + "epoch": 0.62, + "learning_rate": 1.6564585333953714e-06, + "loss": 1.0935, + "step": 20623 + }, + { + "epoch": 0.62, + "learning_rate": 1.6562289219486827e-06, + "loss": 1.1658, + "step": 20624 + }, + { + "epoch": 0.62, + "learning_rate": 1.6559993185342882e-06, + "loss": 1.267, + "step": 20625 + }, + { + "epoch": 0.62, + "learning_rate": 1.6557697231543737e-06, + "loss": 1.1319, + "step": 20626 + }, + { + "epoch": 0.62, + "learning_rate": 1.655540135811125e-06, + "loss": 1.0227, + "step": 20627 + }, + { + "epoch": 0.62, + "learning_rate": 1.6553105565067284e-06, + "loss": 1.058, + "step": 20628 + }, + { + "epoch": 0.62, + "learning_rate": 1.6550809852433674e-06, + "loss": 1.1074, + "step": 20629 + }, + { + "epoch": 0.62, + "learning_rate": 1.6548514220232284e-06, + "loss": 1.2101, + "step": 20630 + }, + { + "epoch": 0.62, + "learning_rate": 1.654621866848497e-06, + "loss": 1.2293, + "step": 20631 + }, + { + "epoch": 0.62, + "learning_rate": 1.6543923197213584e-06, + "loss": 1.1075, + "step": 20632 + }, + { + "epoch": 0.62, + "learning_rate": 1.6541627806439984e-06, + "loss": 1.1876, + "step": 20633 + }, + { + "epoch": 0.62, + "learning_rate": 1.6539332496186002e-06, + "loss": 1.2081, + "step": 20634 + }, + { + "epoch": 0.62, + "learning_rate": 1.6537037266473505e-06, + "loss": 1.1216, + "step": 20635 + }, + { + "epoch": 0.62, + "learning_rate": 1.6534742117324337e-06, + "loss": 1.2676, + "step": 20636 + }, + { + "epoch": 0.62, + "learning_rate": 1.6532447048760348e-06, + "loss": 1.0696, + "step": 20637 + }, + { + "epoch": 0.62, + "learning_rate": 1.6530152060803379e-06, + "loss": 1.1919, + "step": 20638 + }, + { + "epoch": 0.62, + "learning_rate": 1.6527857153475286e-06, + "loss": 1.1508, + "step": 20639 + }, + { + "epoch": 0.62, + "learning_rate": 1.652556232679791e-06, + "loss": 1.2732, + "step": 20640 + }, + { + "epoch": 0.62, + "learning_rate": 1.6523267580793112e-06, + "loss": 1.0785, + "step": 20641 + }, + { + "epoch": 0.62, + "learning_rate": 1.6520972915482713e-06, + "loss": 1.135, + "step": 20642 + }, + { + "epoch": 0.62, + "learning_rate": 1.651867833088857e-06, + "loss": 1.1226, + "step": 20643 + }, + { + "epoch": 0.62, + "learning_rate": 1.6516383827032524e-06, + "loss": 1.0162, + "step": 20644 + }, + { + "epoch": 0.62, + "learning_rate": 1.651408940393643e-06, + "loss": 1.031, + "step": 20645 + }, + { + "epoch": 0.62, + "learning_rate": 1.6511795061622104e-06, + "loss": 1.0283, + "step": 20646 + }, + { + "epoch": 0.62, + "learning_rate": 1.6509500800111403e-06, + "loss": 1.1321, + "step": 20647 + }, + { + "epoch": 0.62, + "learning_rate": 1.6507206619426164e-06, + "loss": 1.0995, + "step": 20648 + }, + { + "epoch": 0.62, + "learning_rate": 1.6504912519588233e-06, + "loss": 1.1398, + "step": 20649 + }, + { + "epoch": 0.62, + "learning_rate": 1.650261850061944e-06, + "loss": 1.0372, + "step": 20650 + }, + { + "epoch": 0.62, + "learning_rate": 1.6500324562541625e-06, + "loss": 1.1115, + "step": 20651 + }, + { + "epoch": 0.62, + "learning_rate": 1.6498030705376628e-06, + "loss": 1.1276, + "step": 20652 + }, + { + "epoch": 0.62, + "learning_rate": 1.649573692914628e-06, + "loss": 1.0811, + "step": 20653 + }, + { + "epoch": 0.62, + "learning_rate": 1.6493443233872435e-06, + "loss": 1.2594, + "step": 20654 + }, + { + "epoch": 0.62, + "learning_rate": 1.6491149619576901e-06, + "loss": 1.1448, + "step": 20655 + }, + { + "epoch": 0.62, + "learning_rate": 1.6488856086281523e-06, + "loss": 1.1625, + "step": 20656 + }, + { + "epoch": 0.62, + "learning_rate": 1.6486562634008141e-06, + "loss": 1.0806, + "step": 20657 + }, + { + "epoch": 0.62, + "learning_rate": 1.648426926277859e-06, + "loss": 1.085, + "step": 20658 + }, + { + "epoch": 0.62, + "learning_rate": 1.6481975972614683e-06, + "loss": 1.1081, + "step": 20659 + }, + { + "epoch": 0.62, + "learning_rate": 1.6479682763538263e-06, + "loss": 1.1102, + "step": 20660 + }, + { + "epoch": 0.62, + "learning_rate": 1.6477389635571161e-06, + "loss": 1.2875, + "step": 20661 + }, + { + "epoch": 0.62, + "learning_rate": 1.6475096588735211e-06, + "loss": 1.0178, + "step": 20662 + }, + { + "epoch": 0.62, + "learning_rate": 1.6472803623052228e-06, + "loss": 1.135, + "step": 20663 + }, + { + "epoch": 0.62, + "learning_rate": 1.6470510738544048e-06, + "loss": 1.0337, + "step": 20664 + }, + { + "epoch": 0.62, + "learning_rate": 1.64682179352325e-06, + "loss": 1.1421, + "step": 20665 + }, + { + "epoch": 0.62, + "learning_rate": 1.6465925213139406e-06, + "loss": 1.1156, + "step": 20666 + }, + { + "epoch": 0.62, + "learning_rate": 1.6463632572286604e-06, + "loss": 1.029, + "step": 20667 + }, + { + "epoch": 0.62, + "learning_rate": 1.6461340012695898e-06, + "loss": 1.1249, + "step": 20668 + }, + { + "epoch": 0.62, + "learning_rate": 1.6459047534389125e-06, + "loss": 1.0874, + "step": 20669 + }, + { + "epoch": 0.62, + "learning_rate": 1.6456755137388105e-06, + "loss": 1.2084, + "step": 20670 + }, + { + "epoch": 0.62, + "learning_rate": 1.6454462821714673e-06, + "loss": 1.0551, + "step": 20671 + }, + { + "epoch": 0.62, + "learning_rate": 1.6452170587390625e-06, + "loss": 1.009, + "step": 20672 + }, + { + "epoch": 0.62, + "learning_rate": 1.64498784344378e-06, + "loss": 1.1467, + "step": 20673 + }, + { + "epoch": 0.62, + "learning_rate": 1.6447586362878015e-06, + "loss": 1.2963, + "step": 20674 + }, + { + "epoch": 0.62, + "learning_rate": 1.644529437273309e-06, + "loss": 1.0593, + "step": 20675 + }, + { + "epoch": 0.62, + "learning_rate": 1.6443002464024841e-06, + "loss": 1.0727, + "step": 20676 + }, + { + "epoch": 0.62, + "learning_rate": 1.6440710636775086e-06, + "loss": 1.0885, + "step": 20677 + }, + { + "epoch": 0.62, + "learning_rate": 1.6438418891005643e-06, + "loss": 1.0236, + "step": 20678 + }, + { + "epoch": 0.62, + "learning_rate": 1.643612722673833e-06, + "loss": 1.1366, + "step": 20679 + }, + { + "epoch": 0.62, + "learning_rate": 1.6433835643994968e-06, + "loss": 1.0717, + "step": 20680 + }, + { + "epoch": 0.62, + "learning_rate": 1.643154414279736e-06, + "loss": 1.1678, + "step": 20681 + }, + { + "epoch": 0.62, + "learning_rate": 1.6429252723167323e-06, + "loss": 1.0205, + "step": 20682 + }, + { + "epoch": 0.62, + "learning_rate": 1.6426961385126673e-06, + "loss": 1.2291, + "step": 20683 + }, + { + "epoch": 0.62, + "learning_rate": 1.642467012869723e-06, + "loss": 1.0876, + "step": 20684 + }, + { + "epoch": 0.62, + "learning_rate": 1.6422378953900786e-06, + "loss": 1.0847, + "step": 20685 + }, + { + "epoch": 0.62, + "learning_rate": 1.6420087860759166e-06, + "loss": 1.0652, + "step": 20686 + }, + { + "epoch": 0.62, + "learning_rate": 1.6417796849294176e-06, + "loss": 1.2084, + "step": 20687 + }, + { + "epoch": 0.62, + "learning_rate": 1.641550591952763e-06, + "loss": 1.0186, + "step": 20688 + }, + { + "epoch": 0.62, + "learning_rate": 1.6413215071481332e-06, + "loss": 1.1705, + "step": 20689 + }, + { + "epoch": 0.62, + "learning_rate": 1.641092430517709e-06, + "loss": 1.1496, + "step": 20690 + }, + { + "epoch": 0.62, + "learning_rate": 1.640863362063671e-06, + "loss": 1.119, + "step": 20691 + }, + { + "epoch": 0.62, + "learning_rate": 1.6406343017882004e-06, + "loss": 1.0247, + "step": 20692 + }, + { + "epoch": 0.62, + "learning_rate": 1.640405249693478e-06, + "loss": 1.2053, + "step": 20693 + }, + { + "epoch": 0.62, + "learning_rate": 1.6401762057816828e-06, + "loss": 1.021, + "step": 20694 + }, + { + "epoch": 0.62, + "learning_rate": 1.6399471700549957e-06, + "loss": 1.0746, + "step": 20695 + }, + { + "epoch": 0.62, + "learning_rate": 1.6397181425155977e-06, + "loss": 1.1463, + "step": 20696 + }, + { + "epoch": 0.62, + "learning_rate": 1.6394891231656694e-06, + "loss": 1.0364, + "step": 20697 + }, + { + "epoch": 0.62, + "learning_rate": 1.6392601120073896e-06, + "loss": 1.1656, + "step": 20698 + }, + { + "epoch": 0.62, + "learning_rate": 1.6390311090429386e-06, + "loss": 1.2449, + "step": 20699 + }, + { + "epoch": 0.62, + "learning_rate": 1.638802114274497e-06, + "loss": 1.0572, + "step": 20700 + }, + { + "epoch": 0.62, + "learning_rate": 1.638573127704245e-06, + "loss": 1.1092, + "step": 20701 + }, + { + "epoch": 0.62, + "learning_rate": 1.6383441493343614e-06, + "loss": 1.1133, + "step": 20702 + }, + { + "epoch": 0.62, + "learning_rate": 1.6381151791670264e-06, + "loss": 1.1445, + "step": 20703 + }, + { + "epoch": 0.62, + "learning_rate": 1.6378862172044203e-06, + "loss": 1.1227, + "step": 20704 + }, + { + "epoch": 0.62, + "learning_rate": 1.637657263448722e-06, + "loss": 1.095, + "step": 20705 + }, + { + "epoch": 0.62, + "learning_rate": 1.6374283179021114e-06, + "loss": 1.1878, + "step": 20706 + }, + { + "epoch": 0.62, + "learning_rate": 1.6371993805667674e-06, + "loss": 1.1207, + "step": 20707 + }, + { + "epoch": 0.62, + "learning_rate": 1.6369704514448698e-06, + "loss": 0.9993, + "step": 20708 + }, + { + "epoch": 0.62, + "learning_rate": 1.6367415305385976e-06, + "loss": 1.199, + "step": 20709 + }, + { + "epoch": 0.62, + "learning_rate": 1.6365126178501317e-06, + "loss": 1.1639, + "step": 20710 + }, + { + "epoch": 0.62, + "learning_rate": 1.6362837133816483e-06, + "loss": 1.133, + "step": 20711 + }, + { + "epoch": 0.62, + "learning_rate": 1.6360548171353285e-06, + "loss": 1.0903, + "step": 20712 + }, + { + "epoch": 0.62, + "learning_rate": 1.6358259291133504e-06, + "loss": 1.0027, + "step": 20713 + }, + { + "epoch": 0.62, + "learning_rate": 1.635597049317894e-06, + "loss": 1.0969, + "step": 20714 + }, + { + "epoch": 0.62, + "learning_rate": 1.635368177751137e-06, + "loss": 0.9799, + "step": 20715 + }, + { + "epoch": 0.62, + "learning_rate": 1.6351393144152582e-06, + "loss": 1.109, + "step": 20716 + }, + { + "epoch": 0.62, + "learning_rate": 1.6349104593124371e-06, + "loss": 1.1699, + "step": 20717 + }, + { + "epoch": 0.62, + "learning_rate": 1.6346816124448511e-06, + "loss": 1.0736, + "step": 20718 + }, + { + "epoch": 0.62, + "learning_rate": 1.6344527738146804e-06, + "loss": 1.1418, + "step": 20719 + }, + { + "epoch": 0.62, + "learning_rate": 1.6342239434241014e-06, + "loss": 1.1236, + "step": 20720 + }, + { + "epoch": 0.62, + "learning_rate": 1.6339951212752939e-06, + "loss": 1.1028, + "step": 20721 + }, + { + "epoch": 0.62, + "learning_rate": 1.6337663073704357e-06, + "loss": 1.0975, + "step": 20722 + }, + { + "epoch": 0.62, + "learning_rate": 1.6335375017117062e-06, + "loss": 1.0668, + "step": 20723 + }, + { + "epoch": 0.62, + "learning_rate": 1.6333087043012808e-06, + "loss": 1.0222, + "step": 20724 + }, + { + "epoch": 0.62, + "learning_rate": 1.6330799151413395e-06, + "loss": 1.3018, + "step": 20725 + }, + { + "epoch": 0.62, + "learning_rate": 1.63285113423406e-06, + "loss": 1.0915, + "step": 20726 + }, + { + "epoch": 0.62, + "learning_rate": 1.632622361581621e-06, + "loss": 1.027, + "step": 20727 + }, + { + "epoch": 0.62, + "learning_rate": 1.6323935971861982e-06, + "loss": 1.0916, + "step": 20728 + }, + { + "epoch": 0.62, + "learning_rate": 1.6321648410499708e-06, + "loss": 1.1973, + "step": 20729 + }, + { + "epoch": 0.62, + "learning_rate": 1.631936093175116e-06, + "loss": 1.2028, + "step": 20730 + }, + { + "epoch": 0.62, + "learning_rate": 1.6317073535638113e-06, + "loss": 1.0401, + "step": 20731 + }, + { + "epoch": 0.62, + "learning_rate": 1.631478622218235e-06, + "loss": 1.0579, + "step": 20732 + }, + { + "epoch": 0.62, + "learning_rate": 1.6312498991405636e-06, + "loss": 1.1409, + "step": 20733 + }, + { + "epoch": 0.62, + "learning_rate": 1.631021184332975e-06, + "loss": 1.0306, + "step": 20734 + }, + { + "epoch": 0.62, + "learning_rate": 1.6307924777976455e-06, + "loss": 1.1142, + "step": 20735 + }, + { + "epoch": 0.62, + "learning_rate": 1.6305637795367545e-06, + "loss": 1.0988, + "step": 20736 + }, + { + "epoch": 0.62, + "learning_rate": 1.6303350895524766e-06, + "loss": 1.1965, + "step": 20737 + }, + { + "epoch": 0.62, + "learning_rate": 1.6301064078469897e-06, + "loss": 1.0605, + "step": 20738 + }, + { + "epoch": 0.62, + "learning_rate": 1.6298777344224706e-06, + "loss": 1.1545, + "step": 20739 + }, + { + "epoch": 0.62, + "learning_rate": 1.6296490692810979e-06, + "loss": 1.0445, + "step": 20740 + }, + { + "epoch": 0.62, + "learning_rate": 1.6294204124250453e-06, + "loss": 1.1274, + "step": 20741 + }, + { + "epoch": 0.62, + "learning_rate": 1.6291917638564914e-06, + "loss": 1.1202, + "step": 20742 + }, + { + "epoch": 0.62, + "learning_rate": 1.6289631235776127e-06, + "loss": 1.1221, + "step": 20743 + }, + { + "epoch": 0.62, + "learning_rate": 1.628734491590585e-06, + "loss": 1.2371, + "step": 20744 + }, + { + "epoch": 0.62, + "learning_rate": 1.6285058678975862e-06, + "loss": 1.0919, + "step": 20745 + }, + { + "epoch": 0.62, + "learning_rate": 1.6282772525007915e-06, + "loss": 1.2288, + "step": 20746 + }, + { + "epoch": 0.63, + "learning_rate": 1.6280486454023772e-06, + "loss": 1.1461, + "step": 20747 + }, + { + "epoch": 0.63, + "learning_rate": 1.6278200466045202e-06, + "loss": 1.1207, + "step": 20748 + }, + { + "epoch": 0.63, + "learning_rate": 1.6275914561093969e-06, + "loss": 1.0553, + "step": 20749 + }, + { + "epoch": 0.63, + "learning_rate": 1.6273628739191821e-06, + "loss": 0.9282, + "step": 20750 + }, + { + "epoch": 0.63, + "learning_rate": 1.6271343000360522e-06, + "loss": 1.1493, + "step": 20751 + }, + { + "epoch": 0.63, + "learning_rate": 1.6269057344621836e-06, + "loss": 1.1035, + "step": 20752 + }, + { + "epoch": 0.63, + "learning_rate": 1.6266771771997525e-06, + "loss": 1.1111, + "step": 20753 + }, + { + "epoch": 0.63, + "learning_rate": 1.6264486282509335e-06, + "loss": 1.0629, + "step": 20754 + }, + { + "epoch": 0.63, + "learning_rate": 1.6262200876179026e-06, + "loss": 1.1324, + "step": 20755 + }, + { + "epoch": 0.63, + "learning_rate": 1.6259915553028358e-06, + "loss": 1.2769, + "step": 20756 + }, + { + "epoch": 0.63, + "learning_rate": 1.6257630313079083e-06, + "loss": 1.1312, + "step": 20757 + }, + { + "epoch": 0.63, + "learning_rate": 1.6255345156352964e-06, + "loss": 1.1519, + "step": 20758 + }, + { + "epoch": 0.63, + "learning_rate": 1.6253060082871741e-06, + "loss": 0.9642, + "step": 20759 + }, + { + "epoch": 0.63, + "learning_rate": 1.6250775092657174e-06, + "loss": 1.0139, + "step": 20760 + }, + { + "epoch": 0.63, + "learning_rate": 1.6248490185731015e-06, + "loss": 1.1042, + "step": 20761 + }, + { + "epoch": 0.63, + "learning_rate": 1.6246205362115023e-06, + "loss": 1.1234, + "step": 20762 + }, + { + "epoch": 0.63, + "learning_rate": 1.624392062183093e-06, + "loss": 1.0893, + "step": 20763 + }, + { + "epoch": 0.63, + "learning_rate": 1.6241635964900496e-06, + "loss": 1.1453, + "step": 20764 + }, + { + "epoch": 0.63, + "learning_rate": 1.623935139134547e-06, + "loss": 1.0034, + "step": 20765 + }, + { + "epoch": 0.63, + "learning_rate": 1.623706690118761e-06, + "loss": 1.0804, + "step": 20766 + }, + { + "epoch": 0.63, + "learning_rate": 1.6234782494448642e-06, + "loss": 1.1604, + "step": 20767 + }, + { + "epoch": 0.63, + "learning_rate": 1.6232498171150323e-06, + "loss": 1.1227, + "step": 20768 + }, + { + "epoch": 0.63, + "learning_rate": 1.6230213931314398e-06, + "loss": 1.0143, + "step": 20769 + }, + { + "epoch": 0.63, + "learning_rate": 1.6227929774962613e-06, + "loss": 0.9989, + "step": 20770 + }, + { + "epoch": 0.63, + "learning_rate": 1.6225645702116716e-06, + "loss": 1.1246, + "step": 20771 + }, + { + "epoch": 0.63, + "learning_rate": 1.6223361712798444e-06, + "loss": 1.1011, + "step": 20772 + }, + { + "epoch": 0.63, + "learning_rate": 1.6221077807029539e-06, + "loss": 1.185, + "step": 20773 + }, + { + "epoch": 0.63, + "learning_rate": 1.6218793984831748e-06, + "loss": 1.1401, + "step": 20774 + }, + { + "epoch": 0.63, + "learning_rate": 1.6216510246226815e-06, + "loss": 1.155, + "step": 20775 + }, + { + "epoch": 0.63, + "learning_rate": 1.6214226591236467e-06, + "loss": 1.0698, + "step": 20776 + }, + { + "epoch": 0.63, + "learning_rate": 1.621194301988245e-06, + "loss": 1.0639, + "step": 20777 + }, + { + "epoch": 0.63, + "learning_rate": 1.6209659532186502e-06, + "loss": 1.1216, + "step": 20778 + }, + { + "epoch": 0.63, + "learning_rate": 1.6207376128170375e-06, + "loss": 1.1492, + "step": 20779 + }, + { + "epoch": 0.63, + "learning_rate": 1.620509280785578e-06, + "loss": 1.1499, + "step": 20780 + }, + { + "epoch": 0.63, + "learning_rate": 1.6202809571264466e-06, + "loss": 1.2648, + "step": 20781 + }, + { + "epoch": 0.63, + "learning_rate": 1.6200526418418167e-06, + "loss": 1.0879, + "step": 20782 + }, + { + "epoch": 0.63, + "learning_rate": 1.6198243349338624e-06, + "loss": 1.0479, + "step": 20783 + }, + { + "epoch": 0.63, + "learning_rate": 1.6195960364047561e-06, + "loss": 1.0274, + "step": 20784 + }, + { + "epoch": 0.63, + "learning_rate": 1.6193677462566715e-06, + "loss": 1.1365, + "step": 20785 + }, + { + "epoch": 0.63, + "learning_rate": 1.6191394644917823e-06, + "loss": 1.0763, + "step": 20786 + }, + { + "epoch": 0.63, + "learning_rate": 1.6189111911122608e-06, + "loss": 1.1938, + "step": 20787 + }, + { + "epoch": 0.63, + "learning_rate": 1.6186829261202808e-06, + "loss": 1.0224, + "step": 20788 + }, + { + "epoch": 0.63, + "learning_rate": 1.6184546695180143e-06, + "loss": 1.1277, + "step": 20789 + }, + { + "epoch": 0.63, + "learning_rate": 1.6182264213076348e-06, + "loss": 1.1766, + "step": 20790 + }, + { + "epoch": 0.63, + "learning_rate": 1.6179981814913148e-06, + "loss": 1.0624, + "step": 20791 + }, + { + "epoch": 0.63, + "learning_rate": 1.6177699500712292e-06, + "loss": 1.1085, + "step": 20792 + }, + { + "epoch": 0.63, + "learning_rate": 1.617541727049547e-06, + "loss": 0.9952, + "step": 20793 + }, + { + "epoch": 0.63, + "learning_rate": 1.6173135124284429e-06, + "loss": 1.2997, + "step": 20794 + }, + { + "epoch": 0.63, + "learning_rate": 1.617085306210089e-06, + "loss": 1.1051, + "step": 20795 + }, + { + "epoch": 0.63, + "learning_rate": 1.6168571083966577e-06, + "loss": 1.0735, + "step": 20796 + }, + { + "epoch": 0.63, + "learning_rate": 1.6166289189903223e-06, + "loss": 1.1087, + "step": 20797 + }, + { + "epoch": 0.63, + "learning_rate": 1.616400737993253e-06, + "loss": 1.1505, + "step": 20798 + }, + { + "epoch": 0.63, + "learning_rate": 1.6161725654076236e-06, + "loss": 1.2211, + "step": 20799 + }, + { + "epoch": 0.63, + "learning_rate": 1.615944401235605e-06, + "loss": 1.186, + "step": 20800 + }, + { + "epoch": 0.63, + "learning_rate": 1.6157162454793713e-06, + "loss": 1.1853, + "step": 20801 + }, + { + "epoch": 0.63, + "learning_rate": 1.615488098141092e-06, + "loss": 1.1893, + "step": 20802 + }, + { + "epoch": 0.63, + "learning_rate": 1.61525995922294e-06, + "loss": 1.0496, + "step": 20803 + }, + { + "epoch": 0.63, + "learning_rate": 1.6150318287270874e-06, + "loss": 1.1453, + "step": 20804 + }, + { + "epoch": 0.63, + "learning_rate": 1.6148037066557065e-06, + "loss": 1.2557, + "step": 20805 + }, + { + "epoch": 0.63, + "learning_rate": 1.6145755930109668e-06, + "loss": 1.1957, + "step": 20806 + }, + { + "epoch": 0.63, + "learning_rate": 1.614347487795041e-06, + "loss": 1.0755, + "step": 20807 + }, + { + "epoch": 0.63, + "learning_rate": 1.6141193910101007e-06, + "loss": 1.0626, + "step": 20808 + }, + { + "epoch": 0.63, + "learning_rate": 1.6138913026583184e-06, + "loss": 1.0321, + "step": 20809 + }, + { + "epoch": 0.63, + "learning_rate": 1.6136632227418627e-06, + "loss": 1.0884, + "step": 20810 + }, + { + "epoch": 0.63, + "learning_rate": 1.6134351512629065e-06, + "loss": 1.1382, + "step": 20811 + }, + { + "epoch": 0.63, + "learning_rate": 1.6132070882236207e-06, + "loss": 1.2062, + "step": 20812 + }, + { + "epoch": 0.63, + "learning_rate": 1.612979033626176e-06, + "loss": 1.1064, + "step": 20813 + }, + { + "epoch": 0.63, + "learning_rate": 1.6127509874727446e-06, + "loss": 1.0576, + "step": 20814 + }, + { + "epoch": 0.63, + "learning_rate": 1.6125229497654956e-06, + "loss": 0.9991, + "step": 20815 + }, + { + "epoch": 0.63, + "learning_rate": 1.612294920506601e-06, + "loss": 1.2234, + "step": 20816 + }, + { + "epoch": 0.63, + "learning_rate": 1.6120668996982312e-06, + "loss": 1.2117, + "step": 20817 + }, + { + "epoch": 0.63, + "learning_rate": 1.6118388873425578e-06, + "loss": 1.1923, + "step": 20818 + }, + { + "epoch": 0.63, + "learning_rate": 1.6116108834417492e-06, + "loss": 1.1642, + "step": 20819 + }, + { + "epoch": 0.63, + "learning_rate": 1.6113828879979776e-06, + "loss": 1.1511, + "step": 20820 + }, + { + "epoch": 0.63, + "learning_rate": 1.6111549010134125e-06, + "loss": 1.1719, + "step": 20821 + }, + { + "epoch": 0.63, + "learning_rate": 1.6109269224902258e-06, + "loss": 0.9404, + "step": 20822 + }, + { + "epoch": 0.63, + "learning_rate": 1.6106989524305857e-06, + "loss": 1.0604, + "step": 20823 + }, + { + "epoch": 0.63, + "learning_rate": 1.6104709908366634e-06, + "loss": 1.1924, + "step": 20824 + }, + { + "epoch": 0.63, + "learning_rate": 1.6102430377106287e-06, + "loss": 1.2078, + "step": 20825 + }, + { + "epoch": 0.63, + "learning_rate": 1.6100150930546515e-06, + "loss": 1.1255, + "step": 20826 + }, + { + "epoch": 0.63, + "learning_rate": 1.6097871568709028e-06, + "loss": 1.1358, + "step": 20827 + }, + { + "epoch": 0.63, + "learning_rate": 1.609559229161551e-06, + "loss": 1.2499, + "step": 20828 + }, + { + "epoch": 0.63, + "learning_rate": 1.6093313099287667e-06, + "loss": 1.0754, + "step": 20829 + }, + { + "epoch": 0.63, + "learning_rate": 1.609103399174719e-06, + "loss": 1.172, + "step": 20830 + }, + { + "epoch": 0.63, + "learning_rate": 1.6088754969015791e-06, + "loss": 1.1371, + "step": 20831 + }, + { + "epoch": 0.63, + "learning_rate": 1.6086476031115146e-06, + "loss": 1.0791, + "step": 20832 + }, + { + "epoch": 0.63, + "learning_rate": 1.608419717806695e-06, + "loss": 1.1041, + "step": 20833 + }, + { + "epoch": 0.63, + "learning_rate": 1.6081918409892904e-06, + "loss": 1.1971, + "step": 20834 + }, + { + "epoch": 0.63, + "learning_rate": 1.6079639726614716e-06, + "loss": 1.0802, + "step": 20835 + }, + { + "epoch": 0.63, + "learning_rate": 1.6077361128254044e-06, + "loss": 1.1248, + "step": 20836 + }, + { + "epoch": 0.63, + "learning_rate": 1.60750826148326e-06, + "loss": 1.1147, + "step": 20837 + }, + { + "epoch": 0.63, + "learning_rate": 1.6072804186372072e-06, + "loss": 1.1087, + "step": 20838 + }, + { + "epoch": 0.63, + "learning_rate": 1.6070525842894146e-06, + "loss": 1.1169, + "step": 20839 + }, + { + "epoch": 0.63, + "learning_rate": 1.6068247584420521e-06, + "loss": 1.0674, + "step": 20840 + }, + { + "epoch": 0.63, + "learning_rate": 1.606596941097287e-06, + "loss": 1.1893, + "step": 20841 + }, + { + "epoch": 0.63, + "learning_rate": 1.6063691322572888e-06, + "loss": 1.0522, + "step": 20842 + }, + { + "epoch": 0.63, + "learning_rate": 1.6061413319242263e-06, + "loss": 1.1133, + "step": 20843 + }, + { + "epoch": 0.63, + "learning_rate": 1.6059135401002685e-06, + "loss": 1.2883, + "step": 20844 + }, + { + "epoch": 0.63, + "learning_rate": 1.6056857567875824e-06, + "loss": 1.1417, + "step": 20845 + }, + { + "epoch": 0.63, + "learning_rate": 1.6054579819883374e-06, + "loss": 1.1047, + "step": 20846 + }, + { + "epoch": 0.63, + "learning_rate": 1.6052302157047013e-06, + "loss": 1.2097, + "step": 20847 + }, + { + "epoch": 0.63, + "learning_rate": 1.6050024579388435e-06, + "loss": 1.0649, + "step": 20848 + }, + { + "epoch": 0.63, + "learning_rate": 1.6047747086929306e-06, + "loss": 1.1509, + "step": 20849 + }, + { + "epoch": 0.63, + "learning_rate": 1.604546967969131e-06, + "loss": 1.0778, + "step": 20850 + }, + { + "epoch": 0.63, + "learning_rate": 1.6043192357696131e-06, + "loss": 1.0065, + "step": 20851 + }, + { + "epoch": 0.63, + "learning_rate": 1.6040915120965445e-06, + "loss": 1.0954, + "step": 20852 + }, + { + "epoch": 0.63, + "learning_rate": 1.603863796952094e-06, + "loss": 1.0944, + "step": 20853 + }, + { + "epoch": 0.63, + "learning_rate": 1.603636090338428e-06, + "loss": 1.2009, + "step": 20854 + }, + { + "epoch": 0.63, + "learning_rate": 1.6034083922577148e-06, + "loss": 1.1616, + "step": 20855 + }, + { + "epoch": 0.63, + "learning_rate": 1.6031807027121216e-06, + "loss": 1.0681, + "step": 20856 + }, + { + "epoch": 0.63, + "learning_rate": 1.6029530217038176e-06, + "loss": 1.0759, + "step": 20857 + }, + { + "epoch": 0.63, + "learning_rate": 1.6027253492349676e-06, + "loss": 1.1026, + "step": 20858 + }, + { + "epoch": 0.63, + "learning_rate": 1.60249768530774e-06, + "loss": 1.1077, + "step": 20859 + }, + { + "epoch": 0.63, + "learning_rate": 1.6022700299243022e-06, + "loss": 1.1705, + "step": 20860 + }, + { + "epoch": 0.63, + "learning_rate": 1.6020423830868226e-06, + "loss": 1.1505, + "step": 20861 + }, + { + "epoch": 0.63, + "learning_rate": 1.6018147447974658e-06, + "loss": 1.095, + "step": 20862 + }, + { + "epoch": 0.63, + "learning_rate": 1.6015871150584e-06, + "loss": 1.0161, + "step": 20863 + }, + { + "epoch": 0.63, + "learning_rate": 1.6013594938717925e-06, + "loss": 0.9828, + "step": 20864 + }, + { + "epoch": 0.63, + "learning_rate": 1.6011318812398096e-06, + "loss": 1.0673, + "step": 20865 + }, + { + "epoch": 0.63, + "learning_rate": 1.6009042771646189e-06, + "loss": 1.0803, + "step": 20866 + }, + { + "epoch": 0.63, + "learning_rate": 1.600676681648386e-06, + "loss": 1.1875, + "step": 20867 + }, + { + "epoch": 0.63, + "learning_rate": 1.6004490946932782e-06, + "loss": 1.0597, + "step": 20868 + }, + { + "epoch": 0.63, + "learning_rate": 1.6002215163014612e-06, + "loss": 1.1159, + "step": 20869 + }, + { + "epoch": 0.63, + "learning_rate": 1.5999939464751029e-06, + "loss": 1.128, + "step": 20870 + }, + { + "epoch": 0.63, + "learning_rate": 1.599766385216368e-06, + "loss": 1.1103, + "step": 20871 + }, + { + "epoch": 0.63, + "learning_rate": 1.5995388325274236e-06, + "loss": 1.1393, + "step": 20872 + }, + { + "epoch": 0.63, + "learning_rate": 1.5993112884104361e-06, + "loss": 1.064, + "step": 20873 + }, + { + "epoch": 0.63, + "learning_rate": 1.599083752867572e-06, + "loss": 1.1253, + "step": 20874 + }, + { + "epoch": 0.63, + "learning_rate": 1.598856225900996e-06, + "loss": 1.202, + "step": 20875 + }, + { + "epoch": 0.63, + "learning_rate": 1.5986287075128743e-06, + "loss": 1.0526, + "step": 20876 + }, + { + "epoch": 0.63, + "learning_rate": 1.5984011977053737e-06, + "loss": 1.1811, + "step": 20877 + }, + { + "epoch": 0.63, + "learning_rate": 1.598173696480659e-06, + "loss": 1.0847, + "step": 20878 + }, + { + "epoch": 0.63, + "learning_rate": 1.5979462038408977e-06, + "loss": 1.1459, + "step": 20879 + }, + { + "epoch": 0.63, + "learning_rate": 1.5977187197882529e-06, + "loss": 1.1592, + "step": 20880 + }, + { + "epoch": 0.63, + "learning_rate": 1.5974912443248913e-06, + "loss": 1.1102, + "step": 20881 + }, + { + "epoch": 0.63, + "learning_rate": 1.5972637774529788e-06, + "loss": 1.174, + "step": 20882 + }, + { + "epoch": 0.63, + "learning_rate": 1.5970363191746805e-06, + "loss": 1.0474, + "step": 20883 + }, + { + "epoch": 0.63, + "learning_rate": 1.596808869492161e-06, + "loss": 1.1772, + "step": 20884 + }, + { + "epoch": 0.63, + "learning_rate": 1.5965814284075862e-06, + "loss": 1.1298, + "step": 20885 + }, + { + "epoch": 0.63, + "learning_rate": 1.596353995923121e-06, + "loss": 1.1747, + "step": 20886 + }, + { + "epoch": 0.63, + "learning_rate": 1.596126572040932e-06, + "loss": 1.116, + "step": 20887 + }, + { + "epoch": 0.63, + "learning_rate": 1.5958991567631809e-06, + "loss": 1.0175, + "step": 20888 + }, + { + "epoch": 0.63, + "learning_rate": 1.5956717500920348e-06, + "loss": 1.117, + "step": 20889 + }, + { + "epoch": 0.63, + "learning_rate": 1.5954443520296584e-06, + "loss": 1.0201, + "step": 20890 + }, + { + "epoch": 0.63, + "learning_rate": 1.595216962578216e-06, + "loss": 1.0742, + "step": 20891 + }, + { + "epoch": 0.63, + "learning_rate": 1.594989581739873e-06, + "loss": 1.1682, + "step": 20892 + }, + { + "epoch": 0.63, + "learning_rate": 1.5947622095167926e-06, + "loss": 1.1078, + "step": 20893 + }, + { + "epoch": 0.63, + "learning_rate": 1.5945348459111398e-06, + "loss": 1.1151, + "step": 20894 + }, + { + "epoch": 0.63, + "learning_rate": 1.5943074909250794e-06, + "loss": 1.1, + "step": 20895 + }, + { + "epoch": 0.63, + "learning_rate": 1.594080144560776e-06, + "loss": 1.1376, + "step": 20896 + }, + { + "epoch": 0.63, + "learning_rate": 1.5938528068203927e-06, + "loss": 1.12, + "step": 20897 + }, + { + "epoch": 0.63, + "learning_rate": 1.5936254777060944e-06, + "loss": 1.1473, + "step": 20898 + }, + { + "epoch": 0.63, + "learning_rate": 1.5933981572200446e-06, + "loss": 1.1165, + "step": 20899 + }, + { + "epoch": 0.63, + "learning_rate": 1.593170845364409e-06, + "loss": 1.2193, + "step": 20900 + }, + { + "epoch": 0.63, + "learning_rate": 1.5929435421413495e-06, + "loss": 1.182, + "step": 20901 + }, + { + "epoch": 0.63, + "learning_rate": 1.5927162475530303e-06, + "loss": 1.1072, + "step": 20902 + }, + { + "epoch": 0.63, + "learning_rate": 1.5924889616016154e-06, + "loss": 1.0954, + "step": 20903 + }, + { + "epoch": 0.63, + "learning_rate": 1.5922616842892684e-06, + "loss": 1.0984, + "step": 20904 + }, + { + "epoch": 0.63, + "learning_rate": 1.5920344156181545e-06, + "loss": 1.1656, + "step": 20905 + }, + { + "epoch": 0.63, + "learning_rate": 1.5918071555904344e-06, + "loss": 1.295, + "step": 20906 + }, + { + "epoch": 0.63, + "learning_rate": 1.5915799042082728e-06, + "loss": 1.1141, + "step": 20907 + }, + { + "epoch": 0.63, + "learning_rate": 1.5913526614738328e-06, + "loss": 1.1277, + "step": 20908 + }, + { + "epoch": 0.63, + "learning_rate": 1.5911254273892785e-06, + "loss": 1.0248, + "step": 20909 + }, + { + "epoch": 0.63, + "learning_rate": 1.590898201956772e-06, + "loss": 1.0494, + "step": 20910 + }, + { + "epoch": 0.63, + "learning_rate": 1.5906709851784768e-06, + "loss": 1.2122, + "step": 20911 + }, + { + "epoch": 0.63, + "learning_rate": 1.5904437770565557e-06, + "loss": 1.1796, + "step": 20912 + }, + { + "epoch": 0.63, + "learning_rate": 1.5902165775931727e-06, + "loss": 1.1287, + "step": 20913 + }, + { + "epoch": 0.63, + "learning_rate": 1.589989386790489e-06, + "loss": 1.1038, + "step": 20914 + }, + { + "epoch": 0.63, + "learning_rate": 1.5897622046506678e-06, + "loss": 1.1021, + "step": 20915 + }, + { + "epoch": 0.63, + "learning_rate": 1.5895350311758723e-06, + "loss": 1.1649, + "step": 20916 + }, + { + "epoch": 0.63, + "learning_rate": 1.5893078663682646e-06, + "loss": 1.077, + "step": 20917 + }, + { + "epoch": 0.63, + "learning_rate": 1.5890807102300085e-06, + "loss": 1.1151, + "step": 20918 + }, + { + "epoch": 0.63, + "learning_rate": 1.5888535627632642e-06, + "loss": 1.1143, + "step": 20919 + }, + { + "epoch": 0.63, + "learning_rate": 1.5886264239701953e-06, + "loss": 1.1523, + "step": 20920 + }, + { + "epoch": 0.63, + "learning_rate": 1.5883992938529639e-06, + "loss": 1.0549, + "step": 20921 + }, + { + "epoch": 0.63, + "learning_rate": 1.5881721724137328e-06, + "loss": 1.1741, + "step": 20922 + }, + { + "epoch": 0.63, + "learning_rate": 1.5879450596546626e-06, + "loss": 1.1847, + "step": 20923 + }, + { + "epoch": 0.63, + "learning_rate": 1.5877179555779165e-06, + "loss": 1.1355, + "step": 20924 + }, + { + "epoch": 0.63, + "learning_rate": 1.587490860185656e-06, + "loss": 1.1067, + "step": 20925 + }, + { + "epoch": 0.63, + "learning_rate": 1.5872637734800439e-06, + "loss": 1.058, + "step": 20926 + }, + { + "epoch": 0.63, + "learning_rate": 1.5870366954632402e-06, + "loss": 1.1423, + "step": 20927 + }, + { + "epoch": 0.63, + "learning_rate": 1.5868096261374071e-06, + "loss": 1.0383, + "step": 20928 + }, + { + "epoch": 0.63, + "learning_rate": 1.5865825655047073e-06, + "loss": 1.1082, + "step": 20929 + }, + { + "epoch": 0.63, + "learning_rate": 1.5863555135673008e-06, + "loss": 1.1346, + "step": 20930 + }, + { + "epoch": 0.63, + "learning_rate": 1.5861284703273514e-06, + "loss": 1.1755, + "step": 20931 + }, + { + "epoch": 0.63, + "learning_rate": 1.5859014357870176e-06, + "loss": 1.0244, + "step": 20932 + }, + { + "epoch": 0.63, + "learning_rate": 1.5856744099484617e-06, + "loss": 1.1313, + "step": 20933 + }, + { + "epoch": 0.63, + "learning_rate": 1.5854473928138452e-06, + "loss": 1.1688, + "step": 20934 + }, + { + "epoch": 0.63, + "learning_rate": 1.5852203843853298e-06, + "loss": 1.181, + "step": 20935 + }, + { + "epoch": 0.63, + "learning_rate": 1.584993384665075e-06, + "loss": 1.0555, + "step": 20936 + }, + { + "epoch": 0.63, + "learning_rate": 1.5847663936552427e-06, + "loss": 1.2039, + "step": 20937 + }, + { + "epoch": 0.63, + "learning_rate": 1.5845394113579931e-06, + "loss": 1.1519, + "step": 20938 + }, + { + "epoch": 0.63, + "learning_rate": 1.5843124377754887e-06, + "loss": 1.0216, + "step": 20939 + }, + { + "epoch": 0.63, + "learning_rate": 1.5840854729098881e-06, + "loss": 1.0601, + "step": 20940 + }, + { + "epoch": 0.63, + "learning_rate": 1.5838585167633525e-06, + "loss": 1.2139, + "step": 20941 + }, + { + "epoch": 0.63, + "learning_rate": 1.5836315693380422e-06, + "loss": 1.1111, + "step": 20942 + }, + { + "epoch": 0.63, + "learning_rate": 1.5834046306361184e-06, + "loss": 1.153, + "step": 20943 + }, + { + "epoch": 0.63, + "learning_rate": 1.583177700659742e-06, + "loss": 1.2159, + "step": 20944 + }, + { + "epoch": 0.63, + "learning_rate": 1.5829507794110716e-06, + "loss": 1.1591, + "step": 20945 + }, + { + "epoch": 0.63, + "learning_rate": 1.582723866892268e-06, + "loss": 1.0974, + "step": 20946 + }, + { + "epoch": 0.63, + "learning_rate": 1.582496963105491e-06, + "loss": 1.0943, + "step": 20947 + }, + { + "epoch": 0.63, + "learning_rate": 1.5822700680529018e-06, + "loss": 1.1465, + "step": 20948 + }, + { + "epoch": 0.63, + "learning_rate": 1.5820431817366591e-06, + "loss": 1.1669, + "step": 20949 + }, + { + "epoch": 0.63, + "learning_rate": 1.5818163041589232e-06, + "loss": 1.1115, + "step": 20950 + }, + { + "epoch": 0.63, + "learning_rate": 1.5815894353218542e-06, + "loss": 1.1812, + "step": 20951 + }, + { + "epoch": 0.63, + "learning_rate": 1.5813625752276118e-06, + "loss": 1.1049, + "step": 20952 + }, + { + "epoch": 0.63, + "learning_rate": 1.5811357238783546e-06, + "loss": 0.9398, + "step": 20953 + }, + { + "epoch": 0.63, + "learning_rate": 1.5809088812762428e-06, + "loss": 1.2678, + "step": 20954 + }, + { + "epoch": 0.63, + "learning_rate": 1.5806820474234355e-06, + "loss": 1.2136, + "step": 20955 + }, + { + "epoch": 0.63, + "learning_rate": 1.5804552223220927e-06, + "loss": 1.1293, + "step": 20956 + }, + { + "epoch": 0.63, + "learning_rate": 1.5802284059743741e-06, + "loss": 1.0716, + "step": 20957 + }, + { + "epoch": 0.63, + "learning_rate": 1.5800015983824375e-06, + "loss": 1.1602, + "step": 20958 + }, + { + "epoch": 0.63, + "learning_rate": 1.5797747995484418e-06, + "loss": 1.0491, + "step": 20959 + }, + { + "epoch": 0.63, + "learning_rate": 1.5795480094745475e-06, + "loss": 1.11, + "step": 20960 + }, + { + "epoch": 0.63, + "learning_rate": 1.5793212281629134e-06, + "loss": 1.1774, + "step": 20961 + }, + { + "epoch": 0.63, + "learning_rate": 1.5790944556156974e-06, + "loss": 1.11, + "step": 20962 + }, + { + "epoch": 0.63, + "learning_rate": 1.5788676918350583e-06, + "loss": 1.1577, + "step": 20963 + }, + { + "epoch": 0.63, + "learning_rate": 1.5786409368231552e-06, + "loss": 1.1344, + "step": 20964 + }, + { + "epoch": 0.63, + "learning_rate": 1.5784141905821471e-06, + "loss": 1.0864, + "step": 20965 + }, + { + "epoch": 0.63, + "learning_rate": 1.5781874531141914e-06, + "loss": 1.0026, + "step": 20966 + }, + { + "epoch": 0.63, + "learning_rate": 1.5779607244214474e-06, + "loss": 1.2198, + "step": 20967 + }, + { + "epoch": 0.63, + "learning_rate": 1.577734004506073e-06, + "loss": 1.0182, + "step": 20968 + }, + { + "epoch": 0.63, + "learning_rate": 1.577507293370228e-06, + "loss": 1.1848, + "step": 20969 + }, + { + "epoch": 0.63, + "learning_rate": 1.577280591016068e-06, + "loss": 1.0487, + "step": 20970 + }, + { + "epoch": 0.63, + "learning_rate": 1.5770538974457524e-06, + "loss": 1.089, + "step": 20971 + }, + { + "epoch": 0.63, + "learning_rate": 1.5768272126614393e-06, + "loss": 1.0938, + "step": 20972 + }, + { + "epoch": 0.63, + "learning_rate": 1.5766005366652865e-06, + "loss": 1.1181, + "step": 20973 + }, + { + "epoch": 0.63, + "learning_rate": 1.576373869459453e-06, + "loss": 1.2036, + "step": 20974 + }, + { + "epoch": 0.63, + "learning_rate": 1.5761472110460944e-06, + "loss": 1.1845, + "step": 20975 + }, + { + "epoch": 0.63, + "learning_rate": 1.5759205614273692e-06, + "loss": 1.1495, + "step": 20976 + }, + { + "epoch": 0.63, + "learning_rate": 1.5756939206054352e-06, + "loss": 1.1151, + "step": 20977 + }, + { + "epoch": 0.63, + "learning_rate": 1.5754672885824507e-06, + "loss": 1.141, + "step": 20978 + }, + { + "epoch": 0.63, + "learning_rate": 1.5752406653605718e-06, + "loss": 1.1412, + "step": 20979 + }, + { + "epoch": 0.63, + "learning_rate": 1.5750140509419562e-06, + "loss": 1.3185, + "step": 20980 + }, + { + "epoch": 0.63, + "learning_rate": 1.5747874453287615e-06, + "loss": 1.2095, + "step": 20981 + }, + { + "epoch": 0.63, + "learning_rate": 1.5745608485231455e-06, + "loss": 1.1144, + "step": 20982 + }, + { + "epoch": 0.63, + "learning_rate": 1.5743342605272637e-06, + "loss": 1.1744, + "step": 20983 + }, + { + "epoch": 0.63, + "learning_rate": 1.5741076813432738e-06, + "loss": 1.1185, + "step": 20984 + }, + { + "epoch": 0.63, + "learning_rate": 1.573881110973333e-06, + "loss": 1.1763, + "step": 20985 + }, + { + "epoch": 0.63, + "learning_rate": 1.573654549419598e-06, + "loss": 1.123, + "step": 20986 + }, + { + "epoch": 0.63, + "learning_rate": 1.5734279966842264e-06, + "loss": 1.163, + "step": 20987 + }, + { + "epoch": 0.63, + "learning_rate": 1.573201452769373e-06, + "loss": 1.1205, + "step": 20988 + }, + { + "epoch": 0.63, + "learning_rate": 1.5729749176771954e-06, + "loss": 1.1544, + "step": 20989 + }, + { + "epoch": 0.63, + "learning_rate": 1.5727483914098501e-06, + "loss": 1.198, + "step": 20990 + }, + { + "epoch": 0.63, + "learning_rate": 1.5725218739694942e-06, + "loss": 1.0872, + "step": 20991 + }, + { + "epoch": 0.63, + "learning_rate": 1.5722953653582829e-06, + "loss": 1.1189, + "step": 20992 + }, + { + "epoch": 0.63, + "learning_rate": 1.5720688655783727e-06, + "loss": 1.2479, + "step": 20993 + }, + { + "epoch": 0.63, + "learning_rate": 1.5718423746319204e-06, + "loss": 1.0686, + "step": 20994 + }, + { + "epoch": 0.63, + "learning_rate": 1.5716158925210823e-06, + "loss": 1.0531, + "step": 20995 + }, + { + "epoch": 0.63, + "learning_rate": 1.5713894192480129e-06, + "loss": 1.0817, + "step": 20996 + }, + { + "epoch": 0.63, + "learning_rate": 1.5711629548148687e-06, + "loss": 1.132, + "step": 20997 + }, + { + "epoch": 0.63, + "learning_rate": 1.5709364992238062e-06, + "loss": 1.1365, + "step": 20998 + }, + { + "epoch": 0.63, + "learning_rate": 1.5707100524769809e-06, + "loss": 1.0616, + "step": 20999 + }, + { + "epoch": 0.63, + "learning_rate": 1.570483614576549e-06, + "loss": 0.9748, + "step": 21000 + }, + { + "epoch": 0.63, + "learning_rate": 1.5702571855246645e-06, + "loss": 1.1283, + "step": 21001 + }, + { + "epoch": 0.63, + "learning_rate": 1.570030765323484e-06, + "loss": 1.0892, + "step": 21002 + }, + { + "epoch": 0.63, + "learning_rate": 1.5698043539751626e-06, + "loss": 1.0352, + "step": 21003 + }, + { + "epoch": 0.63, + "learning_rate": 1.569577951481856e-06, + "loss": 1.1371, + "step": 21004 + }, + { + "epoch": 0.63, + "learning_rate": 1.569351557845719e-06, + "loss": 1.0471, + "step": 21005 + }, + { + "epoch": 0.63, + "learning_rate": 1.5691251730689069e-06, + "loss": 1.0976, + "step": 21006 + }, + { + "epoch": 0.63, + "learning_rate": 1.5688987971535746e-06, + "loss": 1.1419, + "step": 21007 + }, + { + "epoch": 0.63, + "learning_rate": 1.5686724301018789e-06, + "loss": 1.0262, + "step": 21008 + }, + { + "epoch": 0.63, + "learning_rate": 1.5684460719159717e-06, + "loss": 1.0452, + "step": 21009 + }, + { + "epoch": 0.63, + "learning_rate": 1.5682197225980091e-06, + "loss": 1.1008, + "step": 21010 + }, + { + "epoch": 0.63, + "learning_rate": 1.5679933821501463e-06, + "loss": 1.0916, + "step": 21011 + }, + { + "epoch": 0.63, + "learning_rate": 1.5677670505745373e-06, + "loss": 1.0837, + "step": 21012 + }, + { + "epoch": 0.63, + "learning_rate": 1.5675407278733385e-06, + "loss": 1.1556, + "step": 21013 + }, + { + "epoch": 0.63, + "learning_rate": 1.5673144140487014e-06, + "loss": 1.0617, + "step": 21014 + }, + { + "epoch": 0.63, + "learning_rate": 1.5670881091027821e-06, + "loss": 1.1069, + "step": 21015 + }, + { + "epoch": 0.63, + "learning_rate": 1.5668618130377345e-06, + "loss": 1.0157, + "step": 21016 + }, + { + "epoch": 0.63, + "learning_rate": 1.5666355258557137e-06, + "loss": 1.0734, + "step": 21017 + }, + { + "epoch": 0.63, + "learning_rate": 1.5664092475588727e-06, + "loss": 1.0997, + "step": 21018 + }, + { + "epoch": 0.63, + "learning_rate": 1.566182978149366e-06, + "loss": 1.0228, + "step": 21019 + }, + { + "epoch": 0.63, + "learning_rate": 1.5659567176293477e-06, + "loss": 1.1641, + "step": 21020 + }, + { + "epoch": 0.63, + "learning_rate": 1.5657304660009725e-06, + "loss": 1.2411, + "step": 21021 + }, + { + "epoch": 0.63, + "learning_rate": 1.5655042232663921e-06, + "loss": 1.1208, + "step": 21022 + }, + { + "epoch": 0.63, + "learning_rate": 1.5652779894277618e-06, + "loss": 1.1721, + "step": 21023 + }, + { + "epoch": 0.63, + "learning_rate": 1.5650517644872345e-06, + "loss": 1.0756, + "step": 21024 + }, + { + "epoch": 0.63, + "learning_rate": 1.5648255484469644e-06, + "loss": 1.215, + "step": 21025 + }, + { + "epoch": 0.63, + "learning_rate": 1.5645993413091057e-06, + "loss": 1.1627, + "step": 21026 + }, + { + "epoch": 0.63, + "learning_rate": 1.5643731430758098e-06, + "loss": 1.0616, + "step": 21027 + }, + { + "epoch": 0.63, + "learning_rate": 1.5641469537492304e-06, + "loss": 1.0146, + "step": 21028 + }, + { + "epoch": 0.63, + "learning_rate": 1.563920773331522e-06, + "loss": 1.1543, + "step": 21029 + }, + { + "epoch": 0.63, + "learning_rate": 1.5636946018248373e-06, + "loss": 1.1744, + "step": 21030 + }, + { + "epoch": 0.63, + "learning_rate": 1.5634684392313282e-06, + "loss": 1.1055, + "step": 21031 + }, + { + "epoch": 0.63, + "learning_rate": 1.5632422855531488e-06, + "loss": 1.2343, + "step": 21032 + }, + { + "epoch": 0.63, + "learning_rate": 1.563016140792452e-06, + "loss": 0.994, + "step": 21033 + }, + { + "epoch": 0.63, + "learning_rate": 1.5627900049513906e-06, + "loss": 1.072, + "step": 21034 + }, + { + "epoch": 0.63, + "learning_rate": 1.5625638780321162e-06, + "loss": 1.1554, + "step": 21035 + }, + { + "epoch": 0.63, + "learning_rate": 1.5623377600367822e-06, + "loss": 1.2567, + "step": 21036 + }, + { + "epoch": 0.63, + "learning_rate": 1.5621116509675413e-06, + "loss": 1.0911, + "step": 21037 + }, + { + "epoch": 0.63, + "learning_rate": 1.5618855508265457e-06, + "loss": 1.2721, + "step": 21038 + }, + { + "epoch": 0.63, + "learning_rate": 1.561659459615949e-06, + "loss": 1.1462, + "step": 21039 + }, + { + "epoch": 0.63, + "learning_rate": 1.561433377337901e-06, + "loss": 1.1715, + "step": 21040 + }, + { + "epoch": 0.63, + "learning_rate": 1.5612073039945553e-06, + "loss": 1.2261, + "step": 21041 + }, + { + "epoch": 0.63, + "learning_rate": 1.560981239588064e-06, + "loss": 1.1224, + "step": 21042 + }, + { + "epoch": 0.63, + "learning_rate": 1.5607551841205798e-06, + "loss": 1.0969, + "step": 21043 + }, + { + "epoch": 0.63, + "learning_rate": 1.5605291375942536e-06, + "loss": 1.0197, + "step": 21044 + }, + { + "epoch": 0.63, + "learning_rate": 1.560303100011237e-06, + "loss": 1.1096, + "step": 21045 + }, + { + "epoch": 0.63, + "learning_rate": 1.5600770713736824e-06, + "loss": 1.0578, + "step": 21046 + }, + { + "epoch": 0.63, + "learning_rate": 1.5598510516837418e-06, + "loss": 1.0981, + "step": 21047 + }, + { + "epoch": 0.63, + "learning_rate": 1.5596250409435662e-06, + "loss": 1.1197, + "step": 21048 + }, + { + "epoch": 0.63, + "learning_rate": 1.5593990391553072e-06, + "loss": 1.1752, + "step": 21049 + }, + { + "epoch": 0.63, + "learning_rate": 1.559173046321116e-06, + "loss": 1.1948, + "step": 21050 + }, + { + "epoch": 0.63, + "learning_rate": 1.5589470624431446e-06, + "loss": 1.0805, + "step": 21051 + }, + { + "epoch": 0.63, + "learning_rate": 1.5587210875235449e-06, + "loss": 1.1268, + "step": 21052 + }, + { + "epoch": 0.63, + "learning_rate": 1.5584951215644661e-06, + "loss": 1.0688, + "step": 21053 + }, + { + "epoch": 0.63, + "learning_rate": 1.5582691645680602e-06, + "loss": 1.1136, + "step": 21054 + }, + { + "epoch": 0.63, + "learning_rate": 1.5580432165364783e-06, + "loss": 1.044, + "step": 21055 + }, + { + "epoch": 0.63, + "learning_rate": 1.5578172774718726e-06, + "loss": 1.1325, + "step": 21056 + }, + { + "epoch": 0.63, + "learning_rate": 1.5575913473763916e-06, + "loss": 1.0808, + "step": 21057 + }, + { + "epoch": 0.63, + "learning_rate": 1.5573654262521868e-06, + "loss": 1.0441, + "step": 21058 + }, + { + "epoch": 0.63, + "learning_rate": 1.5571395141014092e-06, + "loss": 1.0684, + "step": 21059 + }, + { + "epoch": 0.63, + "learning_rate": 1.55691361092621e-06, + "loss": 1.126, + "step": 21060 + }, + { + "epoch": 0.63, + "learning_rate": 1.5566877167287386e-06, + "loss": 1.1588, + "step": 21061 + }, + { + "epoch": 0.63, + "learning_rate": 1.5564618315111458e-06, + "loss": 1.1375, + "step": 21062 + }, + { + "epoch": 0.63, + "learning_rate": 1.5562359552755814e-06, + "loss": 1.1273, + "step": 21063 + }, + { + "epoch": 0.63, + "learning_rate": 1.5560100880241967e-06, + "loss": 1.0529, + "step": 21064 + }, + { + "epoch": 0.63, + "learning_rate": 1.5557842297591421e-06, + "loss": 1.1273, + "step": 21065 + }, + { + "epoch": 0.63, + "learning_rate": 1.555558380482566e-06, + "loss": 1.1429, + "step": 21066 + }, + { + "epoch": 0.63, + "learning_rate": 1.5553325401966193e-06, + "loss": 1.054, + "step": 21067 + }, + { + "epoch": 0.63, + "learning_rate": 1.5551067089034518e-06, + "loss": 1.1755, + "step": 21068 + }, + { + "epoch": 0.63, + "learning_rate": 1.5548808866052146e-06, + "loss": 1.1118, + "step": 21069 + }, + { + "epoch": 0.63, + "learning_rate": 1.5546550733040546e-06, + "loss": 1.0911, + "step": 21070 + }, + { + "epoch": 0.63, + "learning_rate": 1.5544292690021234e-06, + "loss": 1.1147, + "step": 21071 + }, + { + "epoch": 0.63, + "learning_rate": 1.5542034737015702e-06, + "loss": 1.0753, + "step": 21072 + }, + { + "epoch": 0.63, + "learning_rate": 1.5539776874045448e-06, + "loss": 1.1021, + "step": 21073 + }, + { + "epoch": 0.63, + "learning_rate": 1.5537519101131957e-06, + "loss": 1.189, + "step": 21074 + }, + { + "epoch": 0.63, + "learning_rate": 1.5535261418296727e-06, + "loss": 1.1917, + "step": 21075 + }, + { + "epoch": 0.63, + "learning_rate": 1.553300382556125e-06, + "loss": 1.0444, + "step": 21076 + }, + { + "epoch": 0.63, + "learning_rate": 1.5530746322947015e-06, + "loss": 1.0624, + "step": 21077 + }, + { + "epoch": 0.63, + "learning_rate": 1.5528488910475528e-06, + "loss": 1.0218, + "step": 21078 + }, + { + "epoch": 0.64, + "learning_rate": 1.5526231588168253e-06, + "loss": 1.1838, + "step": 21079 + }, + { + "epoch": 0.64, + "learning_rate": 1.552397435604669e-06, + "loss": 1.0865, + "step": 21080 + }, + { + "epoch": 0.64, + "learning_rate": 1.5521717214132328e-06, + "loss": 1.168, + "step": 21081 + }, + { + "epoch": 0.64, + "learning_rate": 1.5519460162446665e-06, + "loss": 1.0704, + "step": 21082 + }, + { + "epoch": 0.64, + "learning_rate": 1.5517203201011164e-06, + "loss": 0.9963, + "step": 21083 + }, + { + "epoch": 0.64, + "learning_rate": 1.5514946329847318e-06, + "loss": 1.1591, + "step": 21084 + }, + { + "epoch": 0.64, + "learning_rate": 1.551268954897662e-06, + "loss": 1.0641, + "step": 21085 + }, + { + "epoch": 0.64, + "learning_rate": 1.5510432858420552e-06, + "loss": 1.0937, + "step": 21086 + }, + { + "epoch": 0.64, + "learning_rate": 1.5508176258200585e-06, + "loss": 1.0924, + "step": 21087 + }, + { + "epoch": 0.64, + "learning_rate": 1.550591974833821e-06, + "loss": 1.1202, + "step": 21088 + }, + { + "epoch": 0.64, + "learning_rate": 1.5503663328854909e-06, + "loss": 1.1232, + "step": 21089 + }, + { + "epoch": 0.64, + "learning_rate": 1.5501406999772157e-06, + "loss": 1.0344, + "step": 21090 + }, + { + "epoch": 0.64, + "learning_rate": 1.5499150761111447e-06, + "loss": 1.2241, + "step": 21091 + }, + { + "epoch": 0.64, + "learning_rate": 1.5496894612894237e-06, + "loss": 1.0379, + "step": 21092 + }, + { + "epoch": 0.64, + "learning_rate": 1.549463855514201e-06, + "loss": 1.1333, + "step": 21093 + }, + { + "epoch": 0.64, + "learning_rate": 1.5492382587876248e-06, + "loss": 1.1172, + "step": 21094 + }, + { + "epoch": 0.64, + "learning_rate": 1.5490126711118435e-06, + "loss": 1.0446, + "step": 21095 + }, + { + "epoch": 0.64, + "learning_rate": 1.5487870924890026e-06, + "loss": 1.1646, + "step": 21096 + }, + { + "epoch": 0.64, + "learning_rate": 1.5485615229212502e-06, + "loss": 1.1043, + "step": 21097 + }, + { + "epoch": 0.64, + "learning_rate": 1.5483359624107342e-06, + "loss": 1.1377, + "step": 21098 + }, + { + "epoch": 0.64, + "learning_rate": 1.5481104109596018e-06, + "loss": 1.2593, + "step": 21099 + }, + { + "epoch": 0.64, + "learning_rate": 1.5478848685699994e-06, + "loss": 1.1187, + "step": 21100 + }, + { + "epoch": 0.64, + "learning_rate": 1.5476593352440744e-06, + "loss": 1.1731, + "step": 21101 + }, + { + "epoch": 0.64, + "learning_rate": 1.547433810983974e-06, + "loss": 0.9746, + "step": 21102 + }, + { + "epoch": 0.64, + "learning_rate": 1.547208295791845e-06, + "loss": 1.0703, + "step": 21103 + }, + { + "epoch": 0.64, + "learning_rate": 1.5469827896698348e-06, + "loss": 1.0991, + "step": 21104 + }, + { + "epoch": 0.64, + "learning_rate": 1.546757292620089e-06, + "loss": 1.1459, + "step": 21105 + }, + { + "epoch": 0.64, + "learning_rate": 1.5465318046447542e-06, + "loss": 1.1173, + "step": 21106 + }, + { + "epoch": 0.64, + "learning_rate": 1.5463063257459776e-06, + "loss": 1.027, + "step": 21107 + }, + { + "epoch": 0.64, + "learning_rate": 1.5460808559259063e-06, + "loss": 1.116, + "step": 21108 + }, + { + "epoch": 0.64, + "learning_rate": 1.545855395186685e-06, + "loss": 1.1266, + "step": 21109 + }, + { + "epoch": 0.64, + "learning_rate": 1.545629943530461e-06, + "loss": 1.0853, + "step": 21110 + }, + { + "epoch": 0.64, + "learning_rate": 1.5454045009593799e-06, + "loss": 1.1507, + "step": 21111 + }, + { + "epoch": 0.64, + "learning_rate": 1.545179067475589e-06, + "loss": 1.0987, + "step": 21112 + }, + { + "epoch": 0.64, + "learning_rate": 1.544953643081233e-06, + "loss": 1.1865, + "step": 21113 + }, + { + "epoch": 0.64, + "learning_rate": 1.544728227778458e-06, + "loss": 1.1477, + "step": 21114 + }, + { + "epoch": 0.64, + "learning_rate": 1.544502821569411e-06, + "loss": 1.0167, + "step": 21115 + }, + { + "epoch": 0.64, + "learning_rate": 1.5442774244562363e-06, + "loss": 1.1144, + "step": 21116 + }, + { + "epoch": 0.64, + "learning_rate": 1.544052036441081e-06, + "loss": 1.0677, + "step": 21117 + }, + { + "epoch": 0.64, + "learning_rate": 1.5438266575260892e-06, + "loss": 1.0608, + "step": 21118 + }, + { + "epoch": 0.64, + "learning_rate": 1.5436012877134072e-06, + "loss": 1.1541, + "step": 21119 + }, + { + "epoch": 0.64, + "learning_rate": 1.5433759270051802e-06, + "loss": 1.1154, + "step": 21120 + }, + { + "epoch": 0.64, + "learning_rate": 1.5431505754035547e-06, + "loss": 1.1252, + "step": 21121 + }, + { + "epoch": 0.64, + "learning_rate": 1.5429252329106743e-06, + "loss": 1.1479, + "step": 21122 + }, + { + "epoch": 0.64, + "learning_rate": 1.542699899528684e-06, + "loss": 1.0854, + "step": 21123 + }, + { + "epoch": 0.64, + "learning_rate": 1.54247457525973e-06, + "loss": 1.2039, + "step": 21124 + }, + { + "epoch": 0.64, + "learning_rate": 1.5422492601059575e-06, + "loss": 1.0754, + "step": 21125 + }, + { + "epoch": 0.64, + "learning_rate": 1.5420239540695104e-06, + "loss": 1.0243, + "step": 21126 + }, + { + "epoch": 0.64, + "learning_rate": 1.5417986571525336e-06, + "loss": 1.0276, + "step": 21127 + }, + { + "epoch": 0.64, + "learning_rate": 1.5415733693571722e-06, + "loss": 1.1554, + "step": 21128 + }, + { + "epoch": 0.64, + "learning_rate": 1.5413480906855704e-06, + "loss": 1.204, + "step": 21129 + }, + { + "epoch": 0.64, + "learning_rate": 1.541122821139874e-06, + "loss": 1.1323, + "step": 21130 + }, + { + "epoch": 0.64, + "learning_rate": 1.540897560722226e-06, + "loss": 1.0614, + "step": 21131 + }, + { + "epoch": 0.64, + "learning_rate": 1.540672309434771e-06, + "loss": 1.1507, + "step": 21132 + }, + { + "epoch": 0.64, + "learning_rate": 1.5404470672796537e-06, + "loss": 1.1849, + "step": 21133 + }, + { + "epoch": 0.64, + "learning_rate": 1.5402218342590192e-06, + "loss": 1.0086, + "step": 21134 + }, + { + "epoch": 0.64, + "learning_rate": 1.5399966103750097e-06, + "loss": 1.2108, + "step": 21135 + }, + { + "epoch": 0.64, + "learning_rate": 1.53977139562977e-06, + "loss": 1.0177, + "step": 21136 + }, + { + "epoch": 0.64, + "learning_rate": 1.5395461900254441e-06, + "loss": 1.2343, + "step": 21137 + }, + { + "epoch": 0.64, + "learning_rate": 1.539320993564177e-06, + "loss": 1.0784, + "step": 21138 + }, + { + "epoch": 0.64, + "learning_rate": 1.5390958062481104e-06, + "loss": 1.0416, + "step": 21139 + }, + { + "epoch": 0.64, + "learning_rate": 1.5388706280793888e-06, + "loss": 1.1097, + "step": 21140 + }, + { + "epoch": 0.64, + "learning_rate": 1.538645459060156e-06, + "loss": 1.1667, + "step": 21141 + }, + { + "epoch": 0.64, + "learning_rate": 1.5384202991925554e-06, + "loss": 1.0802, + "step": 21142 + }, + { + "epoch": 0.64, + "learning_rate": 1.538195148478731e-06, + "loss": 0.9866, + "step": 21143 + }, + { + "epoch": 0.64, + "learning_rate": 1.537970006920825e-06, + "loss": 1.1005, + "step": 21144 + }, + { + "epoch": 0.64, + "learning_rate": 1.537744874520981e-06, + "loss": 1.092, + "step": 21145 + }, + { + "epoch": 0.64, + "learning_rate": 1.5375197512813427e-06, + "loss": 1.0916, + "step": 21146 + }, + { + "epoch": 0.64, + "learning_rate": 1.5372946372040536e-06, + "loss": 0.9981, + "step": 21147 + }, + { + "epoch": 0.64, + "learning_rate": 1.5370695322912551e-06, + "loss": 1.1993, + "step": 21148 + }, + { + "epoch": 0.64, + "learning_rate": 1.5368444365450908e-06, + "loss": 1.1683, + "step": 21149 + }, + { + "epoch": 0.64, + "learning_rate": 1.5366193499677038e-06, + "loss": 0.975, + "step": 21150 + }, + { + "epoch": 0.64, + "learning_rate": 1.5363942725612375e-06, + "loss": 1.1731, + "step": 21151 + }, + { + "epoch": 0.64, + "learning_rate": 1.5361692043278323e-06, + "loss": 1.0912, + "step": 21152 + }, + { + "epoch": 0.64, + "learning_rate": 1.5359441452696321e-06, + "loss": 1.0897, + "step": 21153 + }, + { + "epoch": 0.64, + "learning_rate": 1.5357190953887795e-06, + "loss": 1.1607, + "step": 21154 + }, + { + "epoch": 0.64, + "learning_rate": 1.5354940546874176e-06, + "loss": 1.1505, + "step": 21155 + }, + { + "epoch": 0.64, + "learning_rate": 1.535269023167687e-06, + "loss": 1.1066, + "step": 21156 + }, + { + "epoch": 0.64, + "learning_rate": 1.5350440008317303e-06, + "loss": 0.9783, + "step": 21157 + }, + { + "epoch": 0.64, + "learning_rate": 1.5348189876816905e-06, + "loss": 1.0876, + "step": 21158 + }, + { + "epoch": 0.64, + "learning_rate": 1.5345939837197088e-06, + "loss": 1.1224, + "step": 21159 + }, + { + "epoch": 0.64, + "learning_rate": 1.5343689889479286e-06, + "loss": 1.1141, + "step": 21160 + }, + { + "epoch": 0.64, + "learning_rate": 1.534144003368489e-06, + "loss": 1.1471, + "step": 21161 + }, + { + "epoch": 0.64, + "learning_rate": 1.533919026983534e-06, + "loss": 1.1537, + "step": 21162 + }, + { + "epoch": 0.64, + "learning_rate": 1.5336940597952045e-06, + "loss": 1.0537, + "step": 21163 + }, + { + "epoch": 0.64, + "learning_rate": 1.5334691018056427e-06, + "loss": 1.063, + "step": 21164 + }, + { + "epoch": 0.64, + "learning_rate": 1.533244153016989e-06, + "loss": 1.0515, + "step": 21165 + }, + { + "epoch": 0.64, + "learning_rate": 1.533019213431385e-06, + "loss": 1.0581, + "step": 21166 + }, + { + "epoch": 0.64, + "learning_rate": 1.5327942830509728e-06, + "loss": 1.2468, + "step": 21167 + }, + { + "epoch": 0.64, + "learning_rate": 1.5325693618778934e-06, + "loss": 1.095, + "step": 21168 + }, + { + "epoch": 0.64, + "learning_rate": 1.5323444499142873e-06, + "loss": 1.0906, + "step": 21169 + }, + { + "epoch": 0.64, + "learning_rate": 1.532119547162296e-06, + "loss": 1.0199, + "step": 21170 + }, + { + "epoch": 0.64, + "learning_rate": 1.5318946536240603e-06, + "loss": 1.1376, + "step": 21171 + }, + { + "epoch": 0.64, + "learning_rate": 1.5316697693017216e-06, + "loss": 1.0542, + "step": 21172 + }, + { + "epoch": 0.64, + "learning_rate": 1.5314448941974214e-06, + "loss": 1.1357, + "step": 21173 + }, + { + "epoch": 0.64, + "learning_rate": 1.5312200283132977e-06, + "loss": 1.0705, + "step": 21174 + }, + { + "epoch": 0.64, + "learning_rate": 1.530995171651493e-06, + "loss": 1.1627, + "step": 21175 + }, + { + "epoch": 0.64, + "learning_rate": 1.530770324214148e-06, + "loss": 1.1562, + "step": 21176 + }, + { + "epoch": 0.64, + "learning_rate": 1.5305454860034036e-06, + "loss": 1.1921, + "step": 21177 + }, + { + "epoch": 0.64, + "learning_rate": 1.530320657021398e-06, + "loss": 1.0984, + "step": 21178 + }, + { + "epoch": 0.64, + "learning_rate": 1.530095837270273e-06, + "loss": 1.2198, + "step": 21179 + }, + { + "epoch": 0.64, + "learning_rate": 1.5298710267521683e-06, + "loss": 1.0974, + "step": 21180 + }, + { + "epoch": 0.64, + "learning_rate": 1.5296462254692245e-06, + "loss": 1.2466, + "step": 21181 + }, + { + "epoch": 0.64, + "learning_rate": 1.5294214334235813e-06, + "loss": 1.1121, + "step": 21182 + }, + { + "epoch": 0.64, + "learning_rate": 1.5291966506173784e-06, + "loss": 1.11, + "step": 21183 + }, + { + "epoch": 0.64, + "learning_rate": 1.5289718770527556e-06, + "loss": 1.1357, + "step": 21184 + }, + { + "epoch": 0.64, + "learning_rate": 1.528747112731853e-06, + "loss": 1.1635, + "step": 21185 + }, + { + "epoch": 0.64, + "learning_rate": 1.5285223576568111e-06, + "loss": 1.0782, + "step": 21186 + }, + { + "epoch": 0.64, + "learning_rate": 1.5282976118297676e-06, + "loss": 1.1296, + "step": 21187 + }, + { + "epoch": 0.64, + "learning_rate": 1.5280728752528628e-06, + "loss": 1.0533, + "step": 21188 + }, + { + "epoch": 0.64, + "learning_rate": 1.527848147928236e-06, + "loss": 1.1323, + "step": 21189 + }, + { + "epoch": 0.64, + "learning_rate": 1.5276234298580278e-06, + "loss": 1.059, + "step": 21190 + }, + { + "epoch": 0.64, + "learning_rate": 1.5273987210443753e-06, + "loss": 1.1218, + "step": 21191 + }, + { + "epoch": 0.64, + "learning_rate": 1.5271740214894182e-06, + "loss": 1.2083, + "step": 21192 + }, + { + "epoch": 0.64, + "learning_rate": 1.5269493311952962e-06, + "loss": 1.2083, + "step": 21193 + }, + { + "epoch": 0.64, + "learning_rate": 1.5267246501641484e-06, + "loss": 1.0804, + "step": 21194 + }, + { + "epoch": 0.64, + "learning_rate": 1.5264999783981127e-06, + "loss": 1.1136, + "step": 21195 + }, + { + "epoch": 0.64, + "learning_rate": 1.5262753158993282e-06, + "loss": 1.1373, + "step": 21196 + }, + { + "epoch": 0.64, + "learning_rate": 1.5260506626699339e-06, + "loss": 1.0634, + "step": 21197 + }, + { + "epoch": 0.64, + "learning_rate": 1.5258260187120686e-06, + "loss": 1.1578, + "step": 21198 + }, + { + "epoch": 0.64, + "learning_rate": 1.5256013840278706e-06, + "loss": 0.9919, + "step": 21199 + }, + { + "epoch": 0.64, + "learning_rate": 1.5253767586194773e-06, + "loss": 1.1544, + "step": 21200 + }, + { + "epoch": 0.64, + "learning_rate": 1.5251521424890282e-06, + "loss": 1.1774, + "step": 21201 + }, + { + "epoch": 0.64, + "learning_rate": 1.5249275356386608e-06, + "loss": 0.9694, + "step": 21202 + }, + { + "epoch": 0.64, + "learning_rate": 1.524702938070515e-06, + "loss": 1.0739, + "step": 21203 + }, + { + "epoch": 0.64, + "learning_rate": 1.5244783497867266e-06, + "loss": 1.0325, + "step": 21204 + }, + { + "epoch": 0.64, + "learning_rate": 1.5242537707894338e-06, + "loss": 1.1222, + "step": 21205 + }, + { + "epoch": 0.64, + "learning_rate": 1.5240292010807761e-06, + "loss": 1.1163, + "step": 21206 + }, + { + "epoch": 0.64, + "learning_rate": 1.5238046406628903e-06, + "loss": 1.1035, + "step": 21207 + }, + { + "epoch": 0.64, + "learning_rate": 1.5235800895379138e-06, + "loss": 1.0787, + "step": 21208 + }, + { + "epoch": 0.64, + "learning_rate": 1.523355547707985e-06, + "loss": 1.1546, + "step": 21209 + }, + { + "epoch": 0.64, + "learning_rate": 1.5231310151752408e-06, + "loss": 1.1053, + "step": 21210 + }, + { + "epoch": 0.64, + "learning_rate": 1.5229064919418185e-06, + "loss": 1.0997, + "step": 21211 + }, + { + "epoch": 0.64, + "learning_rate": 1.5226819780098564e-06, + "loss": 1.1917, + "step": 21212 + }, + { + "epoch": 0.64, + "learning_rate": 1.522457473381491e-06, + "loss": 1.2139, + "step": 21213 + }, + { + "epoch": 0.64, + "learning_rate": 1.5222329780588593e-06, + "loss": 1.0984, + "step": 21214 + }, + { + "epoch": 0.64, + "learning_rate": 1.5220084920440985e-06, + "loss": 1.0688, + "step": 21215 + }, + { + "epoch": 0.64, + "learning_rate": 1.5217840153393476e-06, + "loss": 1.0344, + "step": 21216 + }, + { + "epoch": 0.64, + "learning_rate": 1.5215595479467404e-06, + "loss": 1.2052, + "step": 21217 + }, + { + "epoch": 0.64, + "learning_rate": 1.5213350898684149e-06, + "loss": 1.1208, + "step": 21218 + }, + { + "epoch": 0.64, + "learning_rate": 1.521110641106508e-06, + "loss": 1.0996, + "step": 21219 + }, + { + "epoch": 0.64, + "learning_rate": 1.5208862016631575e-06, + "loss": 0.9837, + "step": 21220 + }, + { + "epoch": 0.64, + "learning_rate": 1.520661771540498e-06, + "loss": 1.1033, + "step": 21221 + }, + { + "epoch": 0.64, + "learning_rate": 1.5204373507406662e-06, + "loss": 1.0833, + "step": 21222 + }, + { + "epoch": 0.64, + "learning_rate": 1.5202129392657995e-06, + "loss": 1.1212, + "step": 21223 + }, + { + "epoch": 0.64, + "learning_rate": 1.5199885371180335e-06, + "loss": 1.2449, + "step": 21224 + }, + { + "epoch": 0.64, + "learning_rate": 1.5197641442995053e-06, + "loss": 1.0748, + "step": 21225 + }, + { + "epoch": 0.64, + "learning_rate": 1.5195397608123497e-06, + "loss": 1.1514, + "step": 21226 + }, + { + "epoch": 0.64, + "learning_rate": 1.5193153866587036e-06, + "loss": 1.0645, + "step": 21227 + }, + { + "epoch": 0.64, + "learning_rate": 1.5190910218407024e-06, + "loss": 1.1279, + "step": 21228 + }, + { + "epoch": 0.64, + "learning_rate": 1.5188666663604834e-06, + "loss": 1.1682, + "step": 21229 + }, + { + "epoch": 0.64, + "learning_rate": 1.5186423202201804e-06, + "loss": 1.1234, + "step": 21230 + }, + { + "epoch": 0.64, + "learning_rate": 1.5184179834219298e-06, + "loss": 1.0197, + "step": 21231 + }, + { + "epoch": 0.64, + "learning_rate": 1.518193655967867e-06, + "loss": 1.0831, + "step": 21232 + }, + { + "epoch": 0.64, + "learning_rate": 1.517969337860129e-06, + "loss": 1.1075, + "step": 21233 + }, + { + "epoch": 0.64, + "learning_rate": 1.5177450291008489e-06, + "loss": 1.0753, + "step": 21234 + }, + { + "epoch": 0.64, + "learning_rate": 1.517520729692163e-06, + "loss": 1.1028, + "step": 21235 + }, + { + "epoch": 0.64, + "learning_rate": 1.5172964396362064e-06, + "loss": 1.1035, + "step": 21236 + }, + { + "epoch": 0.64, + "learning_rate": 1.5170721589351145e-06, + "loss": 1.1998, + "step": 21237 + }, + { + "epoch": 0.64, + "learning_rate": 1.5168478875910232e-06, + "loss": 1.0592, + "step": 21238 + }, + { + "epoch": 0.64, + "learning_rate": 1.5166236256060655e-06, + "loss": 1.0862, + "step": 21239 + }, + { + "epoch": 0.64, + "learning_rate": 1.5163993729823772e-06, + "loss": 1.1028, + "step": 21240 + }, + { + "epoch": 0.64, + "learning_rate": 1.5161751297220933e-06, + "loss": 1.1788, + "step": 21241 + }, + { + "epoch": 0.64, + "learning_rate": 1.5159508958273494e-06, + "loss": 1.0892, + "step": 21242 + }, + { + "epoch": 0.64, + "learning_rate": 1.5157266713002783e-06, + "loss": 1.1074, + "step": 21243 + }, + { + "epoch": 0.64, + "learning_rate": 1.515502456143015e-06, + "loss": 1.0554, + "step": 21244 + }, + { + "epoch": 0.64, + "learning_rate": 1.515278250357694e-06, + "loss": 1.2158, + "step": 21245 + }, + { + "epoch": 0.64, + "learning_rate": 1.5150540539464509e-06, + "loss": 1.1207, + "step": 21246 + }, + { + "epoch": 0.64, + "learning_rate": 1.514829866911418e-06, + "loss": 1.121, + "step": 21247 + }, + { + "epoch": 0.64, + "learning_rate": 1.51460568925473e-06, + "loss": 1.1808, + "step": 21248 + }, + { + "epoch": 0.64, + "learning_rate": 1.5143815209785214e-06, + "loss": 1.1337, + "step": 21249 + }, + { + "epoch": 0.64, + "learning_rate": 1.5141573620849262e-06, + "loss": 1.1037, + "step": 21250 + }, + { + "epoch": 0.64, + "learning_rate": 1.5139332125760786e-06, + "loss": 1.127, + "step": 21251 + }, + { + "epoch": 0.64, + "learning_rate": 1.5137090724541112e-06, + "loss": 1.1252, + "step": 21252 + }, + { + "epoch": 0.64, + "learning_rate": 1.5134849417211582e-06, + "loss": 1.1407, + "step": 21253 + }, + { + "epoch": 0.64, + "learning_rate": 1.5132608203793542e-06, + "loss": 1.0346, + "step": 21254 + }, + { + "epoch": 0.64, + "learning_rate": 1.5130367084308322e-06, + "loss": 1.2255, + "step": 21255 + }, + { + "epoch": 0.64, + "learning_rate": 1.5128126058777248e-06, + "loss": 1.2271, + "step": 21256 + }, + { + "epoch": 0.64, + "learning_rate": 1.5125885127221656e-06, + "loss": 1.1154, + "step": 21257 + }, + { + "epoch": 0.64, + "learning_rate": 1.5123644289662887e-06, + "loss": 1.0679, + "step": 21258 + }, + { + "epoch": 0.64, + "learning_rate": 1.5121403546122277e-06, + "loss": 1.112, + "step": 21259 + }, + { + "epoch": 0.64, + "learning_rate": 1.5119162896621134e-06, + "loss": 1.0707, + "step": 21260 + }, + { + "epoch": 0.64, + "learning_rate": 1.5116922341180803e-06, + "loss": 1.0802, + "step": 21261 + }, + { + "epoch": 0.64, + "learning_rate": 1.5114681879822613e-06, + "loss": 1.1715, + "step": 21262 + }, + { + "epoch": 0.64, + "learning_rate": 1.5112441512567888e-06, + "loss": 1.0406, + "step": 21263 + }, + { + "epoch": 0.64, + "learning_rate": 1.5110201239437966e-06, + "loss": 1.0899, + "step": 21264 + }, + { + "epoch": 0.64, + "learning_rate": 1.5107961060454156e-06, + "loss": 1.0637, + "step": 21265 + }, + { + "epoch": 0.64, + "learning_rate": 1.5105720975637795e-06, + "loss": 1.161, + "step": 21266 + }, + { + "epoch": 0.64, + "learning_rate": 1.5103480985010206e-06, + "loss": 1.0092, + "step": 21267 + }, + { + "epoch": 0.64, + "learning_rate": 1.5101241088592719e-06, + "loss": 1.1269, + "step": 21268 + }, + { + "epoch": 0.64, + "learning_rate": 1.509900128640664e-06, + "loss": 1.2189, + "step": 21269 + }, + { + "epoch": 0.64, + "learning_rate": 1.5096761578473302e-06, + "loss": 1.1653, + "step": 21270 + }, + { + "epoch": 0.64, + "learning_rate": 1.5094521964814024e-06, + "loss": 1.077, + "step": 21271 + }, + { + "epoch": 0.64, + "learning_rate": 1.5092282445450135e-06, + "loss": 1.0401, + "step": 21272 + }, + { + "epoch": 0.64, + "learning_rate": 1.5090043020402936e-06, + "loss": 1.1394, + "step": 21273 + }, + { + "epoch": 0.64, + "learning_rate": 1.5087803689693752e-06, + "loss": 1.2209, + "step": 21274 + }, + { + "epoch": 0.64, + "learning_rate": 1.508556445334391e-06, + "loss": 1.1524, + "step": 21275 + }, + { + "epoch": 0.64, + "learning_rate": 1.5083325311374713e-06, + "loss": 1.0193, + "step": 21276 + }, + { + "epoch": 0.64, + "learning_rate": 1.5081086263807491e-06, + "loss": 0.9824, + "step": 21277 + }, + { + "epoch": 0.64, + "learning_rate": 1.5078847310663544e-06, + "loss": 1.0951, + "step": 21278 + }, + { + "epoch": 0.64, + "learning_rate": 1.5076608451964192e-06, + "loss": 1.0339, + "step": 21279 + }, + { + "epoch": 0.64, + "learning_rate": 1.5074369687730756e-06, + "loss": 1.2064, + "step": 21280 + }, + { + "epoch": 0.64, + "learning_rate": 1.5072131017984536e-06, + "loss": 0.9741, + "step": 21281 + }, + { + "epoch": 0.64, + "learning_rate": 1.5069892442746848e-06, + "loss": 1.0078, + "step": 21282 + }, + { + "epoch": 0.64, + "learning_rate": 1.5067653962038996e-06, + "loss": 1.0571, + "step": 21283 + }, + { + "epoch": 0.64, + "learning_rate": 1.5065415575882296e-06, + "loss": 1.033, + "step": 21284 + }, + { + "epoch": 0.64, + "learning_rate": 1.506317728429807e-06, + "loss": 1.0651, + "step": 21285 + }, + { + "epoch": 0.64, + "learning_rate": 1.5060939087307597e-06, + "loss": 1.1271, + "step": 21286 + }, + { + "epoch": 0.64, + "learning_rate": 1.5058700984932195e-06, + "loss": 1.1812, + "step": 21287 + }, + { + "epoch": 0.64, + "learning_rate": 1.5056462977193177e-06, + "loss": 1.1525, + "step": 21288 + }, + { + "epoch": 0.64, + "learning_rate": 1.5054225064111836e-06, + "loss": 1.0059, + "step": 21289 + }, + { + "epoch": 0.64, + "learning_rate": 1.505198724570949e-06, + "loss": 1.1198, + "step": 21290 + }, + { + "epoch": 0.64, + "learning_rate": 1.5049749522007434e-06, + "loss": 1.0197, + "step": 21291 + }, + { + "epoch": 0.64, + "learning_rate": 1.5047511893026968e-06, + "loss": 1.1312, + "step": 21292 + }, + { + "epoch": 0.64, + "learning_rate": 1.504527435878939e-06, + "loss": 1.0737, + "step": 21293 + }, + { + "epoch": 0.64, + "learning_rate": 1.5043036919316017e-06, + "loss": 1.0464, + "step": 21294 + }, + { + "epoch": 0.64, + "learning_rate": 1.5040799574628128e-06, + "loss": 1.1161, + "step": 21295 + }, + { + "epoch": 0.64, + "learning_rate": 1.503856232474703e-06, + "loss": 1.0585, + "step": 21296 + }, + { + "epoch": 0.64, + "learning_rate": 1.5036325169694026e-06, + "loss": 0.9945, + "step": 21297 + }, + { + "epoch": 0.64, + "learning_rate": 1.5034088109490414e-06, + "loss": 1.0881, + "step": 21298 + }, + { + "epoch": 0.64, + "learning_rate": 1.5031851144157471e-06, + "loss": 1.2097, + "step": 21299 + }, + { + "epoch": 0.64, + "learning_rate": 1.502961427371651e-06, + "loss": 1.1066, + "step": 21300 + }, + { + "epoch": 0.64, + "learning_rate": 1.5027377498188817e-06, + "loss": 1.0789, + "step": 21301 + }, + { + "epoch": 0.64, + "learning_rate": 1.5025140817595685e-06, + "loss": 1.0663, + "step": 21302 + }, + { + "epoch": 0.64, + "learning_rate": 1.5022904231958422e-06, + "loss": 1.1302, + "step": 21303 + }, + { + "epoch": 0.64, + "learning_rate": 1.5020667741298296e-06, + "loss": 1.1262, + "step": 21304 + }, + { + "epoch": 0.64, + "learning_rate": 1.5018431345636603e-06, + "loss": 1.1552, + "step": 21305 + }, + { + "epoch": 0.64, + "learning_rate": 1.5016195044994635e-06, + "loss": 1.1861, + "step": 21306 + }, + { + "epoch": 0.64, + "learning_rate": 1.5013958839393692e-06, + "loss": 1.0374, + "step": 21307 + }, + { + "epoch": 0.64, + "learning_rate": 1.5011722728855045e-06, + "loss": 1.048, + "step": 21308 + }, + { + "epoch": 0.64, + "learning_rate": 1.5009486713399983e-06, + "loss": 1.0649, + "step": 21309 + }, + { + "epoch": 0.64, + "learning_rate": 1.5007250793049798e-06, + "loss": 0.9479, + "step": 21310 + }, + { + "epoch": 0.64, + "learning_rate": 1.5005014967825788e-06, + "loss": 1.0634, + "step": 21311 + }, + { + "epoch": 0.64, + "learning_rate": 1.5002779237749205e-06, + "loss": 1.1839, + "step": 21312 + }, + { + "epoch": 0.64, + "learning_rate": 1.5000543602841352e-06, + "loss": 1.2231, + "step": 21313 + }, + { + "epoch": 0.64, + "learning_rate": 1.4998308063123508e-06, + "loss": 1.2217, + "step": 21314 + }, + { + "epoch": 0.64, + "learning_rate": 1.4996072618616953e-06, + "loss": 1.0834, + "step": 21315 + }, + { + "epoch": 0.64, + "learning_rate": 1.4993837269342981e-06, + "loss": 1.0896, + "step": 21316 + }, + { + "epoch": 0.64, + "learning_rate": 1.4991602015322847e-06, + "loss": 1.1339, + "step": 21317 + }, + { + "epoch": 0.64, + "learning_rate": 1.4989366856577841e-06, + "loss": 1.1196, + "step": 21318 + }, + { + "epoch": 0.64, + "learning_rate": 1.4987131793129245e-06, + "loss": 1.1169, + "step": 21319 + }, + { + "epoch": 0.64, + "learning_rate": 1.4984896824998333e-06, + "loss": 1.0856, + "step": 21320 + }, + { + "epoch": 0.64, + "learning_rate": 1.4982661952206373e-06, + "loss": 1.14, + "step": 21321 + }, + { + "epoch": 0.64, + "learning_rate": 1.4980427174774654e-06, + "loss": 1.0959, + "step": 21322 + }, + { + "epoch": 0.64, + "learning_rate": 1.4978192492724436e-06, + "loss": 1.2128, + "step": 21323 + }, + { + "epoch": 0.64, + "learning_rate": 1.497595790607701e-06, + "loss": 1.1446, + "step": 21324 + }, + { + "epoch": 0.64, + "learning_rate": 1.497372341485363e-06, + "loss": 1.2662, + "step": 21325 + }, + { + "epoch": 0.64, + "learning_rate": 1.4971489019075571e-06, + "loss": 1.0538, + "step": 21326 + }, + { + "epoch": 0.64, + "learning_rate": 1.496925471876411e-06, + "loss": 1.1836, + "step": 21327 + }, + { + "epoch": 0.64, + "learning_rate": 1.4967020513940521e-06, + "loss": 1.092, + "step": 21328 + }, + { + "epoch": 0.64, + "learning_rate": 1.4964786404626054e-06, + "loss": 1.0677, + "step": 21329 + }, + { + "epoch": 0.64, + "learning_rate": 1.4962552390841988e-06, + "loss": 1.0384, + "step": 21330 + }, + { + "epoch": 0.64, + "learning_rate": 1.496031847260959e-06, + "loss": 1.0594, + "step": 21331 + }, + { + "epoch": 0.64, + "learning_rate": 1.4958084649950123e-06, + "loss": 1.0198, + "step": 21332 + }, + { + "epoch": 0.64, + "learning_rate": 1.495585092288486e-06, + "loss": 1.0557, + "step": 21333 + }, + { + "epoch": 0.64, + "learning_rate": 1.4953617291435053e-06, + "loss": 1.0399, + "step": 21334 + }, + { + "epoch": 0.64, + "learning_rate": 1.4951383755621972e-06, + "loss": 1.1156, + "step": 21335 + }, + { + "epoch": 0.64, + "learning_rate": 1.4949150315466876e-06, + "loss": 1.082, + "step": 21336 + }, + { + "epoch": 0.64, + "learning_rate": 1.4946916970991042e-06, + "loss": 1.2517, + "step": 21337 + }, + { + "epoch": 0.64, + "learning_rate": 1.4944683722215704e-06, + "loss": 1.1732, + "step": 21338 + }, + { + "epoch": 0.64, + "learning_rate": 1.4942450569162137e-06, + "loss": 1.1021, + "step": 21339 + }, + { + "epoch": 0.64, + "learning_rate": 1.4940217511851593e-06, + "loss": 1.1363, + "step": 21340 + }, + { + "epoch": 0.64, + "learning_rate": 1.4937984550305345e-06, + "loss": 1.0841, + "step": 21341 + }, + { + "epoch": 0.64, + "learning_rate": 1.4935751684544627e-06, + "loss": 1.0851, + "step": 21342 + }, + { + "epoch": 0.64, + "learning_rate": 1.4933518914590705e-06, + "loss": 1.1407, + "step": 21343 + }, + { + "epoch": 0.64, + "learning_rate": 1.4931286240464837e-06, + "loss": 1.0909, + "step": 21344 + }, + { + "epoch": 0.64, + "learning_rate": 1.4929053662188275e-06, + "loss": 1.0966, + "step": 21345 + }, + { + "epoch": 0.64, + "learning_rate": 1.4926821179782277e-06, + "loss": 1.0615, + "step": 21346 + }, + { + "epoch": 0.64, + "learning_rate": 1.4924588793268085e-06, + "loss": 1.1802, + "step": 21347 + }, + { + "epoch": 0.64, + "learning_rate": 1.4922356502666951e-06, + "loss": 1.1042, + "step": 21348 + }, + { + "epoch": 0.64, + "learning_rate": 1.4920124308000134e-06, + "loss": 1.1071, + "step": 21349 + }, + { + "epoch": 0.64, + "learning_rate": 1.4917892209288886e-06, + "loss": 1.1094, + "step": 21350 + }, + { + "epoch": 0.64, + "learning_rate": 1.4915660206554445e-06, + "loss": 0.9904, + "step": 21351 + }, + { + "epoch": 0.64, + "learning_rate": 1.4913428299818055e-06, + "loss": 1.0706, + "step": 21352 + }, + { + "epoch": 0.64, + "learning_rate": 1.491119648910097e-06, + "loss": 1.0936, + "step": 21353 + }, + { + "epoch": 0.64, + "learning_rate": 1.490896477442445e-06, + "loss": 1.1257, + "step": 21354 + }, + { + "epoch": 0.64, + "learning_rate": 1.490673315580971e-06, + "loss": 1.1486, + "step": 21355 + }, + { + "epoch": 0.64, + "learning_rate": 1.4904501633278012e-06, + "loss": 1.0543, + "step": 21356 + }, + { + "epoch": 0.64, + "learning_rate": 1.49022702068506e-06, + "loss": 1.0978, + "step": 21357 + }, + { + "epoch": 0.64, + "learning_rate": 1.4900038876548705e-06, + "loss": 1.1072, + "step": 21358 + }, + { + "epoch": 0.64, + "learning_rate": 1.4897807642393586e-06, + "loss": 1.1077, + "step": 21359 + }, + { + "epoch": 0.64, + "learning_rate": 1.4895576504406467e-06, + "loss": 1.157, + "step": 21360 + }, + { + "epoch": 0.64, + "learning_rate": 1.489334546260859e-06, + "loss": 1.1368, + "step": 21361 + }, + { + "epoch": 0.64, + "learning_rate": 1.4891114517021204e-06, + "loss": 1.0826, + "step": 21362 + }, + { + "epoch": 0.64, + "learning_rate": 1.488888366766554e-06, + "loss": 1.0284, + "step": 21363 + }, + { + "epoch": 0.64, + "learning_rate": 1.4886652914562827e-06, + "loss": 1.0977, + "step": 21364 + }, + { + "epoch": 0.64, + "learning_rate": 1.488442225773431e-06, + "loss": 1.0344, + "step": 21365 + }, + { + "epoch": 0.64, + "learning_rate": 1.488219169720122e-06, + "loss": 1.114, + "step": 21366 + }, + { + "epoch": 0.64, + "learning_rate": 1.4879961232984802e-06, + "loss": 1.0761, + "step": 21367 + }, + { + "epoch": 0.64, + "learning_rate": 1.4877730865106268e-06, + "loss": 1.1209, + "step": 21368 + }, + { + "epoch": 0.64, + "learning_rate": 1.4875500593586862e-06, + "loss": 1.1647, + "step": 21369 + }, + { + "epoch": 0.64, + "learning_rate": 1.4873270418447816e-06, + "loss": 1.0681, + "step": 21370 + }, + { + "epoch": 0.64, + "learning_rate": 1.4871040339710359e-06, + "loss": 0.9935, + "step": 21371 + }, + { + "epoch": 0.64, + "learning_rate": 1.4868810357395718e-06, + "loss": 1.1297, + "step": 21372 + }, + { + "epoch": 0.64, + "learning_rate": 1.4866580471525128e-06, + "loss": 0.9979, + "step": 21373 + }, + { + "epoch": 0.64, + "learning_rate": 1.4864350682119808e-06, + "loss": 1.1487, + "step": 21374 + }, + { + "epoch": 0.64, + "learning_rate": 1.4862120989200983e-06, + "loss": 1.1191, + "step": 21375 + }, + { + "epoch": 0.64, + "learning_rate": 1.4859891392789893e-06, + "loss": 1.2183, + "step": 21376 + }, + { + "epoch": 0.64, + "learning_rate": 1.4857661892907749e-06, + "loss": 1.115, + "step": 21377 + }, + { + "epoch": 0.64, + "learning_rate": 1.4855432489575777e-06, + "loss": 1.1096, + "step": 21378 + }, + { + "epoch": 0.64, + "learning_rate": 1.48532031828152e-06, + "loss": 1.1132, + "step": 21379 + }, + { + "epoch": 0.64, + "learning_rate": 1.4850973972647253e-06, + "loss": 1.1098, + "step": 21380 + }, + { + "epoch": 0.64, + "learning_rate": 1.4848744859093138e-06, + "loss": 1.1718, + "step": 21381 + }, + { + "epoch": 0.64, + "learning_rate": 1.484651584217408e-06, + "loss": 1.1835, + "step": 21382 + }, + { + "epoch": 0.64, + "learning_rate": 1.4844286921911305e-06, + "loss": 1.1038, + "step": 21383 + }, + { + "epoch": 0.64, + "learning_rate": 1.4842058098326024e-06, + "loss": 1.0993, + "step": 21384 + }, + { + "epoch": 0.64, + "learning_rate": 1.4839829371439468e-06, + "loss": 1.0686, + "step": 21385 + }, + { + "epoch": 0.64, + "learning_rate": 1.4837600741272833e-06, + "loss": 1.1786, + "step": 21386 + }, + { + "epoch": 0.64, + "learning_rate": 1.4835372207847345e-06, + "loss": 1.1177, + "step": 21387 + }, + { + "epoch": 0.64, + "learning_rate": 1.483314377118422e-06, + "loss": 1.0613, + "step": 21388 + }, + { + "epoch": 0.64, + "learning_rate": 1.4830915431304672e-06, + "loss": 1.1493, + "step": 21389 + }, + { + "epoch": 0.64, + "learning_rate": 1.4828687188229906e-06, + "loss": 1.0127, + "step": 21390 + }, + { + "epoch": 0.64, + "learning_rate": 1.4826459041981145e-06, + "loss": 1.1812, + "step": 21391 + }, + { + "epoch": 0.64, + "learning_rate": 1.4824230992579588e-06, + "loss": 1.1669, + "step": 21392 + }, + { + "epoch": 0.64, + "learning_rate": 1.4822003040046462e-06, + "loss": 1.1923, + "step": 21393 + }, + { + "epoch": 0.64, + "learning_rate": 1.4819775184402957e-06, + "loss": 1.0456, + "step": 21394 + }, + { + "epoch": 0.64, + "learning_rate": 1.481754742567029e-06, + "loss": 1.2462, + "step": 21395 + }, + { + "epoch": 0.64, + "learning_rate": 1.4815319763869664e-06, + "loss": 1.082, + "step": 21396 + }, + { + "epoch": 0.64, + "learning_rate": 1.4813092199022294e-06, + "loss": 1.0818, + "step": 21397 + }, + { + "epoch": 0.64, + "learning_rate": 1.4810864731149386e-06, + "loss": 1.2225, + "step": 21398 + }, + { + "epoch": 0.64, + "learning_rate": 1.4808637360272129e-06, + "loss": 1.1054, + "step": 21399 + }, + { + "epoch": 0.64, + "learning_rate": 1.4806410086411738e-06, + "loss": 1.2247, + "step": 21400 + }, + { + "epoch": 0.64, + "learning_rate": 1.480418290958941e-06, + "loss": 1.1304, + "step": 21401 + }, + { + "epoch": 0.64, + "learning_rate": 1.4801955829826358e-06, + "loss": 1.1899, + "step": 21402 + }, + { + "epoch": 0.64, + "learning_rate": 1.479972884714377e-06, + "loss": 1.0921, + "step": 21403 + }, + { + "epoch": 0.64, + "learning_rate": 1.479750196156285e-06, + "loss": 1.0861, + "step": 21404 + }, + { + "epoch": 0.64, + "learning_rate": 1.4795275173104795e-06, + "loss": 1.2115, + "step": 21405 + }, + { + "epoch": 0.64, + "learning_rate": 1.479304848179082e-06, + "loss": 1.2563, + "step": 21406 + }, + { + "epoch": 0.64, + "learning_rate": 1.4790821887642096e-06, + "loss": 1.0446, + "step": 21407 + }, + { + "epoch": 0.64, + "learning_rate": 1.478859539067983e-06, + "loss": 1.1635, + "step": 21408 + }, + { + "epoch": 0.64, + "learning_rate": 1.4786368990925219e-06, + "loss": 1.0587, + "step": 21409 + }, + { + "epoch": 0.64, + "learning_rate": 1.4784142688399456e-06, + "loss": 1.0146, + "step": 21410 + }, + { + "epoch": 0.65, + "learning_rate": 1.4781916483123742e-06, + "loss": 1.1034, + "step": 21411 + }, + { + "epoch": 0.65, + "learning_rate": 1.4779690375119254e-06, + "loss": 1.2753, + "step": 21412 + }, + { + "epoch": 0.65, + "learning_rate": 1.4777464364407192e-06, + "loss": 1.0294, + "step": 21413 + }, + { + "epoch": 0.65, + "learning_rate": 1.4775238451008745e-06, + "loss": 1.0788, + "step": 21414 + }, + { + "epoch": 0.65, + "learning_rate": 1.477301263494511e-06, + "loss": 1.222, + "step": 21415 + }, + { + "epoch": 0.65, + "learning_rate": 1.4770786916237463e-06, + "loss": 1.1208, + "step": 21416 + }, + { + "epoch": 0.65, + "learning_rate": 1.4768561294906997e-06, + "loss": 1.2162, + "step": 21417 + }, + { + "epoch": 0.65, + "learning_rate": 1.4766335770974902e-06, + "loss": 1.1058, + "step": 21418 + }, + { + "epoch": 0.65, + "learning_rate": 1.4764110344462368e-06, + "loss": 1.2372, + "step": 21419 + }, + { + "epoch": 0.65, + "learning_rate": 1.4761885015390571e-06, + "loss": 1.09, + "step": 21420 + }, + { + "epoch": 0.65, + "learning_rate": 1.4759659783780689e-06, + "loss": 1.0753, + "step": 21421 + }, + { + "epoch": 0.65, + "learning_rate": 1.4757434649653918e-06, + "loss": 1.0963, + "step": 21422 + }, + { + "epoch": 0.65, + "learning_rate": 1.4755209613031438e-06, + "loss": 1.0663, + "step": 21423 + }, + { + "epoch": 0.65, + "learning_rate": 1.4752984673934438e-06, + "loss": 1.1446, + "step": 21424 + }, + { + "epoch": 0.65, + "learning_rate": 1.4750759832384077e-06, + "loss": 1.0482, + "step": 21425 + }, + { + "epoch": 0.65, + "learning_rate": 1.4748535088401544e-06, + "loss": 1.0969, + "step": 21426 + }, + { + "epoch": 0.65, + "learning_rate": 1.474631044200802e-06, + "loss": 1.0958, + "step": 21427 + }, + { + "epoch": 0.65, + "learning_rate": 1.4744085893224694e-06, + "loss": 1.0448, + "step": 21428 + }, + { + "epoch": 0.65, + "learning_rate": 1.4741861442072719e-06, + "loss": 1.2139, + "step": 21429 + }, + { + "epoch": 0.65, + "learning_rate": 1.4739637088573287e-06, + "loss": 1.2521, + "step": 21430 + }, + { + "epoch": 0.65, + "learning_rate": 1.4737412832747566e-06, + "loss": 1.1701, + "step": 21431 + }, + { + "epoch": 0.65, + "learning_rate": 1.4735188674616741e-06, + "loss": 1.1063, + "step": 21432 + }, + { + "epoch": 0.65, + "learning_rate": 1.4732964614201969e-06, + "loss": 1.1387, + "step": 21433 + }, + { + "epoch": 0.65, + "learning_rate": 1.4730740651524428e-06, + "loss": 1.0665, + "step": 21434 + }, + { + "epoch": 0.65, + "learning_rate": 1.472851678660529e-06, + "loss": 0.9996, + "step": 21435 + }, + { + "epoch": 0.65, + "learning_rate": 1.4726293019465726e-06, + "loss": 1.1509, + "step": 21436 + }, + { + "epoch": 0.65, + "learning_rate": 1.4724069350126912e-06, + "loss": 1.3235, + "step": 21437 + }, + { + "epoch": 0.65, + "learning_rate": 1.472184577861e-06, + "loss": 1.2469, + "step": 21438 + }, + { + "epoch": 0.65, + "learning_rate": 1.4719622304936168e-06, + "loss": 1.0642, + "step": 21439 + }, + { + "epoch": 0.65, + "learning_rate": 1.471739892912658e-06, + "loss": 1.1248, + "step": 21440 + }, + { + "epoch": 0.65, + "learning_rate": 1.4715175651202404e-06, + "loss": 1.1527, + "step": 21441 + }, + { + "epoch": 0.65, + "learning_rate": 1.47129524711848e-06, + "loss": 1.0427, + "step": 21442 + }, + { + "epoch": 0.65, + "learning_rate": 1.4710729389094932e-06, + "loss": 1.1852, + "step": 21443 + }, + { + "epoch": 0.65, + "learning_rate": 1.4708506404953968e-06, + "loss": 1.1135, + "step": 21444 + }, + { + "epoch": 0.65, + "learning_rate": 1.4706283518783073e-06, + "loss": 1.1337, + "step": 21445 + }, + { + "epoch": 0.65, + "learning_rate": 1.4704060730603393e-06, + "loss": 1.123, + "step": 21446 + }, + { + "epoch": 0.65, + "learning_rate": 1.4701838040436095e-06, + "loss": 1.1781, + "step": 21447 + }, + { + "epoch": 0.65, + "learning_rate": 1.469961544830234e-06, + "loss": 1.2107, + "step": 21448 + }, + { + "epoch": 0.65, + "learning_rate": 1.469739295422329e-06, + "loss": 1.0204, + "step": 21449 + }, + { + "epoch": 0.65, + "learning_rate": 1.4695170558220101e-06, + "loss": 1.1013, + "step": 21450 + }, + { + "epoch": 0.65, + "learning_rate": 1.4692948260313916e-06, + "loss": 1.1091, + "step": 21451 + }, + { + "epoch": 0.65, + "learning_rate": 1.4690726060525901e-06, + "loss": 1.1129, + "step": 21452 + }, + { + "epoch": 0.65, + "learning_rate": 1.4688503958877206e-06, + "loss": 1.1083, + "step": 21453 + }, + { + "epoch": 0.65, + "learning_rate": 1.4686281955388992e-06, + "loss": 1.0267, + "step": 21454 + }, + { + "epoch": 0.65, + "learning_rate": 1.4684060050082404e-06, + "loss": 1.0926, + "step": 21455 + }, + { + "epoch": 0.65, + "learning_rate": 1.4681838242978602e-06, + "loss": 1.106, + "step": 21456 + }, + { + "epoch": 0.65, + "learning_rate": 1.4679616534098723e-06, + "loss": 1.1421, + "step": 21457 + }, + { + "epoch": 0.65, + "learning_rate": 1.4677394923463933e-06, + "loss": 1.1133, + "step": 21458 + }, + { + "epoch": 0.65, + "learning_rate": 1.4675173411095362e-06, + "loss": 1.0513, + "step": 21459 + }, + { + "epoch": 0.65, + "learning_rate": 1.467295199701417e-06, + "loss": 1.0532, + "step": 21460 + }, + { + "epoch": 0.65, + "learning_rate": 1.46707306812415e-06, + "loss": 1.1122, + "step": 21461 + }, + { + "epoch": 0.65, + "learning_rate": 1.4668509463798503e-06, + "loss": 1.007, + "step": 21462 + }, + { + "epoch": 0.65, + "learning_rate": 1.4666288344706325e-06, + "loss": 1.2643, + "step": 21463 + }, + { + "epoch": 0.65, + "learning_rate": 1.4664067323986098e-06, + "loss": 1.1678, + "step": 21464 + }, + { + "epoch": 0.65, + "learning_rate": 1.4661846401658971e-06, + "loss": 1.192, + "step": 21465 + }, + { + "epoch": 0.65, + "learning_rate": 1.465962557774609e-06, + "loss": 1.0474, + "step": 21466 + }, + { + "epoch": 0.65, + "learning_rate": 1.4657404852268598e-06, + "loss": 1.1129, + "step": 21467 + }, + { + "epoch": 0.65, + "learning_rate": 1.4655184225247626e-06, + "loss": 1.1525, + "step": 21468 + }, + { + "epoch": 0.65, + "learning_rate": 1.4652963696704315e-06, + "loss": 1.0814, + "step": 21469 + }, + { + "epoch": 0.65, + "learning_rate": 1.4650743266659805e-06, + "loss": 1.087, + "step": 21470 + }, + { + "epoch": 0.65, + "learning_rate": 1.4648522935135243e-06, + "loss": 1.0626, + "step": 21471 + }, + { + "epoch": 0.65, + "learning_rate": 1.464630270215175e-06, + "loss": 1.1314, + "step": 21472 + }, + { + "epoch": 0.65, + "learning_rate": 1.464408256773047e-06, + "loss": 1.0504, + "step": 21473 + }, + { + "epoch": 0.65, + "learning_rate": 1.4641862531892537e-06, + "loss": 1.1072, + "step": 21474 + }, + { + "epoch": 0.65, + "learning_rate": 1.463964259465908e-06, + "loss": 1.0901, + "step": 21475 + }, + { + "epoch": 0.65, + "learning_rate": 1.463742275605125e-06, + "loss": 1.0791, + "step": 21476 + }, + { + "epoch": 0.65, + "learning_rate": 1.4635203016090155e-06, + "loss": 0.9982, + "step": 21477 + }, + { + "epoch": 0.65, + "learning_rate": 1.4632983374796932e-06, + "loss": 0.9771, + "step": 21478 + }, + { + "epoch": 0.65, + "learning_rate": 1.4630763832192718e-06, + "loss": 1.1057, + "step": 21479 + }, + { + "epoch": 0.65, + "learning_rate": 1.4628544388298643e-06, + "loss": 1.1419, + "step": 21480 + }, + { + "epoch": 0.65, + "learning_rate": 1.4626325043135825e-06, + "loss": 1.1848, + "step": 21481 + }, + { + "epoch": 0.65, + "learning_rate": 1.4624105796725396e-06, + "loss": 1.058, + "step": 21482 + }, + { + "epoch": 0.65, + "learning_rate": 1.4621886649088483e-06, + "loss": 1.079, + "step": 21483 + }, + { + "epoch": 0.65, + "learning_rate": 1.4619667600246212e-06, + "loss": 0.9909, + "step": 21484 + }, + { + "epoch": 0.65, + "learning_rate": 1.4617448650219707e-06, + "loss": 1.0281, + "step": 21485 + }, + { + "epoch": 0.65, + "learning_rate": 1.4615229799030084e-06, + "loss": 1.126, + "step": 21486 + }, + { + "epoch": 0.65, + "learning_rate": 1.4613011046698477e-06, + "loss": 1.1345, + "step": 21487 + }, + { + "epoch": 0.65, + "learning_rate": 1.4610792393245998e-06, + "loss": 1.1058, + "step": 21488 + }, + { + "epoch": 0.65, + "learning_rate": 1.4608573838693785e-06, + "loss": 1.075, + "step": 21489 + }, + { + "epoch": 0.65, + "learning_rate": 1.4606355383062937e-06, + "loss": 1.1663, + "step": 21490 + }, + { + "epoch": 0.65, + "learning_rate": 1.4604137026374577e-06, + "loss": 1.1411, + "step": 21491 + }, + { + "epoch": 0.65, + "learning_rate": 1.4601918768649822e-06, + "loss": 1.2051, + "step": 21492 + }, + { + "epoch": 0.65, + "learning_rate": 1.4599700609909805e-06, + "loss": 1.3143, + "step": 21493 + }, + { + "epoch": 0.65, + "learning_rate": 1.4597482550175624e-06, + "loss": 1.1724, + "step": 21494 + }, + { + "epoch": 0.65, + "learning_rate": 1.4595264589468388e-06, + "loss": 1.0911, + "step": 21495 + }, + { + "epoch": 0.65, + "learning_rate": 1.4593046727809228e-06, + "loss": 1.012, + "step": 21496 + }, + { + "epoch": 0.65, + "learning_rate": 1.4590828965219262e-06, + "loss": 1.0066, + "step": 21497 + }, + { + "epoch": 0.65, + "learning_rate": 1.458861130171958e-06, + "loss": 1.0403, + "step": 21498 + }, + { + "epoch": 0.65, + "learning_rate": 1.4586393737331306e-06, + "loss": 1.1226, + "step": 21499 + }, + { + "epoch": 0.65, + "learning_rate": 1.4584176272075548e-06, + "loss": 1.0718, + "step": 21500 + }, + { + "epoch": 0.65, + "learning_rate": 1.4581958905973414e-06, + "loss": 1.1051, + "step": 21501 + }, + { + "epoch": 0.65, + "learning_rate": 1.4579741639046024e-06, + "loss": 1.1608, + "step": 21502 + }, + { + "epoch": 0.65, + "learning_rate": 1.4577524471314468e-06, + "loss": 1.1067, + "step": 21503 + }, + { + "epoch": 0.65, + "learning_rate": 1.4575307402799854e-06, + "loss": 1.1649, + "step": 21504 + }, + { + "epoch": 0.65, + "learning_rate": 1.4573090433523298e-06, + "loss": 1.1926, + "step": 21505 + }, + { + "epoch": 0.65, + "learning_rate": 1.4570873563505908e-06, + "loss": 1.1713, + "step": 21506 + }, + { + "epoch": 0.65, + "learning_rate": 1.4568656792768767e-06, + "loss": 1.0722, + "step": 21507 + }, + { + "epoch": 0.65, + "learning_rate": 1.4566440121332992e-06, + "loss": 1.1777, + "step": 21508 + }, + { + "epoch": 0.65, + "learning_rate": 1.456422354921968e-06, + "loss": 1.134, + "step": 21509 + }, + { + "epoch": 0.65, + "learning_rate": 1.4562007076449945e-06, + "loss": 1.0397, + "step": 21510 + }, + { + "epoch": 0.65, + "learning_rate": 1.4559790703044863e-06, + "loss": 1.0125, + "step": 21511 + }, + { + "epoch": 0.65, + "learning_rate": 1.4557574429025548e-06, + "loss": 1.1487, + "step": 21512 + }, + { + "epoch": 0.65, + "learning_rate": 1.4555358254413094e-06, + "loss": 1.0579, + "step": 21513 + }, + { + "epoch": 0.65, + "learning_rate": 1.4553142179228607e-06, + "loss": 0.9883, + "step": 21514 + }, + { + "epoch": 0.65, + "learning_rate": 1.455092620349317e-06, + "loss": 1.0524, + "step": 21515 + }, + { + "epoch": 0.65, + "learning_rate": 1.454871032722788e-06, + "loss": 1.1819, + "step": 21516 + }, + { + "epoch": 0.65, + "learning_rate": 1.4546494550453835e-06, + "loss": 1.0917, + "step": 21517 + }, + { + "epoch": 0.65, + "learning_rate": 1.4544278873192125e-06, + "loss": 1.2809, + "step": 21518 + }, + { + "epoch": 0.65, + "learning_rate": 1.454206329546385e-06, + "loss": 1.2023, + "step": 21519 + }, + { + "epoch": 0.65, + "learning_rate": 1.453984781729009e-06, + "loss": 1.0003, + "step": 21520 + }, + { + "epoch": 0.65, + "learning_rate": 1.4537632438691946e-06, + "loss": 1.0832, + "step": 21521 + }, + { + "epoch": 0.65, + "learning_rate": 1.4535417159690495e-06, + "loss": 1.1504, + "step": 21522 + }, + { + "epoch": 0.65, + "learning_rate": 1.453320198030685e-06, + "loss": 1.1166, + "step": 21523 + }, + { + "epoch": 0.65, + "learning_rate": 1.4530986900562066e-06, + "loss": 1.1452, + "step": 21524 + }, + { + "epoch": 0.65, + "learning_rate": 1.4528771920477248e-06, + "loss": 1.1278, + "step": 21525 + }, + { + "epoch": 0.65, + "learning_rate": 1.4526557040073477e-06, + "loss": 1.0999, + "step": 21526 + }, + { + "epoch": 0.65, + "learning_rate": 1.4524342259371848e-06, + "loss": 1.0555, + "step": 21527 + }, + { + "epoch": 0.65, + "learning_rate": 1.452212757839343e-06, + "loss": 1.1238, + "step": 21528 + }, + { + "epoch": 0.65, + "learning_rate": 1.4519912997159308e-06, + "loss": 1.0112, + "step": 21529 + }, + { + "epoch": 0.65, + "learning_rate": 1.4517698515690565e-06, + "loss": 1.1058, + "step": 21530 + }, + { + "epoch": 0.65, + "learning_rate": 1.4515484134008284e-06, + "loss": 1.2465, + "step": 21531 + }, + { + "epoch": 0.65, + "learning_rate": 1.4513269852133557e-06, + "loss": 1.2156, + "step": 21532 + }, + { + "epoch": 0.65, + "learning_rate": 1.4511055670087436e-06, + "loss": 1.1824, + "step": 21533 + }, + { + "epoch": 0.65, + "learning_rate": 1.4508841587891021e-06, + "loss": 1.0904, + "step": 21534 + }, + { + "epoch": 0.65, + "learning_rate": 1.4506627605565377e-06, + "loss": 1.1708, + "step": 21535 + }, + { + "epoch": 0.65, + "learning_rate": 1.4504413723131594e-06, + "loss": 1.059, + "step": 21536 + }, + { + "epoch": 0.65, + "learning_rate": 1.4502199940610728e-06, + "loss": 1.1003, + "step": 21537 + }, + { + "epoch": 0.65, + "learning_rate": 1.4499986258023863e-06, + "loss": 1.059, + "step": 21538 + }, + { + "epoch": 0.65, + "learning_rate": 1.4497772675392069e-06, + "loss": 1.1541, + "step": 21539 + }, + { + "epoch": 0.65, + "learning_rate": 1.4495559192736437e-06, + "loss": 1.1422, + "step": 21540 + }, + { + "epoch": 0.65, + "learning_rate": 1.4493345810078008e-06, + "loss": 1.1444, + "step": 21541 + }, + { + "epoch": 0.65, + "learning_rate": 1.4491132527437864e-06, + "loss": 1.0177, + "step": 21542 + }, + { + "epoch": 0.65, + "learning_rate": 1.4488919344837083e-06, + "loss": 1.054, + "step": 21543 + }, + { + "epoch": 0.65, + "learning_rate": 1.4486706262296723e-06, + "loss": 1.1775, + "step": 21544 + }, + { + "epoch": 0.65, + "learning_rate": 1.4484493279837859e-06, + "loss": 1.1412, + "step": 21545 + }, + { + "epoch": 0.65, + "learning_rate": 1.4482280397481551e-06, + "loss": 1.0535, + "step": 21546 + }, + { + "epoch": 0.65, + "learning_rate": 1.4480067615248873e-06, + "loss": 1.2416, + "step": 21547 + }, + { + "epoch": 0.65, + "learning_rate": 1.4477854933160885e-06, + "loss": 1.1082, + "step": 21548 + }, + { + "epoch": 0.65, + "learning_rate": 1.4475642351238655e-06, + "loss": 1.1809, + "step": 21549 + }, + { + "epoch": 0.65, + "learning_rate": 1.4473429869503235e-06, + "loss": 1.0695, + "step": 21550 + }, + { + "epoch": 0.65, + "learning_rate": 1.4471217487975692e-06, + "loss": 1.008, + "step": 21551 + }, + { + "epoch": 0.65, + "learning_rate": 1.446900520667709e-06, + "loss": 1.1248, + "step": 21552 + }, + { + "epoch": 0.65, + "learning_rate": 1.4466793025628489e-06, + "loss": 1.1219, + "step": 21553 + }, + { + "epoch": 0.65, + "learning_rate": 1.4464580944850941e-06, + "loss": 1.1802, + "step": 21554 + }, + { + "epoch": 0.65, + "learning_rate": 1.4462368964365509e-06, + "loss": 1.2363, + "step": 21555 + }, + { + "epoch": 0.65, + "learning_rate": 1.446015708419325e-06, + "loss": 1.0302, + "step": 21556 + }, + { + "epoch": 0.65, + "learning_rate": 1.4457945304355217e-06, + "loss": 1.2061, + "step": 21557 + }, + { + "epoch": 0.65, + "learning_rate": 1.4455733624872478e-06, + "loss": 1.0563, + "step": 21558 + }, + { + "epoch": 0.65, + "learning_rate": 1.4453522045766067e-06, + "loss": 1.09, + "step": 21559 + }, + { + "epoch": 0.65, + "learning_rate": 1.4451310567057048e-06, + "loss": 1.0843, + "step": 21560 + }, + { + "epoch": 0.65, + "learning_rate": 1.4449099188766468e-06, + "loss": 1.1281, + "step": 21561 + }, + { + "epoch": 0.65, + "learning_rate": 1.4446887910915397e-06, + "loss": 1.1383, + "step": 21562 + }, + { + "epoch": 0.65, + "learning_rate": 1.4444676733524856e-06, + "loss": 1.0894, + "step": 21563 + }, + { + "epoch": 0.65, + "learning_rate": 1.444246565661591e-06, + "loss": 1.1583, + "step": 21564 + }, + { + "epoch": 0.65, + "learning_rate": 1.4440254680209608e-06, + "loss": 1.1042, + "step": 21565 + }, + { + "epoch": 0.65, + "learning_rate": 1.4438043804327007e-06, + "loss": 1.0043, + "step": 21566 + }, + { + "epoch": 0.65, + "learning_rate": 1.443583302898913e-06, + "loss": 1.1014, + "step": 21567 + }, + { + "epoch": 0.65, + "learning_rate": 1.4433622354217035e-06, + "loss": 1.0665, + "step": 21568 + }, + { + "epoch": 0.65, + "learning_rate": 1.4431411780031765e-06, + "loss": 1.0561, + "step": 21569 + }, + { + "epoch": 0.65, + "learning_rate": 1.4429201306454365e-06, + "loss": 1.1228, + "step": 21570 + }, + { + "epoch": 0.65, + "learning_rate": 1.442699093350588e-06, + "loss": 1.0413, + "step": 21571 + }, + { + "epoch": 0.65, + "learning_rate": 1.442478066120735e-06, + "loss": 1.1321, + "step": 21572 + }, + { + "epoch": 0.65, + "learning_rate": 1.4422570489579813e-06, + "loss": 1.1136, + "step": 21573 + }, + { + "epoch": 0.65, + "learning_rate": 1.442036041864432e-06, + "loss": 1.1264, + "step": 21574 + }, + { + "epoch": 0.65, + "learning_rate": 1.4418150448421888e-06, + "loss": 1.1796, + "step": 21575 + }, + { + "epoch": 0.65, + "learning_rate": 1.441594057893357e-06, + "loss": 1.0645, + "step": 21576 + }, + { + "epoch": 0.65, + "learning_rate": 1.44137308102004e-06, + "loss": 1.0026, + "step": 21577 + }, + { + "epoch": 0.65, + "learning_rate": 1.4411521142243415e-06, + "loss": 1.0634, + "step": 21578 + }, + { + "epoch": 0.65, + "learning_rate": 1.440931157508366e-06, + "loss": 1.0205, + "step": 21579 + }, + { + "epoch": 0.65, + "learning_rate": 1.4407102108742147e-06, + "loss": 1.1944, + "step": 21580 + }, + { + "epoch": 0.65, + "learning_rate": 1.4404892743239919e-06, + "loss": 1.0682, + "step": 21581 + }, + { + "epoch": 0.65, + "learning_rate": 1.4402683478598012e-06, + "loss": 1.0659, + "step": 21582 + }, + { + "epoch": 0.65, + "learning_rate": 1.4400474314837452e-06, + "loss": 1.1257, + "step": 21583 + }, + { + "epoch": 0.65, + "learning_rate": 1.4398265251979282e-06, + "loss": 1.0432, + "step": 21584 + }, + { + "epoch": 0.65, + "learning_rate": 1.439605629004451e-06, + "loss": 1.1778, + "step": 21585 + }, + { + "epoch": 0.65, + "learning_rate": 1.4393847429054175e-06, + "loss": 1.1898, + "step": 21586 + }, + { + "epoch": 0.65, + "learning_rate": 1.4391638669029307e-06, + "loss": 1.0408, + "step": 21587 + }, + { + "epoch": 0.65, + "learning_rate": 1.438943000999094e-06, + "loss": 1.1777, + "step": 21588 + }, + { + "epoch": 0.65, + "learning_rate": 1.4387221451960077e-06, + "loss": 1.114, + "step": 21589 + }, + { + "epoch": 0.65, + "learning_rate": 1.4385012994957754e-06, + "loss": 1.106, + "step": 21590 + }, + { + "epoch": 0.65, + "learning_rate": 1.4382804639004996e-06, + "loss": 1.1978, + "step": 21591 + }, + { + "epoch": 0.65, + "learning_rate": 1.4380596384122835e-06, + "loss": 1.1941, + "step": 21592 + }, + { + "epoch": 0.65, + "learning_rate": 1.437838823033227e-06, + "loss": 1.2332, + "step": 21593 + }, + { + "epoch": 0.65, + "learning_rate": 1.4376180177654336e-06, + "loss": 1.2145, + "step": 21594 + }, + { + "epoch": 0.65, + "learning_rate": 1.437397222611005e-06, + "loss": 1.1288, + "step": 21595 + }, + { + "epoch": 0.65, + "learning_rate": 1.4371764375720426e-06, + "loss": 1.074, + "step": 21596 + }, + { + "epoch": 0.65, + "learning_rate": 1.4369556626506503e-06, + "loss": 1.0961, + "step": 21597 + }, + { + "epoch": 0.65, + "learning_rate": 1.4367348978489265e-06, + "loss": 1.0902, + "step": 21598 + }, + { + "epoch": 0.65, + "learning_rate": 1.436514143168975e-06, + "loss": 1.169, + "step": 21599 + }, + { + "epoch": 0.65, + "learning_rate": 1.4362933986128962e-06, + "loss": 1.2319, + "step": 21600 + }, + { + "epoch": 0.65, + "learning_rate": 1.436072664182792e-06, + "loss": 1.1069, + "step": 21601 + }, + { + "epoch": 0.65, + "learning_rate": 1.4358519398807638e-06, + "loss": 1.0562, + "step": 21602 + }, + { + "epoch": 0.65, + "learning_rate": 1.4356312257089127e-06, + "loss": 1.186, + "step": 21603 + }, + { + "epoch": 0.65, + "learning_rate": 1.4354105216693396e-06, + "loss": 0.959, + "step": 21604 + }, + { + "epoch": 0.65, + "learning_rate": 1.4351898277641466e-06, + "loss": 1.1465, + "step": 21605 + }, + { + "epoch": 0.65, + "learning_rate": 1.4349691439954325e-06, + "loss": 1.1479, + "step": 21606 + }, + { + "epoch": 0.65, + "learning_rate": 1.4347484703652991e-06, + "loss": 1.0832, + "step": 21607 + }, + { + "epoch": 0.65, + "learning_rate": 1.4345278068758478e-06, + "loss": 1.1216, + "step": 21608 + }, + { + "epoch": 0.65, + "learning_rate": 1.434307153529178e-06, + "loss": 0.9929, + "step": 21609 + }, + { + "epoch": 0.65, + "learning_rate": 1.4340865103273921e-06, + "loss": 1.1166, + "step": 21610 + }, + { + "epoch": 0.65, + "learning_rate": 1.4338658772725883e-06, + "loss": 1.0844, + "step": 21611 + }, + { + "epoch": 0.65, + "learning_rate": 1.4336452543668677e-06, + "loss": 1.188, + "step": 21612 + }, + { + "epoch": 0.65, + "learning_rate": 1.433424641612331e-06, + "loss": 1.069, + "step": 21613 + }, + { + "epoch": 0.65, + "learning_rate": 1.433204039011079e-06, + "loss": 1.1224, + "step": 21614 + }, + { + "epoch": 0.65, + "learning_rate": 1.4329834465652096e-06, + "loss": 1.0854, + "step": 21615 + }, + { + "epoch": 0.65, + "learning_rate": 1.4327628642768237e-06, + "loss": 1.0977, + "step": 21616 + }, + { + "epoch": 0.65, + "learning_rate": 1.4325422921480217e-06, + "loss": 1.1626, + "step": 21617 + }, + { + "epoch": 0.65, + "learning_rate": 1.4323217301809039e-06, + "loss": 1.123, + "step": 21618 + }, + { + "epoch": 0.65, + "learning_rate": 1.432101178377568e-06, + "loss": 1.1139, + "step": 21619 + }, + { + "epoch": 0.65, + "learning_rate": 1.4318806367401144e-06, + "loss": 1.101, + "step": 21620 + }, + { + "epoch": 0.65, + "learning_rate": 1.4316601052706431e-06, + "loss": 1.2014, + "step": 21621 + }, + { + "epoch": 0.65, + "learning_rate": 1.4314395839712525e-06, + "loss": 1.1299, + "step": 21622 + }, + { + "epoch": 0.65, + "learning_rate": 1.4312190728440439e-06, + "loss": 1.1006, + "step": 21623 + }, + { + "epoch": 0.65, + "learning_rate": 1.4309985718911138e-06, + "loss": 1.1106, + "step": 21624 + }, + { + "epoch": 0.65, + "learning_rate": 1.4307780811145624e-06, + "loss": 1.0977, + "step": 21625 + }, + { + "epoch": 0.65, + "learning_rate": 1.430557600516489e-06, + "loss": 1.1127, + "step": 21626 + }, + { + "epoch": 0.65, + "learning_rate": 1.4303371300989916e-06, + "loss": 1.0963, + "step": 21627 + }, + { + "epoch": 0.65, + "learning_rate": 1.43011666986417e-06, + "loss": 1.0229, + "step": 21628 + }, + { + "epoch": 0.65, + "learning_rate": 1.4298962198141225e-06, + "loss": 1.0469, + "step": 21629 + }, + { + "epoch": 0.65, + "learning_rate": 1.4296757799509473e-06, + "loss": 1.0391, + "step": 21630 + }, + { + "epoch": 0.65, + "learning_rate": 1.4294553502767444e-06, + "loss": 1.292, + "step": 21631 + }, + { + "epoch": 0.65, + "learning_rate": 1.4292349307936098e-06, + "loss": 1.0104, + "step": 21632 + }, + { + "epoch": 0.65, + "learning_rate": 1.4290145215036433e-06, + "loss": 1.2483, + "step": 21633 + }, + { + "epoch": 0.65, + "learning_rate": 1.4287941224089425e-06, + "loss": 1.0263, + "step": 21634 + }, + { + "epoch": 0.65, + "learning_rate": 1.4285737335116057e-06, + "loss": 1.0942, + "step": 21635 + }, + { + "epoch": 0.65, + "learning_rate": 1.4283533548137318e-06, + "loss": 1.2088, + "step": 21636 + }, + { + "epoch": 0.65, + "learning_rate": 1.428132986317417e-06, + "loss": 1.1345, + "step": 21637 + }, + { + "epoch": 0.65, + "learning_rate": 1.4279126280247602e-06, + "loss": 1.1345, + "step": 21638 + }, + { + "epoch": 0.65, + "learning_rate": 1.4276922799378583e-06, + "loss": 1.0701, + "step": 21639 + }, + { + "epoch": 0.65, + "learning_rate": 1.4274719420588112e-06, + "loss": 1.0123, + "step": 21640 + }, + { + "epoch": 0.65, + "learning_rate": 1.427251614389713e-06, + "loss": 1.1551, + "step": 21641 + }, + { + "epoch": 0.65, + "learning_rate": 1.4270312969326632e-06, + "loss": 1.1625, + "step": 21642 + }, + { + "epoch": 0.65, + "learning_rate": 1.4268109896897586e-06, + "loss": 1.1811, + "step": 21643 + }, + { + "epoch": 0.65, + "learning_rate": 1.4265906926630973e-06, + "loss": 0.9387, + "step": 21644 + }, + { + "epoch": 0.65, + "learning_rate": 1.4263704058547747e-06, + "loss": 1.1927, + "step": 21645 + }, + { + "epoch": 0.65, + "learning_rate": 1.426150129266889e-06, + "loss": 1.1199, + "step": 21646 + }, + { + "epoch": 0.65, + "learning_rate": 1.4259298629015366e-06, + "loss": 1.0677, + "step": 21647 + }, + { + "epoch": 0.65, + "learning_rate": 1.4257096067608144e-06, + "loss": 1.1303, + "step": 21648 + }, + { + "epoch": 0.65, + "learning_rate": 1.4254893608468209e-06, + "loss": 1.0851, + "step": 21649 + }, + { + "epoch": 0.65, + "learning_rate": 1.4252691251616502e-06, + "loss": 1.2503, + "step": 21650 + }, + { + "epoch": 0.65, + "learning_rate": 1.4250488997073995e-06, + "loss": 1.1469, + "step": 21651 + }, + { + "epoch": 0.65, + "learning_rate": 1.4248286844861655e-06, + "loss": 1.0989, + "step": 21652 + }, + { + "epoch": 0.65, + "learning_rate": 1.4246084795000447e-06, + "loss": 1.1353, + "step": 21653 + }, + { + "epoch": 0.65, + "learning_rate": 1.4243882847511333e-06, + "loss": 1.1658, + "step": 21654 + }, + { + "epoch": 0.65, + "learning_rate": 1.4241681002415276e-06, + "loss": 1.2148, + "step": 21655 + }, + { + "epoch": 0.65, + "learning_rate": 1.423947925973324e-06, + "loss": 1.1881, + "step": 21656 + }, + { + "epoch": 0.65, + "learning_rate": 1.4237277619486172e-06, + "loss": 1.0336, + "step": 21657 + }, + { + "epoch": 0.65, + "learning_rate": 1.4235076081695037e-06, + "loss": 1.0765, + "step": 21658 + }, + { + "epoch": 0.65, + "learning_rate": 1.4232874646380793e-06, + "loss": 1.2109, + "step": 21659 + }, + { + "epoch": 0.65, + "learning_rate": 1.4230673313564397e-06, + "loss": 1.0485, + "step": 21660 + }, + { + "epoch": 0.65, + "learning_rate": 1.4228472083266804e-06, + "loss": 1.1961, + "step": 21661 + }, + { + "epoch": 0.65, + "learning_rate": 1.422627095550898e-06, + "loss": 1.1752, + "step": 21662 + }, + { + "epoch": 0.65, + "learning_rate": 1.4224069930311856e-06, + "loss": 1.0839, + "step": 21663 + }, + { + "epoch": 0.65, + "learning_rate": 1.4221869007696398e-06, + "loss": 1.0938, + "step": 21664 + }, + { + "epoch": 0.65, + "learning_rate": 1.4219668187683555e-06, + "loss": 1.1721, + "step": 21665 + }, + { + "epoch": 0.65, + "learning_rate": 1.4217467470294288e-06, + "loss": 1.0353, + "step": 21666 + }, + { + "epoch": 0.65, + "learning_rate": 1.4215266855549531e-06, + "loss": 1.1561, + "step": 21667 + }, + { + "epoch": 0.65, + "learning_rate": 1.4213066343470237e-06, + "loss": 1.0323, + "step": 21668 + }, + { + "epoch": 0.65, + "learning_rate": 1.4210865934077356e-06, + "loss": 1.1326, + "step": 21669 + }, + { + "epoch": 0.65, + "learning_rate": 1.4208665627391843e-06, + "loss": 1.0997, + "step": 21670 + }, + { + "epoch": 0.65, + "learning_rate": 1.4206465423434628e-06, + "loss": 1.14, + "step": 21671 + }, + { + "epoch": 0.65, + "learning_rate": 1.4204265322226668e-06, + "loss": 1.0403, + "step": 21672 + }, + { + "epoch": 0.65, + "learning_rate": 1.4202065323788899e-06, + "loss": 1.1093, + "step": 21673 + }, + { + "epoch": 0.65, + "learning_rate": 1.4199865428142268e-06, + "loss": 1.0549, + "step": 21674 + }, + { + "epoch": 0.65, + "learning_rate": 1.4197665635307725e-06, + "loss": 1.1633, + "step": 21675 + }, + { + "epoch": 0.65, + "learning_rate": 1.4195465945306195e-06, + "loss": 1.0873, + "step": 21676 + }, + { + "epoch": 0.65, + "learning_rate": 1.4193266358158624e-06, + "loss": 1.1512, + "step": 21677 + }, + { + "epoch": 0.65, + "learning_rate": 1.4191066873885953e-06, + "loss": 1.0425, + "step": 21678 + }, + { + "epoch": 0.65, + "learning_rate": 1.418886749250913e-06, + "loss": 1.0723, + "step": 21679 + }, + { + "epoch": 0.65, + "learning_rate": 1.418666821404907e-06, + "loss": 1.042, + "step": 21680 + }, + { + "epoch": 0.65, + "learning_rate": 1.4184469038526721e-06, + "loss": 1.0778, + "step": 21681 + }, + { + "epoch": 0.65, + "learning_rate": 1.418226996596302e-06, + "loss": 1.1999, + "step": 21682 + }, + { + "epoch": 0.65, + "learning_rate": 1.4180070996378898e-06, + "loss": 1.0931, + "step": 21683 + }, + { + "epoch": 0.65, + "learning_rate": 1.417787212979529e-06, + "loss": 1.0596, + "step": 21684 + }, + { + "epoch": 0.65, + "learning_rate": 1.4175673366233126e-06, + "loss": 1.1909, + "step": 21685 + }, + { + "epoch": 0.65, + "learning_rate": 1.4173474705713337e-06, + "loss": 1.1431, + "step": 21686 + }, + { + "epoch": 0.65, + "learning_rate": 1.4171276148256858e-06, + "loss": 1.2314, + "step": 21687 + }, + { + "epoch": 0.65, + "learning_rate": 1.4169077693884623e-06, + "loss": 1.1281, + "step": 21688 + }, + { + "epoch": 0.65, + "learning_rate": 1.416687934261754e-06, + "loss": 1.0938, + "step": 21689 + }, + { + "epoch": 0.65, + "learning_rate": 1.4164681094476552e-06, + "loss": 1.1175, + "step": 21690 + }, + { + "epoch": 0.65, + "learning_rate": 1.4162482949482578e-06, + "loss": 1.1384, + "step": 21691 + }, + { + "epoch": 0.65, + "learning_rate": 1.4160284907656558e-06, + "loss": 1.1204, + "step": 21692 + }, + { + "epoch": 0.65, + "learning_rate": 1.4158086969019396e-06, + "loss": 1.1335, + "step": 21693 + }, + { + "epoch": 0.65, + "learning_rate": 1.4155889133592025e-06, + "loss": 1.0405, + "step": 21694 + }, + { + "epoch": 0.65, + "learning_rate": 1.4153691401395365e-06, + "loss": 1.1115, + "step": 21695 + }, + { + "epoch": 0.65, + "learning_rate": 1.4151493772450349e-06, + "loss": 1.1134, + "step": 21696 + }, + { + "epoch": 0.65, + "learning_rate": 1.4149296246777878e-06, + "loss": 1.0109, + "step": 21697 + }, + { + "epoch": 0.65, + "learning_rate": 1.414709882439888e-06, + "loss": 1.1141, + "step": 21698 + }, + { + "epoch": 0.65, + "learning_rate": 1.4144901505334277e-06, + "loss": 1.1794, + "step": 21699 + }, + { + "epoch": 0.65, + "learning_rate": 1.4142704289604992e-06, + "loss": 1.0446, + "step": 21700 + }, + { + "epoch": 0.65, + "learning_rate": 1.414050717723192e-06, + "loss": 1.0269, + "step": 21701 + }, + { + "epoch": 0.65, + "learning_rate": 1.4138310168235998e-06, + "loss": 1.1506, + "step": 21702 + }, + { + "epoch": 0.65, + "learning_rate": 1.4136113262638123e-06, + "loss": 1.1057, + "step": 21703 + }, + { + "epoch": 0.65, + "learning_rate": 1.4133916460459224e-06, + "loss": 1.1001, + "step": 21704 + }, + { + "epoch": 0.65, + "learning_rate": 1.4131719761720214e-06, + "loss": 1.1041, + "step": 21705 + }, + { + "epoch": 0.65, + "learning_rate": 1.4129523166441985e-06, + "loss": 0.975, + "step": 21706 + }, + { + "epoch": 0.65, + "learning_rate": 1.4127326674645464e-06, + "loss": 1.1731, + "step": 21707 + }, + { + "epoch": 0.65, + "learning_rate": 1.4125130286351553e-06, + "loss": 1.132, + "step": 21708 + }, + { + "epoch": 0.65, + "learning_rate": 1.4122934001581167e-06, + "loss": 1.0244, + "step": 21709 + }, + { + "epoch": 0.65, + "learning_rate": 1.4120737820355214e-06, + "loss": 1.0455, + "step": 21710 + }, + { + "epoch": 0.65, + "learning_rate": 1.4118541742694592e-06, + "loss": 1.0729, + "step": 21711 + }, + { + "epoch": 0.65, + "learning_rate": 1.4116345768620212e-06, + "loss": 1.102, + "step": 21712 + }, + { + "epoch": 0.65, + "learning_rate": 1.411414989815299e-06, + "loss": 1.1255, + "step": 21713 + }, + { + "epoch": 0.65, + "learning_rate": 1.411195413131381e-06, + "loss": 1.0981, + "step": 21714 + }, + { + "epoch": 0.65, + "learning_rate": 1.410975846812358e-06, + "loss": 1.1188, + "step": 21715 + }, + { + "epoch": 0.65, + "learning_rate": 1.4107562908603205e-06, + "loss": 1.0496, + "step": 21716 + }, + { + "epoch": 0.65, + "learning_rate": 1.4105367452773585e-06, + "loss": 1.0768, + "step": 21717 + }, + { + "epoch": 0.65, + "learning_rate": 1.4103172100655631e-06, + "loss": 1.1263, + "step": 21718 + }, + { + "epoch": 0.65, + "learning_rate": 1.410097685227022e-06, + "loss": 1.1199, + "step": 21719 + }, + { + "epoch": 0.65, + "learning_rate": 1.409878170763826e-06, + "loss": 0.9967, + "step": 21720 + }, + { + "epoch": 0.65, + "learning_rate": 1.409658666678065e-06, + "loss": 1.1477, + "step": 21721 + }, + { + "epoch": 0.65, + "learning_rate": 1.409439172971829e-06, + "loss": 0.9984, + "step": 21722 + }, + { + "epoch": 0.65, + "learning_rate": 1.409219689647206e-06, + "loss": 1.0424, + "step": 21723 + }, + { + "epoch": 0.65, + "learning_rate": 1.409000216706286e-06, + "loss": 1.1027, + "step": 21724 + }, + { + "epoch": 0.65, + "learning_rate": 1.408780754151159e-06, + "loss": 1.1155, + "step": 21725 + }, + { + "epoch": 0.65, + "learning_rate": 1.4085613019839146e-06, + "loss": 1.1387, + "step": 21726 + }, + { + "epoch": 0.65, + "learning_rate": 1.4083418602066396e-06, + "loss": 1.1438, + "step": 21727 + }, + { + "epoch": 0.65, + "learning_rate": 1.4081224288214243e-06, + "loss": 1.0605, + "step": 21728 + }, + { + "epoch": 0.65, + "learning_rate": 1.407903007830358e-06, + "loss": 1.103, + "step": 21729 + }, + { + "epoch": 0.65, + "learning_rate": 1.4076835972355287e-06, + "loss": 1.1551, + "step": 21730 + }, + { + "epoch": 0.65, + "learning_rate": 1.4074641970390267e-06, + "loss": 1.233, + "step": 21731 + }, + { + "epoch": 0.65, + "learning_rate": 1.4072448072429384e-06, + "loss": 1.0864, + "step": 21732 + }, + { + "epoch": 0.65, + "learning_rate": 1.407025427849353e-06, + "loss": 1.2108, + "step": 21733 + }, + { + "epoch": 0.65, + "learning_rate": 1.4068060588603593e-06, + "loss": 1.0592, + "step": 21734 + }, + { + "epoch": 0.65, + "learning_rate": 1.4065867002780454e-06, + "loss": 1.088, + "step": 21735 + }, + { + "epoch": 0.65, + "learning_rate": 1.4063673521044997e-06, + "loss": 1.0873, + "step": 21736 + }, + { + "epoch": 0.65, + "learning_rate": 1.4061480143418098e-06, + "loss": 1.1811, + "step": 21737 + }, + { + "epoch": 0.65, + "learning_rate": 1.4059286869920651e-06, + "loss": 1.1024, + "step": 21738 + }, + { + "epoch": 0.65, + "learning_rate": 1.4057093700573516e-06, + "loss": 1.0906, + "step": 21739 + }, + { + "epoch": 0.65, + "learning_rate": 1.4054900635397573e-06, + "loss": 1.1167, + "step": 21740 + }, + { + "epoch": 0.65, + "learning_rate": 1.405270767441371e-06, + "loss": 1.0132, + "step": 21741 + }, + { + "epoch": 0.65, + "learning_rate": 1.4050514817642797e-06, + "loss": 1.0354, + "step": 21742 + }, + { + "epoch": 0.66, + "learning_rate": 1.4048322065105707e-06, + "loss": 1.1839, + "step": 21743 + }, + { + "epoch": 0.66, + "learning_rate": 1.4046129416823328e-06, + "loss": 1.1597, + "step": 21744 + }, + { + "epoch": 0.66, + "learning_rate": 1.404393687281651e-06, + "loss": 1.0992, + "step": 21745 + }, + { + "epoch": 0.66, + "learning_rate": 1.4041744433106135e-06, + "loss": 1.0699, + "step": 21746 + }, + { + "epoch": 0.66, + "learning_rate": 1.403955209771308e-06, + "loss": 1.0188, + "step": 21747 + }, + { + "epoch": 0.66, + "learning_rate": 1.4037359866658218e-06, + "loss": 1.0801, + "step": 21748 + }, + { + "epoch": 0.66, + "learning_rate": 1.4035167739962403e-06, + "loss": 1.0478, + "step": 21749 + }, + { + "epoch": 0.66, + "learning_rate": 1.4032975717646505e-06, + "loss": 1.083, + "step": 21750 + }, + { + "epoch": 0.66, + "learning_rate": 1.4030783799731398e-06, + "loss": 1.0345, + "step": 21751 + }, + { + "epoch": 0.66, + "learning_rate": 1.4028591986237957e-06, + "loss": 1.0389, + "step": 21752 + }, + { + "epoch": 0.66, + "learning_rate": 1.4026400277187025e-06, + "loss": 1.0501, + "step": 21753 + }, + { + "epoch": 0.66, + "learning_rate": 1.4024208672599482e-06, + "loss": 1.1294, + "step": 21754 + }, + { + "epoch": 0.66, + "learning_rate": 1.4022017172496184e-06, + "loss": 1.1081, + "step": 21755 + }, + { + "epoch": 0.66, + "learning_rate": 1.4019825776897992e-06, + "loss": 1.0398, + "step": 21756 + }, + { + "epoch": 0.66, + "learning_rate": 1.401763448582578e-06, + "loss": 1.1158, + "step": 21757 + }, + { + "epoch": 0.66, + "learning_rate": 1.401544329930039e-06, + "loss": 1.0705, + "step": 21758 + }, + { + "epoch": 0.66, + "learning_rate": 1.4013252217342693e-06, + "loss": 1.1187, + "step": 21759 + }, + { + "epoch": 0.66, + "learning_rate": 1.401106123997354e-06, + "loss": 1.0393, + "step": 21760 + }, + { + "epoch": 0.66, + "learning_rate": 1.4008870367213803e-06, + "loss": 1.1559, + "step": 21761 + }, + { + "epoch": 0.66, + "learning_rate": 1.4006679599084317e-06, + "loss": 1.3167, + "step": 21762 + }, + { + "epoch": 0.66, + "learning_rate": 1.4004488935605948e-06, + "loss": 1.2136, + "step": 21763 + }, + { + "epoch": 0.66, + "learning_rate": 1.4002298376799545e-06, + "loss": 1.0706, + "step": 21764 + }, + { + "epoch": 0.66, + "learning_rate": 1.4000107922685966e-06, + "loss": 1.0361, + "step": 21765 + }, + { + "epoch": 0.66, + "learning_rate": 1.3997917573286062e-06, + "loss": 1.0223, + "step": 21766 + }, + { + "epoch": 0.66, + "learning_rate": 1.3995727328620683e-06, + "loss": 1.1372, + "step": 21767 + }, + { + "epoch": 0.66, + "learning_rate": 1.3993537188710683e-06, + "loss": 1.1492, + "step": 21768 + }, + { + "epoch": 0.66, + "learning_rate": 1.3991347153576907e-06, + "loss": 1.1835, + "step": 21769 + }, + { + "epoch": 0.66, + "learning_rate": 1.398915722324021e-06, + "loss": 1.0577, + "step": 21770 + }, + { + "epoch": 0.66, + "learning_rate": 1.3986967397721427e-06, + "loss": 1.067, + "step": 21771 + }, + { + "epoch": 0.66, + "learning_rate": 1.3984777677041412e-06, + "loss": 1.1802, + "step": 21772 + }, + { + "epoch": 0.66, + "learning_rate": 1.3982588061221003e-06, + "loss": 1.2358, + "step": 21773 + }, + { + "epoch": 0.66, + "learning_rate": 1.3980398550281063e-06, + "loss": 1.2695, + "step": 21774 + }, + { + "epoch": 0.66, + "learning_rate": 1.3978209144242411e-06, + "loss": 1.0661, + "step": 21775 + }, + { + "epoch": 0.66, + "learning_rate": 1.39760198431259e-06, + "loss": 1.0901, + "step": 21776 + }, + { + "epoch": 0.66, + "learning_rate": 1.3973830646952372e-06, + "loss": 1.0986, + "step": 21777 + }, + { + "epoch": 0.66, + "learning_rate": 1.3971641555742674e-06, + "loss": 1.0065, + "step": 21778 + }, + { + "epoch": 0.66, + "learning_rate": 1.3969452569517628e-06, + "loss": 1.135, + "step": 21779 + }, + { + "epoch": 0.66, + "learning_rate": 1.396726368829808e-06, + "loss": 1.0864, + "step": 21780 + }, + { + "epoch": 0.66, + "learning_rate": 1.3965074912104871e-06, + "loss": 1.202, + "step": 21781 + }, + { + "epoch": 0.66, + "learning_rate": 1.3962886240958828e-06, + "loss": 1.1113, + "step": 21782 + }, + { + "epoch": 0.66, + "learning_rate": 1.3960697674880807e-06, + "loss": 1.1077, + "step": 21783 + }, + { + "epoch": 0.66, + "learning_rate": 1.3958509213891619e-06, + "loss": 1.0208, + "step": 21784 + }, + { + "epoch": 0.66, + "learning_rate": 1.3956320858012102e-06, + "loss": 1.0229, + "step": 21785 + }, + { + "epoch": 0.66, + "learning_rate": 1.3954132607263094e-06, + "loss": 1.0293, + "step": 21786 + }, + { + "epoch": 0.66, + "learning_rate": 1.395194446166543e-06, + "loss": 1.1232, + "step": 21787 + }, + { + "epoch": 0.66, + "learning_rate": 1.3949756421239926e-06, + "loss": 1.1326, + "step": 21788 + }, + { + "epoch": 0.66, + "learning_rate": 1.3947568486007422e-06, + "loss": 1.1039, + "step": 21789 + }, + { + "epoch": 0.66, + "learning_rate": 1.3945380655988737e-06, + "loss": 1.027, + "step": 21790 + }, + { + "epoch": 0.66, + "learning_rate": 1.3943192931204707e-06, + "loss": 1.0039, + "step": 21791 + }, + { + "epoch": 0.66, + "learning_rate": 1.3941005311676156e-06, + "loss": 1.1446, + "step": 21792 + }, + { + "epoch": 0.66, + "learning_rate": 1.393881779742391e-06, + "loss": 1.1526, + "step": 21793 + }, + { + "epoch": 0.66, + "learning_rate": 1.3936630388468786e-06, + "loss": 1.2187, + "step": 21794 + }, + { + "epoch": 0.66, + "learning_rate": 1.3934443084831616e-06, + "loss": 1.102, + "step": 21795 + }, + { + "epoch": 0.66, + "learning_rate": 1.393225588653323e-06, + "loss": 1.0942, + "step": 21796 + }, + { + "epoch": 0.66, + "learning_rate": 1.3930068793594426e-06, + "loss": 1.0642, + "step": 21797 + }, + { + "epoch": 0.66, + "learning_rate": 1.392788180603603e-06, + "loss": 1.194, + "step": 21798 + }, + { + "epoch": 0.66, + "learning_rate": 1.3925694923878874e-06, + "loss": 1.1423, + "step": 21799 + }, + { + "epoch": 0.66, + "learning_rate": 1.3923508147143777e-06, + "loss": 1.1161, + "step": 21800 + }, + { + "epoch": 0.66, + "learning_rate": 1.3921321475851537e-06, + "loss": 1.178, + "step": 21801 + }, + { + "epoch": 0.66, + "learning_rate": 1.391913491002298e-06, + "loss": 1.2031, + "step": 21802 + }, + { + "epoch": 0.66, + "learning_rate": 1.3916948449678924e-06, + "loss": 1.0262, + "step": 21803 + }, + { + "epoch": 0.66, + "learning_rate": 1.391476209484019e-06, + "loss": 1.0876, + "step": 21804 + }, + { + "epoch": 0.66, + "learning_rate": 1.391257584552757e-06, + "loss": 1.1282, + "step": 21805 + }, + { + "epoch": 0.66, + "learning_rate": 1.3910389701761892e-06, + "loss": 1.1269, + "step": 21806 + }, + { + "epoch": 0.66, + "learning_rate": 1.3908203663563964e-06, + "loss": 0.9637, + "step": 21807 + }, + { + "epoch": 0.66, + "learning_rate": 1.390601773095459e-06, + "loss": 1.1152, + "step": 21808 + }, + { + "epoch": 0.66, + "learning_rate": 1.3903831903954596e-06, + "loss": 1.0226, + "step": 21809 + }, + { + "epoch": 0.66, + "learning_rate": 1.3901646182584768e-06, + "loss": 1.1099, + "step": 21810 + }, + { + "epoch": 0.66, + "learning_rate": 1.3899460566865924e-06, + "loss": 1.1729, + "step": 21811 + }, + { + "epoch": 0.66, + "learning_rate": 1.389727505681887e-06, + "loss": 1.0759, + "step": 21812 + }, + { + "epoch": 0.66, + "learning_rate": 1.389508965246442e-06, + "loss": 1.1277, + "step": 21813 + }, + { + "epoch": 0.66, + "learning_rate": 1.3892904353823355e-06, + "loss": 1.1105, + "step": 21814 + }, + { + "epoch": 0.66, + "learning_rate": 1.3890719160916493e-06, + "loss": 1.1357, + "step": 21815 + }, + { + "epoch": 0.66, + "learning_rate": 1.3888534073764636e-06, + "loss": 1.1102, + "step": 21816 + }, + { + "epoch": 0.66, + "learning_rate": 1.3886349092388585e-06, + "loss": 1.1057, + "step": 21817 + }, + { + "epoch": 0.66, + "learning_rate": 1.3884164216809131e-06, + "loss": 1.1038, + "step": 21818 + }, + { + "epoch": 0.66, + "learning_rate": 1.3881979447047086e-06, + "loss": 1.1747, + "step": 21819 + }, + { + "epoch": 0.66, + "learning_rate": 1.3879794783123252e-06, + "loss": 1.0747, + "step": 21820 + }, + { + "epoch": 0.66, + "learning_rate": 1.3877610225058402e-06, + "loss": 1.1096, + "step": 21821 + }, + { + "epoch": 0.66, + "learning_rate": 1.387542577287335e-06, + "loss": 1.0917, + "step": 21822 + }, + { + "epoch": 0.66, + "learning_rate": 1.3873241426588885e-06, + "loss": 1.0625, + "step": 21823 + }, + { + "epoch": 0.66, + "learning_rate": 1.38710571862258e-06, + "loss": 1.1714, + "step": 21824 + }, + { + "epoch": 0.66, + "learning_rate": 1.3868873051804896e-06, + "loss": 1.1389, + "step": 21825 + }, + { + "epoch": 0.66, + "learning_rate": 1.3866689023346969e-06, + "loss": 1.0391, + "step": 21826 + }, + { + "epoch": 0.66, + "learning_rate": 1.3864505100872787e-06, + "loss": 1.1331, + "step": 21827 + }, + { + "epoch": 0.66, + "learning_rate": 1.3862321284403155e-06, + "loss": 1.1344, + "step": 21828 + }, + { + "epoch": 0.66, + "learning_rate": 1.386013757395886e-06, + "loss": 1.1811, + "step": 21829 + }, + { + "epoch": 0.66, + "learning_rate": 1.38579539695607e-06, + "loss": 1.1822, + "step": 21830 + }, + { + "epoch": 0.66, + "learning_rate": 1.3855770471229443e-06, + "loss": 1.2178, + "step": 21831 + }, + { + "epoch": 0.66, + "learning_rate": 1.3853587078985884e-06, + "loss": 1.1256, + "step": 21832 + }, + { + "epoch": 0.66, + "learning_rate": 1.3851403792850807e-06, + "loss": 0.9529, + "step": 21833 + }, + { + "epoch": 0.66, + "learning_rate": 1.3849220612844997e-06, + "loss": 1.0355, + "step": 21834 + }, + { + "epoch": 0.66, + "learning_rate": 1.3847037538989243e-06, + "loss": 1.0671, + "step": 21835 + }, + { + "epoch": 0.66, + "learning_rate": 1.3844854571304318e-06, + "loss": 1.1085, + "step": 21836 + }, + { + "epoch": 0.66, + "learning_rate": 1.3842671709810996e-06, + "loss": 1.2604, + "step": 21837 + }, + { + "epoch": 0.66, + "learning_rate": 1.384048895453007e-06, + "loss": 1.1066, + "step": 21838 + }, + { + "epoch": 0.66, + "learning_rate": 1.3838306305482325e-06, + "loss": 1.114, + "step": 21839 + }, + { + "epoch": 0.66, + "learning_rate": 1.3836123762688518e-06, + "loss": 1.0682, + "step": 21840 + }, + { + "epoch": 0.66, + "learning_rate": 1.3833941326169437e-06, + "loss": 1.1345, + "step": 21841 + }, + { + "epoch": 0.66, + "learning_rate": 1.3831758995945854e-06, + "loss": 1.1183, + "step": 21842 + }, + { + "epoch": 0.66, + "learning_rate": 1.382957677203856e-06, + "loss": 1.3124, + "step": 21843 + }, + { + "epoch": 0.66, + "learning_rate": 1.3827394654468302e-06, + "loss": 1.1011, + "step": 21844 + }, + { + "epoch": 0.66, + "learning_rate": 1.382521264325587e-06, + "loss": 1.0553, + "step": 21845 + }, + { + "epoch": 0.66, + "learning_rate": 1.3823030738422026e-06, + "loss": 1.0983, + "step": 21846 + }, + { + "epoch": 0.66, + "learning_rate": 1.3820848939987552e-06, + "loss": 1.0962, + "step": 21847 + }, + { + "epoch": 0.66, + "learning_rate": 1.3818667247973208e-06, + "loss": 1.0707, + "step": 21848 + }, + { + "epoch": 0.66, + "learning_rate": 1.381648566239977e-06, + "loss": 1.0587, + "step": 21849 + }, + { + "epoch": 0.66, + "learning_rate": 1.3814304183288e-06, + "loss": 1.0485, + "step": 21850 + }, + { + "epoch": 0.66, + "learning_rate": 1.3812122810658667e-06, + "loss": 1.0209, + "step": 21851 + }, + { + "epoch": 0.66, + "learning_rate": 1.3809941544532545e-06, + "loss": 1.1083, + "step": 21852 + }, + { + "epoch": 0.66, + "learning_rate": 1.3807760384930385e-06, + "loss": 1.1542, + "step": 21853 + }, + { + "epoch": 0.66, + "learning_rate": 1.3805579331872954e-06, + "loss": 1.1218, + "step": 21854 + }, + { + "epoch": 0.66, + "learning_rate": 1.3803398385381012e-06, + "loss": 1.2839, + "step": 21855 + }, + { + "epoch": 0.66, + "learning_rate": 1.3801217545475338e-06, + "loss": 1.0593, + "step": 21856 + }, + { + "epoch": 0.66, + "learning_rate": 1.379903681217667e-06, + "loss": 1.1135, + "step": 21857 + }, + { + "epoch": 0.66, + "learning_rate": 1.3796856185505778e-06, + "loss": 0.9601, + "step": 21858 + }, + { + "epoch": 0.66, + "learning_rate": 1.3794675665483418e-06, + "loss": 1.2166, + "step": 21859 + }, + { + "epoch": 0.66, + "learning_rate": 1.379249525213035e-06, + "loss": 1.0917, + "step": 21860 + }, + { + "epoch": 0.66, + "learning_rate": 1.3790314945467337e-06, + "loss": 1.0367, + "step": 21861 + }, + { + "epoch": 0.66, + "learning_rate": 1.3788134745515118e-06, + "loss": 1.3083, + "step": 21862 + }, + { + "epoch": 0.66, + "learning_rate": 1.378595465229446e-06, + "loss": 1.1926, + "step": 21863 + }, + { + "epoch": 0.66, + "learning_rate": 1.3783774665826109e-06, + "loss": 1.0769, + "step": 21864 + }, + { + "epoch": 0.66, + "learning_rate": 1.378159478613083e-06, + "loss": 1.1202, + "step": 21865 + }, + { + "epoch": 0.66, + "learning_rate": 1.3779415013229358e-06, + "loss": 1.0207, + "step": 21866 + }, + { + "epoch": 0.66, + "learning_rate": 1.3777235347142453e-06, + "loss": 1.1379, + "step": 21867 + }, + { + "epoch": 0.66, + "learning_rate": 1.377505578789086e-06, + "loss": 1.1356, + "step": 21868 + }, + { + "epoch": 0.66, + "learning_rate": 1.3772876335495339e-06, + "loss": 1.2132, + "step": 21869 + }, + { + "epoch": 0.66, + "learning_rate": 1.3770696989976618e-06, + "loss": 1.1722, + "step": 21870 + }, + { + "epoch": 0.66, + "learning_rate": 1.3768517751355456e-06, + "loss": 1.2126, + "step": 21871 + }, + { + "epoch": 0.66, + "learning_rate": 1.3766338619652595e-06, + "loss": 1.1732, + "step": 21872 + }, + { + "epoch": 0.66, + "learning_rate": 1.3764159594888778e-06, + "loss": 1.1334, + "step": 21873 + }, + { + "epoch": 0.66, + "learning_rate": 1.3761980677084752e-06, + "loss": 1.1558, + "step": 21874 + }, + { + "epoch": 0.66, + "learning_rate": 1.3759801866261259e-06, + "loss": 1.0865, + "step": 21875 + }, + { + "epoch": 0.66, + "learning_rate": 1.3757623162439035e-06, + "loss": 1.0079, + "step": 21876 + }, + { + "epoch": 0.66, + "learning_rate": 1.3755444565638827e-06, + "loss": 1.0945, + "step": 21877 + }, + { + "epoch": 0.66, + "learning_rate": 1.3753266075881378e-06, + "loss": 1.1896, + "step": 21878 + }, + { + "epoch": 0.66, + "learning_rate": 1.3751087693187412e-06, + "loss": 1.0474, + "step": 21879 + }, + { + "epoch": 0.66, + "learning_rate": 1.3748909417577673e-06, + "loss": 1.1808, + "step": 21880 + }, + { + "epoch": 0.66, + "learning_rate": 1.3746731249072897e-06, + "loss": 1.2555, + "step": 21881 + }, + { + "epoch": 0.66, + "learning_rate": 1.3744553187693832e-06, + "loss": 1.1682, + "step": 21882 + }, + { + "epoch": 0.66, + "learning_rate": 1.3742375233461186e-06, + "loss": 1.1127, + "step": 21883 + }, + { + "epoch": 0.66, + "learning_rate": 1.374019738639571e-06, + "loss": 1.0443, + "step": 21884 + }, + { + "epoch": 0.66, + "learning_rate": 1.373801964651813e-06, + "loss": 1.054, + "step": 21885 + }, + { + "epoch": 0.66, + "learning_rate": 1.3735842013849187e-06, + "loss": 1.1835, + "step": 21886 + }, + { + "epoch": 0.66, + "learning_rate": 1.3733664488409598e-06, + "loss": 1.136, + "step": 21887 + }, + { + "epoch": 0.66, + "learning_rate": 1.3731487070220095e-06, + "loss": 1.1158, + "step": 21888 + }, + { + "epoch": 0.66, + "learning_rate": 1.3729309759301407e-06, + "loss": 1.2152, + "step": 21889 + }, + { + "epoch": 0.66, + "learning_rate": 1.372713255567426e-06, + "loss": 1.0325, + "step": 21890 + }, + { + "epoch": 0.66, + "learning_rate": 1.3724955459359397e-06, + "loss": 1.0983, + "step": 21891 + }, + { + "epoch": 0.66, + "learning_rate": 1.3722778470377512e-06, + "loss": 1.1368, + "step": 21892 + }, + { + "epoch": 0.66, + "learning_rate": 1.372060158874935e-06, + "loss": 1.1278, + "step": 21893 + }, + { + "epoch": 0.66, + "learning_rate": 1.3718424814495623e-06, + "loss": 1.1552, + "step": 21894 + }, + { + "epoch": 0.66, + "learning_rate": 1.3716248147637073e-06, + "loss": 1.1, + "step": 21895 + }, + { + "epoch": 0.66, + "learning_rate": 1.3714071588194394e-06, + "loss": 1.0474, + "step": 21896 + }, + { + "epoch": 0.66, + "learning_rate": 1.371189513618832e-06, + "loss": 1.1326, + "step": 21897 + }, + { + "epoch": 0.66, + "learning_rate": 1.3709718791639564e-06, + "loss": 1.0849, + "step": 21898 + }, + { + "epoch": 0.66, + "learning_rate": 1.3707542554568847e-06, + "loss": 1.2541, + "step": 21899 + }, + { + "epoch": 0.66, + "learning_rate": 1.370536642499689e-06, + "loss": 1.1772, + "step": 21900 + }, + { + "epoch": 0.66, + "learning_rate": 1.3703190402944406e-06, + "loss": 1.0643, + "step": 21901 + }, + { + "epoch": 0.66, + "learning_rate": 1.3701014488432107e-06, + "loss": 1.1014, + "step": 21902 + }, + { + "epoch": 0.66, + "learning_rate": 1.3698838681480717e-06, + "loss": 1.142, + "step": 21903 + }, + { + "epoch": 0.66, + "learning_rate": 1.369666298211093e-06, + "loss": 1.1108, + "step": 21904 + }, + { + "epoch": 0.66, + "learning_rate": 1.369448739034347e-06, + "loss": 1.1561, + "step": 21905 + }, + { + "epoch": 0.66, + "learning_rate": 1.369231190619904e-06, + "loss": 1.2256, + "step": 21906 + }, + { + "epoch": 0.66, + "learning_rate": 1.3690136529698361e-06, + "loss": 1.0336, + "step": 21907 + }, + { + "epoch": 0.66, + "learning_rate": 1.3687961260862142e-06, + "loss": 1.1108, + "step": 21908 + }, + { + "epoch": 0.66, + "learning_rate": 1.3685786099711073e-06, + "loss": 1.0961, + "step": 21909 + }, + { + "epoch": 0.66, + "learning_rate": 1.3683611046265872e-06, + "loss": 1.0872, + "step": 21910 + }, + { + "epoch": 0.66, + "learning_rate": 1.3681436100547246e-06, + "loss": 1.1474, + "step": 21911 + }, + { + "epoch": 0.66, + "learning_rate": 1.3679261262575905e-06, + "loss": 1.313, + "step": 21912 + }, + { + "epoch": 0.66, + "learning_rate": 1.3677086532372535e-06, + "loss": 1.0492, + "step": 21913 + }, + { + "epoch": 0.66, + "learning_rate": 1.3674911909957847e-06, + "loss": 1.1956, + "step": 21914 + }, + { + "epoch": 0.66, + "learning_rate": 1.3672737395352543e-06, + "loss": 1.0399, + "step": 21915 + }, + { + "epoch": 0.66, + "learning_rate": 1.3670562988577323e-06, + "loss": 1.0605, + "step": 21916 + }, + { + "epoch": 0.66, + "learning_rate": 1.3668388689652901e-06, + "loss": 1.0765, + "step": 21917 + }, + { + "epoch": 0.66, + "learning_rate": 1.3666214498599948e-06, + "loss": 1.1341, + "step": 21918 + }, + { + "epoch": 0.66, + "learning_rate": 1.3664040415439172e-06, + "loss": 1.1779, + "step": 21919 + }, + { + "epoch": 0.66, + "learning_rate": 1.3661866440191277e-06, + "loss": 1.1852, + "step": 21920 + }, + { + "epoch": 0.66, + "learning_rate": 1.365969257287696e-06, + "loss": 1.0545, + "step": 21921 + }, + { + "epoch": 0.66, + "learning_rate": 1.36575188135169e-06, + "loss": 1.1313, + "step": 21922 + }, + { + "epoch": 0.66, + "learning_rate": 1.3655345162131795e-06, + "loss": 1.0515, + "step": 21923 + }, + { + "epoch": 0.66, + "learning_rate": 1.3653171618742341e-06, + "loss": 1.1419, + "step": 21924 + }, + { + "epoch": 0.66, + "learning_rate": 1.3650998183369241e-06, + "loss": 1.0662, + "step": 21925 + }, + { + "epoch": 0.66, + "learning_rate": 1.364882485603316e-06, + "loss": 1.0844, + "step": 21926 + }, + { + "epoch": 0.66, + "learning_rate": 1.36466516367548e-06, + "loss": 1.0864, + "step": 21927 + }, + { + "epoch": 0.66, + "learning_rate": 1.364447852555485e-06, + "loss": 1.036, + "step": 21928 + }, + { + "epoch": 0.66, + "learning_rate": 1.364230552245399e-06, + "loss": 1.1992, + "step": 21929 + }, + { + "epoch": 0.66, + "learning_rate": 1.3640132627472919e-06, + "loss": 1.2276, + "step": 21930 + }, + { + "epoch": 0.66, + "learning_rate": 1.3637959840632308e-06, + "loss": 1.1709, + "step": 21931 + }, + { + "epoch": 0.66, + "learning_rate": 1.3635787161952852e-06, + "loss": 1.1497, + "step": 21932 + }, + { + "epoch": 0.66, + "learning_rate": 1.3633614591455228e-06, + "loss": 1.047, + "step": 21933 + }, + { + "epoch": 0.66, + "learning_rate": 1.3631442129160128e-06, + "loss": 1.1282, + "step": 21934 + }, + { + "epoch": 0.66, + "learning_rate": 1.362926977508821e-06, + "loss": 1.1641, + "step": 21935 + }, + { + "epoch": 0.66, + "learning_rate": 1.3627097529260174e-06, + "loss": 1.1649, + "step": 21936 + }, + { + "epoch": 0.66, + "learning_rate": 1.3624925391696686e-06, + "loss": 1.1186, + "step": 21937 + }, + { + "epoch": 0.66, + "learning_rate": 1.3622753362418446e-06, + "loss": 1.1442, + "step": 21938 + }, + { + "epoch": 0.66, + "learning_rate": 1.3620581441446102e-06, + "loss": 1.0956, + "step": 21939 + }, + { + "epoch": 0.66, + "learning_rate": 1.361840962880034e-06, + "loss": 1.1942, + "step": 21940 + }, + { + "epoch": 0.66, + "learning_rate": 1.3616237924501837e-06, + "loss": 1.0463, + "step": 21941 + }, + { + "epoch": 0.66, + "learning_rate": 1.3614066328571267e-06, + "loss": 1.0675, + "step": 21942 + }, + { + "epoch": 0.66, + "learning_rate": 1.3611894841029314e-06, + "loss": 1.0715, + "step": 21943 + }, + { + "epoch": 0.66, + "learning_rate": 1.3609723461896626e-06, + "loss": 1.0792, + "step": 21944 + }, + { + "epoch": 0.66, + "learning_rate": 1.3607552191193885e-06, + "loss": 1.1151, + "step": 21945 + }, + { + "epoch": 0.66, + "learning_rate": 1.3605381028941761e-06, + "loss": 0.9537, + "step": 21946 + }, + { + "epoch": 0.66, + "learning_rate": 1.3603209975160931e-06, + "loss": 1.1138, + "step": 21947 + }, + { + "epoch": 0.66, + "learning_rate": 1.3601039029872043e-06, + "loss": 1.1149, + "step": 21948 + }, + { + "epoch": 0.66, + "learning_rate": 1.359886819309577e-06, + "loss": 1.1341, + "step": 21949 + }, + { + "epoch": 0.66, + "learning_rate": 1.3596697464852788e-06, + "loss": 1.1406, + "step": 21950 + }, + { + "epoch": 0.66, + "learning_rate": 1.3594526845163758e-06, + "loss": 1.1193, + "step": 21951 + }, + { + "epoch": 0.66, + "learning_rate": 1.3592356334049334e-06, + "loss": 1.0588, + "step": 21952 + }, + { + "epoch": 0.66, + "learning_rate": 1.359018593153018e-06, + "loss": 1.0732, + "step": 21953 + }, + { + "epoch": 0.66, + "learning_rate": 1.358801563762696e-06, + "loss": 1.2349, + "step": 21954 + }, + { + "epoch": 0.66, + "learning_rate": 1.3585845452360342e-06, + "loss": 1.0976, + "step": 21955 + }, + { + "epoch": 0.66, + "learning_rate": 1.3583675375750971e-06, + "loss": 1.1768, + "step": 21956 + }, + { + "epoch": 0.66, + "learning_rate": 1.3581505407819515e-06, + "loss": 1.1379, + "step": 21957 + }, + { + "epoch": 0.66, + "learning_rate": 1.3579335548586628e-06, + "loss": 1.0914, + "step": 21958 + }, + { + "epoch": 0.66, + "learning_rate": 1.3577165798072966e-06, + "loss": 1.0715, + "step": 21959 + }, + { + "epoch": 0.66, + "learning_rate": 1.3574996156299192e-06, + "loss": 1.1139, + "step": 21960 + }, + { + "epoch": 0.66, + "learning_rate": 1.3572826623285945e-06, + "loss": 1.1248, + "step": 21961 + }, + { + "epoch": 0.66, + "learning_rate": 1.3570657199053882e-06, + "loss": 1.186, + "step": 21962 + }, + { + "epoch": 0.66, + "learning_rate": 1.3568487883623662e-06, + "loss": 1.1481, + "step": 21963 + }, + { + "epoch": 0.66, + "learning_rate": 1.3566318677015937e-06, + "loss": 1.0364, + "step": 21964 + }, + { + "epoch": 0.66, + "learning_rate": 1.3564149579251345e-06, + "loss": 1.078, + "step": 21965 + }, + { + "epoch": 0.66, + "learning_rate": 1.3561980590350543e-06, + "loss": 1.1926, + "step": 21966 + }, + { + "epoch": 0.66, + "learning_rate": 1.3559811710334176e-06, + "loss": 1.1703, + "step": 21967 + }, + { + "epoch": 0.66, + "learning_rate": 1.355764293922289e-06, + "loss": 1.0821, + "step": 21968 + }, + { + "epoch": 0.66, + "learning_rate": 1.3555474277037342e-06, + "loss": 1.2199, + "step": 21969 + }, + { + "epoch": 0.66, + "learning_rate": 1.3553305723798158e-06, + "loss": 1.1071, + "step": 21970 + }, + { + "epoch": 0.66, + "learning_rate": 1.355113727952599e-06, + "loss": 1.1069, + "step": 21971 + }, + { + "epoch": 0.66, + "learning_rate": 1.354896894424148e-06, + "loss": 1.0554, + "step": 21972 + }, + { + "epoch": 0.66, + "learning_rate": 1.3546800717965283e-06, + "loss": 1.1044, + "step": 21973 + }, + { + "epoch": 0.66, + "learning_rate": 1.3544632600718015e-06, + "loss": 1.0403, + "step": 21974 + }, + { + "epoch": 0.66, + "learning_rate": 1.3542464592520333e-06, + "loss": 1.1334, + "step": 21975 + }, + { + "epoch": 0.66, + "learning_rate": 1.3540296693392863e-06, + "loss": 1.0997, + "step": 21976 + }, + { + "epoch": 0.66, + "learning_rate": 1.3538128903356262e-06, + "loss": 0.9975, + "step": 21977 + }, + { + "epoch": 0.66, + "learning_rate": 1.3535961222431143e-06, + "loss": 1.0865, + "step": 21978 + }, + { + "epoch": 0.66, + "learning_rate": 1.3533793650638155e-06, + "loss": 1.1127, + "step": 21979 + }, + { + "epoch": 0.66, + "learning_rate": 1.3531626187997926e-06, + "loss": 1.1123, + "step": 21980 + }, + { + "epoch": 0.66, + "learning_rate": 1.3529458834531092e-06, + "loss": 1.1777, + "step": 21981 + }, + { + "epoch": 0.66, + "learning_rate": 1.3527291590258288e-06, + "loss": 1.0955, + "step": 21982 + }, + { + "epoch": 0.66, + "learning_rate": 1.352512445520014e-06, + "loss": 1.1564, + "step": 21983 + }, + { + "epoch": 0.66, + "learning_rate": 1.3522957429377281e-06, + "loss": 1.1238, + "step": 21984 + }, + { + "epoch": 0.66, + "learning_rate": 1.352079051281035e-06, + "loss": 1.0859, + "step": 21985 + }, + { + "epoch": 0.66, + "learning_rate": 1.3518623705519957e-06, + "loss": 1.1505, + "step": 21986 + }, + { + "epoch": 0.66, + "learning_rate": 1.3516457007526733e-06, + "loss": 1.0976, + "step": 21987 + }, + { + "epoch": 0.66, + "learning_rate": 1.351429041885131e-06, + "loss": 1.1423, + "step": 21988 + }, + { + "epoch": 0.66, + "learning_rate": 1.351212393951431e-06, + "loss": 1.1282, + "step": 21989 + }, + { + "epoch": 0.66, + "learning_rate": 1.350995756953637e-06, + "loss": 1.0439, + "step": 21990 + }, + { + "epoch": 0.66, + "learning_rate": 1.3507791308938086e-06, + "loss": 1.1386, + "step": 21991 + }, + { + "epoch": 0.66, + "learning_rate": 1.3505625157740095e-06, + "loss": 1.1218, + "step": 21992 + }, + { + "epoch": 0.66, + "learning_rate": 1.3503459115963019e-06, + "loss": 1.1441, + "step": 21993 + }, + { + "epoch": 0.66, + "learning_rate": 1.3501293183627472e-06, + "loss": 1.0747, + "step": 21994 + }, + { + "epoch": 0.66, + "learning_rate": 1.3499127360754088e-06, + "loss": 1.0696, + "step": 21995 + }, + { + "epoch": 0.66, + "learning_rate": 1.349696164736346e-06, + "loss": 1.1204, + "step": 21996 + }, + { + "epoch": 0.66, + "learning_rate": 1.3494796043476222e-06, + "loss": 1.2415, + "step": 21997 + }, + { + "epoch": 0.66, + "learning_rate": 1.3492630549112981e-06, + "loss": 1.0812, + "step": 21998 + }, + { + "epoch": 0.66, + "learning_rate": 1.3490465164294365e-06, + "loss": 1.1214, + "step": 21999 + }, + { + "epoch": 0.66, + "learning_rate": 1.3488299889040968e-06, + "loss": 1.0505, + "step": 22000 + }, + { + "epoch": 0.66, + "learning_rate": 1.348613472337341e-06, + "loss": 1.1155, + "step": 22001 + }, + { + "epoch": 0.66, + "learning_rate": 1.3483969667312307e-06, + "loss": 1.1732, + "step": 22002 + }, + { + "epoch": 0.66, + "learning_rate": 1.3481804720878277e-06, + "loss": 1.0907, + "step": 22003 + }, + { + "epoch": 0.66, + "learning_rate": 1.3479639884091905e-06, + "loss": 1.1762, + "step": 22004 + }, + { + "epoch": 0.66, + "learning_rate": 1.3477475156973818e-06, + "loss": 1.1987, + "step": 22005 + }, + { + "epoch": 0.66, + "learning_rate": 1.3475310539544614e-06, + "loss": 1.1015, + "step": 22006 + }, + { + "epoch": 0.66, + "learning_rate": 1.3473146031824904e-06, + "loss": 1.2322, + "step": 22007 + }, + { + "epoch": 0.66, + "learning_rate": 1.3470981633835302e-06, + "loss": 1.1991, + "step": 22008 + }, + { + "epoch": 0.66, + "learning_rate": 1.3468817345596393e-06, + "loss": 1.1193, + "step": 22009 + }, + { + "epoch": 0.66, + "learning_rate": 1.346665316712879e-06, + "loss": 1.083, + "step": 22010 + }, + { + "epoch": 0.66, + "learning_rate": 1.3464489098453092e-06, + "loss": 1.0375, + "step": 22011 + }, + { + "epoch": 0.66, + "learning_rate": 1.3462325139589904e-06, + "loss": 1.0447, + "step": 22012 + }, + { + "epoch": 0.66, + "learning_rate": 1.3460161290559826e-06, + "loss": 1.0804, + "step": 22013 + }, + { + "epoch": 0.66, + "learning_rate": 1.345799755138345e-06, + "loss": 1.2101, + "step": 22014 + }, + { + "epoch": 0.66, + "learning_rate": 1.345583392208138e-06, + "loss": 1.0576, + "step": 22015 + }, + { + "epoch": 0.66, + "learning_rate": 1.3453670402674224e-06, + "loss": 1.1447, + "step": 22016 + }, + { + "epoch": 0.66, + "learning_rate": 1.345150699318255e-06, + "loss": 1.1185, + "step": 22017 + }, + { + "epoch": 0.66, + "learning_rate": 1.344934369362697e-06, + "loss": 1.1591, + "step": 22018 + }, + { + "epoch": 0.66, + "learning_rate": 1.3447180504028076e-06, + "loss": 1.0989, + "step": 22019 + }, + { + "epoch": 0.66, + "learning_rate": 1.344501742440646e-06, + "loss": 1.1259, + "step": 22020 + }, + { + "epoch": 0.66, + "learning_rate": 1.3442854454782723e-06, + "loss": 1.0745, + "step": 22021 + }, + { + "epoch": 0.66, + "learning_rate": 1.344069159517743e-06, + "loss": 1.0264, + "step": 22022 + }, + { + "epoch": 0.66, + "learning_rate": 1.3438528845611192e-06, + "loss": 1.108, + "step": 22023 + }, + { + "epoch": 0.66, + "learning_rate": 1.343636620610459e-06, + "loss": 1.1683, + "step": 22024 + }, + { + "epoch": 0.66, + "learning_rate": 1.343420367667822e-06, + "loss": 1.124, + "step": 22025 + }, + { + "epoch": 0.66, + "learning_rate": 1.3432041257352652e-06, + "loss": 0.9772, + "step": 22026 + }, + { + "epoch": 0.66, + "learning_rate": 1.3429878948148485e-06, + "loss": 1.1406, + "step": 22027 + }, + { + "epoch": 0.66, + "learning_rate": 1.342771674908629e-06, + "loss": 1.0552, + "step": 22028 + }, + { + "epoch": 0.66, + "learning_rate": 1.342555466018667e-06, + "loss": 1.0937, + "step": 22029 + }, + { + "epoch": 0.66, + "learning_rate": 1.3423392681470189e-06, + "loss": 1.2874, + "step": 22030 + }, + { + "epoch": 0.66, + "learning_rate": 1.342123081295743e-06, + "loss": 1.274, + "step": 22031 + }, + { + "epoch": 0.66, + "learning_rate": 1.341906905466898e-06, + "loss": 1.1363, + "step": 22032 + }, + { + "epoch": 0.66, + "learning_rate": 1.3416907406625414e-06, + "loss": 1.0245, + "step": 22033 + }, + { + "epoch": 0.66, + "learning_rate": 1.3414745868847324e-06, + "loss": 1.0848, + "step": 22034 + }, + { + "epoch": 0.66, + "learning_rate": 1.341258444135526e-06, + "loss": 1.1351, + "step": 22035 + }, + { + "epoch": 0.66, + "learning_rate": 1.341042312416981e-06, + "loss": 1.2012, + "step": 22036 + }, + { + "epoch": 0.66, + "learning_rate": 1.3408261917311554e-06, + "loss": 1.1346, + "step": 22037 + }, + { + "epoch": 0.66, + "learning_rate": 1.340610082080106e-06, + "loss": 1.0383, + "step": 22038 + }, + { + "epoch": 0.66, + "learning_rate": 1.3403939834658901e-06, + "loss": 1.1093, + "step": 22039 + }, + { + "epoch": 0.66, + "learning_rate": 1.3401778958905654e-06, + "loss": 1.2042, + "step": 22040 + }, + { + "epoch": 0.66, + "learning_rate": 1.3399618193561881e-06, + "loss": 1.1349, + "step": 22041 + }, + { + "epoch": 0.66, + "learning_rate": 1.3397457538648167e-06, + "loss": 1.0535, + "step": 22042 + }, + { + "epoch": 0.66, + "learning_rate": 1.339529699418506e-06, + "loss": 1.0634, + "step": 22043 + }, + { + "epoch": 0.66, + "learning_rate": 1.3393136560193136e-06, + "loss": 1.2299, + "step": 22044 + }, + { + "epoch": 0.66, + "learning_rate": 1.3390976236692962e-06, + "loss": 1.1764, + "step": 22045 + }, + { + "epoch": 0.66, + "learning_rate": 1.3388816023705104e-06, + "loss": 1.0589, + "step": 22046 + }, + { + "epoch": 0.66, + "learning_rate": 1.3386655921250135e-06, + "loss": 1.0656, + "step": 22047 + }, + { + "epoch": 0.66, + "learning_rate": 1.3384495929348598e-06, + "loss": 1.1565, + "step": 22048 + }, + { + "epoch": 0.66, + "learning_rate": 1.3382336048021066e-06, + "loss": 1.1664, + "step": 22049 + }, + { + "epoch": 0.66, + "learning_rate": 1.3380176277288098e-06, + "loss": 1.0164, + "step": 22050 + }, + { + "epoch": 0.66, + "learning_rate": 1.337801661717027e-06, + "loss": 1.1502, + "step": 22051 + }, + { + "epoch": 0.66, + "learning_rate": 1.3375857067688113e-06, + "loss": 1.1476, + "step": 22052 + }, + { + "epoch": 0.66, + "learning_rate": 1.3373697628862198e-06, + "loss": 1.0825, + "step": 22053 + }, + { + "epoch": 0.66, + "learning_rate": 1.3371538300713082e-06, + "loss": 1.2035, + "step": 22054 + }, + { + "epoch": 0.66, + "learning_rate": 1.336937908326133e-06, + "loss": 1.3126, + "step": 22055 + }, + { + "epoch": 0.66, + "learning_rate": 1.3367219976527483e-06, + "loss": 1.1717, + "step": 22056 + }, + { + "epoch": 0.66, + "learning_rate": 1.3365060980532097e-06, + "loss": 1.1121, + "step": 22057 + }, + { + "epoch": 0.66, + "learning_rate": 1.3362902095295722e-06, + "loss": 1.0311, + "step": 22058 + }, + { + "epoch": 0.66, + "learning_rate": 1.3360743320838921e-06, + "loss": 1.0226, + "step": 22059 + }, + { + "epoch": 0.66, + "learning_rate": 1.3358584657182244e-06, + "loss": 1.046, + "step": 22060 + }, + { + "epoch": 0.66, + "learning_rate": 1.3356426104346223e-06, + "loss": 1.1133, + "step": 22061 + }, + { + "epoch": 0.66, + "learning_rate": 1.3354267662351421e-06, + "loss": 1.1337, + "step": 22062 + }, + { + "epoch": 0.66, + "learning_rate": 1.3352109331218382e-06, + "loss": 1.0856, + "step": 22063 + }, + { + "epoch": 0.66, + "learning_rate": 1.3349951110967651e-06, + "loss": 1.0908, + "step": 22064 + }, + { + "epoch": 0.66, + "learning_rate": 1.3347793001619775e-06, + "loss": 1.0699, + "step": 22065 + }, + { + "epoch": 0.66, + "learning_rate": 1.3345635003195299e-06, + "loss": 1.0872, + "step": 22066 + }, + { + "epoch": 0.66, + "learning_rate": 1.334347711571477e-06, + "loss": 1.0105, + "step": 22067 + }, + { + "epoch": 0.66, + "learning_rate": 1.3341319339198722e-06, + "loss": 1.0496, + "step": 22068 + }, + { + "epoch": 0.66, + "learning_rate": 1.3339161673667694e-06, + "loss": 1.0654, + "step": 22069 + }, + { + "epoch": 0.66, + "learning_rate": 1.3337004119142234e-06, + "loss": 1.0559, + "step": 22070 + }, + { + "epoch": 0.66, + "learning_rate": 1.3334846675642874e-06, + "loss": 1.0215, + "step": 22071 + }, + { + "epoch": 0.66, + "learning_rate": 1.333268934319017e-06, + "loss": 1.0455, + "step": 22072 + }, + { + "epoch": 0.66, + "learning_rate": 1.333053212180463e-06, + "loss": 1.0976, + "step": 22073 + }, + { + "epoch": 0.66, + "learning_rate": 1.3328375011506805e-06, + "loss": 1.0839, + "step": 22074 + }, + { + "epoch": 0.67, + "learning_rate": 1.332621801231723e-06, + "loss": 1.1708, + "step": 22075 + }, + { + "epoch": 0.67, + "learning_rate": 1.3324061124256437e-06, + "loss": 1.095, + "step": 22076 + }, + { + "epoch": 0.67, + "learning_rate": 1.3321904347344965e-06, + "loss": 0.9979, + "step": 22077 + }, + { + "epoch": 0.67, + "learning_rate": 1.3319747681603335e-06, + "loss": 1.0496, + "step": 22078 + }, + { + "epoch": 0.67, + "learning_rate": 1.3317591127052079e-06, + "loss": 1.1465, + "step": 22079 + }, + { + "epoch": 0.67, + "learning_rate": 1.331543468371173e-06, + "loss": 1.1226, + "step": 22080 + }, + { + "epoch": 0.67, + "learning_rate": 1.3313278351602823e-06, + "loss": 1.1447, + "step": 22081 + }, + { + "epoch": 0.67, + "learning_rate": 1.3311122130745868e-06, + "loss": 1.0963, + "step": 22082 + }, + { + "epoch": 0.67, + "learning_rate": 1.3308966021161405e-06, + "loss": 1.1321, + "step": 22083 + }, + { + "epoch": 0.67, + "learning_rate": 1.330681002286995e-06, + "loss": 1.0722, + "step": 22084 + }, + { + "epoch": 0.67, + "learning_rate": 1.3304654135892042e-06, + "loss": 1.1465, + "step": 22085 + }, + { + "epoch": 0.67, + "learning_rate": 1.3302498360248188e-06, + "loss": 1.1698, + "step": 22086 + }, + { + "epoch": 0.67, + "learning_rate": 1.3300342695958912e-06, + "loss": 1.098, + "step": 22087 + }, + { + "epoch": 0.67, + "learning_rate": 1.3298187143044743e-06, + "loss": 1.0726, + "step": 22088 + }, + { + "epoch": 0.67, + "learning_rate": 1.3296031701526195e-06, + "loss": 1.0403, + "step": 22089 + }, + { + "epoch": 0.67, + "learning_rate": 1.3293876371423798e-06, + "loss": 1.1078, + "step": 22090 + }, + { + "epoch": 0.67, + "learning_rate": 1.3291721152758046e-06, + "loss": 1.0444, + "step": 22091 + }, + { + "epoch": 0.67, + "learning_rate": 1.3289566045549474e-06, + "loss": 1.2599, + "step": 22092 + }, + { + "epoch": 0.67, + "learning_rate": 1.3287411049818593e-06, + "loss": 1.1418, + "step": 22093 + }, + { + "epoch": 0.67, + "learning_rate": 1.3285256165585916e-06, + "loss": 1.0919, + "step": 22094 + }, + { + "epoch": 0.67, + "learning_rate": 1.3283101392871961e-06, + "loss": 1.1115, + "step": 22095 + }, + { + "epoch": 0.67, + "learning_rate": 1.3280946731697237e-06, + "loss": 1.138, + "step": 22096 + }, + { + "epoch": 0.67, + "learning_rate": 1.3278792182082257e-06, + "loss": 1.1158, + "step": 22097 + }, + { + "epoch": 0.67, + "learning_rate": 1.3276637744047535e-06, + "loss": 1.233, + "step": 22098 + }, + { + "epoch": 0.67, + "learning_rate": 1.3274483417613572e-06, + "loss": 1.2217, + "step": 22099 + }, + { + "epoch": 0.67, + "learning_rate": 1.3272329202800877e-06, + "loss": 1.1821, + "step": 22100 + }, + { + "epoch": 0.67, + "learning_rate": 1.3270175099629956e-06, + "loss": 1.1104, + "step": 22101 + }, + { + "epoch": 0.67, + "learning_rate": 1.3268021108121324e-06, + "loss": 1.1301, + "step": 22102 + }, + { + "epoch": 0.67, + "learning_rate": 1.3265867228295487e-06, + "loss": 1.06, + "step": 22103 + }, + { + "epoch": 0.67, + "learning_rate": 1.3263713460172936e-06, + "loss": 1.1423, + "step": 22104 + }, + { + "epoch": 0.67, + "learning_rate": 1.3261559803774179e-06, + "loss": 1.1444, + "step": 22105 + }, + { + "epoch": 0.67, + "learning_rate": 1.325940625911972e-06, + "loss": 1.1414, + "step": 22106 + }, + { + "epoch": 0.67, + "learning_rate": 1.3257252826230068e-06, + "loss": 1.0753, + "step": 22107 + }, + { + "epoch": 0.67, + "learning_rate": 1.3255099505125705e-06, + "loss": 1.1736, + "step": 22108 + }, + { + "epoch": 0.67, + "learning_rate": 1.3252946295827135e-06, + "loss": 1.0784, + "step": 22109 + }, + { + "epoch": 0.67, + "learning_rate": 1.325079319835486e-06, + "loss": 1.1678, + "step": 22110 + }, + { + "epoch": 0.67, + "learning_rate": 1.3248640212729388e-06, + "loss": 1.2104, + "step": 22111 + }, + { + "epoch": 0.67, + "learning_rate": 1.324648733897119e-06, + "loss": 1.1633, + "step": 22112 + }, + { + "epoch": 0.67, + "learning_rate": 1.324433457710077e-06, + "loss": 1.0764, + "step": 22113 + }, + { + "epoch": 0.67, + "learning_rate": 1.3242181927138625e-06, + "loss": 1.0839, + "step": 22114 + }, + { + "epoch": 0.67, + "learning_rate": 1.3240029389105246e-06, + "loss": 1.1501, + "step": 22115 + }, + { + "epoch": 0.67, + "learning_rate": 1.3237876963021131e-06, + "loss": 1.046, + "step": 22116 + }, + { + "epoch": 0.67, + "learning_rate": 1.3235724648906757e-06, + "loss": 1.0259, + "step": 22117 + }, + { + "epoch": 0.67, + "learning_rate": 1.323357244678261e-06, + "loss": 1.1357, + "step": 22118 + }, + { + "epoch": 0.67, + "learning_rate": 1.3231420356669194e-06, + "loss": 1.1792, + "step": 22119 + }, + { + "epoch": 0.67, + "learning_rate": 1.3229268378586984e-06, + "loss": 1.1404, + "step": 22120 + }, + { + "epoch": 0.67, + "learning_rate": 1.3227116512556473e-06, + "loss": 1.012, + "step": 22121 + }, + { + "epoch": 0.67, + "learning_rate": 1.3224964758598141e-06, + "loss": 1.1798, + "step": 22122 + }, + { + "epoch": 0.67, + "learning_rate": 1.3222813116732475e-06, + "loss": 1.0793, + "step": 22123 + }, + { + "epoch": 0.67, + "learning_rate": 1.3220661586979965e-06, + "loss": 1.14, + "step": 22124 + }, + { + "epoch": 0.67, + "learning_rate": 1.3218510169361073e-06, + "loss": 1.1265, + "step": 22125 + }, + { + "epoch": 0.67, + "learning_rate": 1.3216358863896291e-06, + "loss": 1.0627, + "step": 22126 + }, + { + "epoch": 0.67, + "learning_rate": 1.3214207670606099e-06, + "loss": 1.0853, + "step": 22127 + }, + { + "epoch": 0.67, + "learning_rate": 1.3212056589510968e-06, + "loss": 1.0153, + "step": 22128 + }, + { + "epoch": 0.67, + "learning_rate": 1.3209905620631397e-06, + "loss": 1.0968, + "step": 22129 + }, + { + "epoch": 0.67, + "learning_rate": 1.3207754763987834e-06, + "loss": 1.2183, + "step": 22130 + }, + { + "epoch": 0.67, + "learning_rate": 1.3205604019600764e-06, + "loss": 1.2093, + "step": 22131 + }, + { + "epoch": 0.67, + "learning_rate": 1.3203453387490666e-06, + "loss": 1.1431, + "step": 22132 + }, + { + "epoch": 0.67, + "learning_rate": 1.3201302867678024e-06, + "loss": 1.1323, + "step": 22133 + }, + { + "epoch": 0.67, + "learning_rate": 1.319915246018328e-06, + "loss": 1.0429, + "step": 22134 + }, + { + "epoch": 0.67, + "learning_rate": 1.3197002165026922e-06, + "loss": 1.0264, + "step": 22135 + }, + { + "epoch": 0.67, + "learning_rate": 1.3194851982229424e-06, + "loss": 1.1179, + "step": 22136 + }, + { + "epoch": 0.67, + "learning_rate": 1.3192701911811253e-06, + "loss": 1.14, + "step": 22137 + }, + { + "epoch": 0.67, + "learning_rate": 1.3190551953792867e-06, + "loss": 1.1257, + "step": 22138 + }, + { + "epoch": 0.67, + "learning_rate": 1.3188402108194736e-06, + "loss": 1.0963, + "step": 22139 + }, + { + "epoch": 0.67, + "learning_rate": 1.3186252375037334e-06, + "loss": 1.0369, + "step": 22140 + }, + { + "epoch": 0.67, + "learning_rate": 1.3184102754341116e-06, + "loss": 1.0801, + "step": 22141 + }, + { + "epoch": 0.67, + "learning_rate": 1.3181953246126555e-06, + "loss": 1.1733, + "step": 22142 + }, + { + "epoch": 0.67, + "learning_rate": 1.3179803850414102e-06, + "loss": 1.1389, + "step": 22143 + }, + { + "epoch": 0.67, + "learning_rate": 1.3177654567224225e-06, + "loss": 1.0507, + "step": 22144 + }, + { + "epoch": 0.67, + "learning_rate": 1.317550539657738e-06, + "loss": 1.0619, + "step": 22145 + }, + { + "epoch": 0.67, + "learning_rate": 1.3173356338494028e-06, + "loss": 1.0754, + "step": 22146 + }, + { + "epoch": 0.67, + "learning_rate": 1.3171207392994628e-06, + "loss": 0.998, + "step": 22147 + }, + { + "epoch": 0.67, + "learning_rate": 1.316905856009964e-06, + "loss": 1.0679, + "step": 22148 + }, + { + "epoch": 0.67, + "learning_rate": 1.316690983982951e-06, + "loss": 1.1926, + "step": 22149 + }, + { + "epoch": 0.67, + "learning_rate": 1.3164761232204716e-06, + "loss": 0.937, + "step": 22150 + }, + { + "epoch": 0.67, + "learning_rate": 1.3162612737245683e-06, + "loss": 1.045, + "step": 22151 + }, + { + "epoch": 0.67, + "learning_rate": 1.3160464354972873e-06, + "loss": 1.1536, + "step": 22152 + }, + { + "epoch": 0.67, + "learning_rate": 1.3158316085406745e-06, + "loss": 1.2216, + "step": 22153 + }, + { + "epoch": 0.67, + "learning_rate": 1.3156167928567743e-06, + "loss": 1.1122, + "step": 22154 + }, + { + "epoch": 0.67, + "learning_rate": 1.3154019884476327e-06, + "loss": 1.1332, + "step": 22155 + }, + { + "epoch": 0.67, + "learning_rate": 1.3151871953152925e-06, + "loss": 1.0954, + "step": 22156 + }, + { + "epoch": 0.67, + "learning_rate": 1.3149724134617997e-06, + "loss": 1.1279, + "step": 22157 + }, + { + "epoch": 0.67, + "learning_rate": 1.3147576428891989e-06, + "loss": 1.0782, + "step": 22158 + }, + { + "epoch": 0.67, + "learning_rate": 1.3145428835995355e-06, + "loss": 1.1697, + "step": 22159 + }, + { + "epoch": 0.67, + "learning_rate": 1.3143281355948517e-06, + "loss": 1.1581, + "step": 22160 + }, + { + "epoch": 0.67, + "learning_rate": 1.3141133988771932e-06, + "loss": 1.1005, + "step": 22161 + }, + { + "epoch": 0.67, + "learning_rate": 1.3138986734486039e-06, + "loss": 0.958, + "step": 22162 + }, + { + "epoch": 0.67, + "learning_rate": 1.313683959311129e-06, + "loss": 1.0719, + "step": 22163 + }, + { + "epoch": 0.67, + "learning_rate": 1.3134692564668105e-06, + "loss": 1.1192, + "step": 22164 + }, + { + "epoch": 0.67, + "learning_rate": 1.3132545649176934e-06, + "loss": 1.1234, + "step": 22165 + }, + { + "epoch": 0.67, + "learning_rate": 1.313039884665821e-06, + "loss": 1.1715, + "step": 22166 + }, + { + "epoch": 0.67, + "learning_rate": 1.3128252157132376e-06, + "loss": 1.155, + "step": 22167 + }, + { + "epoch": 0.67, + "learning_rate": 1.3126105580619868e-06, + "loss": 1.0906, + "step": 22168 + }, + { + "epoch": 0.67, + "learning_rate": 1.312395911714111e-06, + "loss": 1.1011, + "step": 22169 + }, + { + "epoch": 0.67, + "learning_rate": 1.312181276671654e-06, + "loss": 1.121, + "step": 22170 + }, + { + "epoch": 0.67, + "learning_rate": 1.3119666529366595e-06, + "loss": 1.0916, + "step": 22171 + }, + { + "epoch": 0.67, + "learning_rate": 1.311752040511171e-06, + "loss": 1.1381, + "step": 22172 + }, + { + "epoch": 0.67, + "learning_rate": 1.31153743939723e-06, + "loss": 1.0255, + "step": 22173 + }, + { + "epoch": 0.67, + "learning_rate": 1.31132284959688e-06, + "loss": 1.166, + "step": 22174 + }, + { + "epoch": 0.67, + "learning_rate": 1.3111082711121642e-06, + "loss": 1.0934, + "step": 22175 + }, + { + "epoch": 0.67, + "learning_rate": 1.3108937039451248e-06, + "loss": 1.0748, + "step": 22176 + }, + { + "epoch": 0.67, + "learning_rate": 1.3106791480978047e-06, + "loss": 1.0931, + "step": 22177 + }, + { + "epoch": 0.67, + "learning_rate": 1.3104646035722462e-06, + "loss": 1.035, + "step": 22178 + }, + { + "epoch": 0.67, + "learning_rate": 1.3102500703704923e-06, + "loss": 1.1385, + "step": 22179 + }, + { + "epoch": 0.67, + "learning_rate": 1.3100355484945842e-06, + "loss": 1.2681, + "step": 22180 + }, + { + "epoch": 0.67, + "learning_rate": 1.309821037946566e-06, + "loss": 1.0497, + "step": 22181 + }, + { + "epoch": 0.67, + "learning_rate": 1.3096065387284768e-06, + "loss": 1.0649, + "step": 22182 + }, + { + "epoch": 0.67, + "learning_rate": 1.3093920508423602e-06, + "loss": 1.096, + "step": 22183 + }, + { + "epoch": 0.67, + "learning_rate": 1.309177574290258e-06, + "loss": 1.1543, + "step": 22184 + }, + { + "epoch": 0.67, + "learning_rate": 1.3089631090742128e-06, + "loss": 1.2075, + "step": 22185 + }, + { + "epoch": 0.67, + "learning_rate": 1.3087486551962642e-06, + "loss": 1.1428, + "step": 22186 + }, + { + "epoch": 0.67, + "learning_rate": 1.3085342126584545e-06, + "loss": 1.032, + "step": 22187 + }, + { + "epoch": 0.67, + "learning_rate": 1.3083197814628255e-06, + "loss": 1.0955, + "step": 22188 + }, + { + "epoch": 0.67, + "learning_rate": 1.308105361611419e-06, + "loss": 1.0965, + "step": 22189 + }, + { + "epoch": 0.67, + "learning_rate": 1.3078909531062744e-06, + "loss": 1.1328, + "step": 22190 + }, + { + "epoch": 0.67, + "learning_rate": 1.307676555949434e-06, + "loss": 1.1356, + "step": 22191 + }, + { + "epoch": 0.67, + "learning_rate": 1.3074621701429385e-06, + "loss": 1.1433, + "step": 22192 + }, + { + "epoch": 0.67, + "learning_rate": 1.3072477956888286e-06, + "loss": 1.1979, + "step": 22193 + }, + { + "epoch": 0.67, + "learning_rate": 1.3070334325891464e-06, + "loss": 1.0352, + "step": 22194 + }, + { + "epoch": 0.67, + "learning_rate": 1.3068190808459302e-06, + "loss": 1.1293, + "step": 22195 + }, + { + "epoch": 0.67, + "learning_rate": 1.3066047404612219e-06, + "loss": 1.0235, + "step": 22196 + }, + { + "epoch": 0.67, + "learning_rate": 1.3063904114370617e-06, + "loss": 1.1895, + "step": 22197 + }, + { + "epoch": 0.67, + "learning_rate": 1.3061760937754907e-06, + "loss": 1.096, + "step": 22198 + }, + { + "epoch": 0.67, + "learning_rate": 1.3059617874785476e-06, + "loss": 1.1606, + "step": 22199 + }, + { + "epoch": 0.67, + "learning_rate": 1.3057474925482732e-06, + "loss": 1.0558, + "step": 22200 + }, + { + "epoch": 0.67, + "learning_rate": 1.3055332089867074e-06, + "loss": 1.0503, + "step": 22201 + }, + { + "epoch": 0.67, + "learning_rate": 1.3053189367958903e-06, + "loss": 1.1602, + "step": 22202 + }, + { + "epoch": 0.67, + "learning_rate": 1.3051046759778613e-06, + "loss": 1.0921, + "step": 22203 + }, + { + "epoch": 0.67, + "learning_rate": 1.3048904265346603e-06, + "loss": 1.1198, + "step": 22204 + }, + { + "epoch": 0.67, + "learning_rate": 1.3046761884683273e-06, + "loss": 1.1635, + "step": 22205 + }, + { + "epoch": 0.67, + "learning_rate": 1.3044619617809006e-06, + "loss": 1.1, + "step": 22206 + }, + { + "epoch": 0.67, + "learning_rate": 1.3042477464744218e-06, + "loss": 1.1644, + "step": 22207 + }, + { + "epoch": 0.67, + "learning_rate": 1.3040335425509276e-06, + "loss": 1.1268, + "step": 22208 + }, + { + "epoch": 0.67, + "learning_rate": 1.3038193500124577e-06, + "loss": 1.0648, + "step": 22209 + }, + { + "epoch": 0.67, + "learning_rate": 1.3036051688610518e-06, + "loss": 1.1693, + "step": 22210 + }, + { + "epoch": 0.67, + "learning_rate": 1.3033909990987492e-06, + "loss": 1.202, + "step": 22211 + }, + { + "epoch": 0.67, + "learning_rate": 1.3031768407275868e-06, + "loss": 1.105, + "step": 22212 + }, + { + "epoch": 0.67, + "learning_rate": 1.302962693749605e-06, + "loss": 1.0158, + "step": 22213 + }, + { + "epoch": 0.67, + "learning_rate": 1.3027485581668418e-06, + "loss": 1.1407, + "step": 22214 + }, + { + "epoch": 0.67, + "learning_rate": 1.3025344339813365e-06, + "loss": 1.1387, + "step": 22215 + }, + { + "epoch": 0.67, + "learning_rate": 1.3023203211951258e-06, + "loss": 1.0759, + "step": 22216 + }, + { + "epoch": 0.67, + "learning_rate": 1.3021062198102486e-06, + "loss": 1.0693, + "step": 22217 + }, + { + "epoch": 0.67, + "learning_rate": 1.3018921298287435e-06, + "loss": 1.1133, + "step": 22218 + }, + { + "epoch": 0.67, + "learning_rate": 1.301678051252648e-06, + "loss": 1.0798, + "step": 22219 + }, + { + "epoch": 0.67, + "learning_rate": 1.3014639840840015e-06, + "loss": 1.1681, + "step": 22220 + }, + { + "epoch": 0.67, + "learning_rate": 1.3012499283248397e-06, + "loss": 1.1669, + "step": 22221 + }, + { + "epoch": 0.67, + "learning_rate": 1.3010358839772011e-06, + "loss": 1.2258, + "step": 22222 + }, + { + "epoch": 0.67, + "learning_rate": 1.3008218510431236e-06, + "loss": 1.1819, + "step": 22223 + }, + { + "epoch": 0.67, + "learning_rate": 1.3006078295246454e-06, + "loss": 1.1669, + "step": 22224 + }, + { + "epoch": 0.67, + "learning_rate": 1.300393819423802e-06, + "loss": 1.2757, + "step": 22225 + }, + { + "epoch": 0.67, + "learning_rate": 1.300179820742632e-06, + "loss": 1.1293, + "step": 22226 + }, + { + "epoch": 0.67, + "learning_rate": 1.2999658334831718e-06, + "loss": 1.179, + "step": 22227 + }, + { + "epoch": 0.67, + "learning_rate": 1.2997518576474593e-06, + "loss": 1.0833, + "step": 22228 + }, + { + "epoch": 0.67, + "learning_rate": 1.2995378932375308e-06, + "loss": 1.1406, + "step": 22229 + }, + { + "epoch": 0.67, + "learning_rate": 1.2993239402554236e-06, + "loss": 0.9881, + "step": 22230 + }, + { + "epoch": 0.67, + "learning_rate": 1.2991099987031742e-06, + "loss": 1.1295, + "step": 22231 + }, + { + "epoch": 0.67, + "learning_rate": 1.29889606858282e-06, + "loss": 1.1173, + "step": 22232 + }, + { + "epoch": 0.67, + "learning_rate": 1.2986821498963958e-06, + "loss": 1.1003, + "step": 22233 + }, + { + "epoch": 0.67, + "learning_rate": 1.2984682426459388e-06, + "loss": 1.1024, + "step": 22234 + }, + { + "epoch": 0.67, + "learning_rate": 1.298254346833486e-06, + "loss": 1.1473, + "step": 22235 + }, + { + "epoch": 0.67, + "learning_rate": 1.2980404624610726e-06, + "loss": 1.149, + "step": 22236 + }, + { + "epoch": 0.67, + "learning_rate": 1.2978265895307363e-06, + "loss": 1.1375, + "step": 22237 + }, + { + "epoch": 0.67, + "learning_rate": 1.2976127280445108e-06, + "loss": 1.0438, + "step": 22238 + }, + { + "epoch": 0.67, + "learning_rate": 1.2973988780044334e-06, + "loss": 1.0008, + "step": 22239 + }, + { + "epoch": 0.67, + "learning_rate": 1.297185039412539e-06, + "loss": 0.9544, + "step": 22240 + }, + { + "epoch": 0.67, + "learning_rate": 1.296971212270865e-06, + "loss": 1.1687, + "step": 22241 + }, + { + "epoch": 0.67, + "learning_rate": 1.2967573965814446e-06, + "loss": 1.1274, + "step": 22242 + }, + { + "epoch": 0.67, + "learning_rate": 1.296543592346314e-06, + "loss": 1.1724, + "step": 22243 + }, + { + "epoch": 0.67, + "learning_rate": 1.2963297995675089e-06, + "loss": 1.2339, + "step": 22244 + }, + { + "epoch": 0.67, + "learning_rate": 1.2961160182470647e-06, + "loss": 1.0568, + "step": 22245 + }, + { + "epoch": 0.67, + "learning_rate": 1.295902248387017e-06, + "loss": 1.1567, + "step": 22246 + }, + { + "epoch": 0.67, + "learning_rate": 1.295688489989399e-06, + "loss": 1.1395, + "step": 22247 + }, + { + "epoch": 0.67, + "learning_rate": 1.2954747430562465e-06, + "loss": 1.1824, + "step": 22248 + }, + { + "epoch": 0.67, + "learning_rate": 1.2952610075895945e-06, + "loss": 1.0301, + "step": 22249 + }, + { + "epoch": 0.67, + "learning_rate": 1.2950472835914784e-06, + "loss": 1.0909, + "step": 22250 + }, + { + "epoch": 0.67, + "learning_rate": 1.2948335710639309e-06, + "loss": 1.1102, + "step": 22251 + }, + { + "epoch": 0.67, + "learning_rate": 1.2946198700089874e-06, + "loss": 1.0816, + "step": 22252 + }, + { + "epoch": 0.67, + "learning_rate": 1.294406180428682e-06, + "loss": 1.0491, + "step": 22253 + }, + { + "epoch": 0.67, + "learning_rate": 1.29419250232505e-06, + "loss": 1.184, + "step": 22254 + }, + { + "epoch": 0.67, + "learning_rate": 1.293978835700124e-06, + "loss": 1.0838, + "step": 22255 + }, + { + "epoch": 0.67, + "learning_rate": 1.2937651805559388e-06, + "loss": 1.0694, + "step": 22256 + }, + { + "epoch": 0.67, + "learning_rate": 1.2935515368945275e-06, + "loss": 1.0904, + "step": 22257 + }, + { + "epoch": 0.67, + "learning_rate": 1.293337904717925e-06, + "loss": 1.0937, + "step": 22258 + }, + { + "epoch": 0.67, + "learning_rate": 1.2931242840281644e-06, + "loss": 1.1373, + "step": 22259 + }, + { + "epoch": 0.67, + "learning_rate": 1.2929106748272794e-06, + "loss": 1.0228, + "step": 22260 + }, + { + "epoch": 0.67, + "learning_rate": 1.2926970771173033e-06, + "loss": 1.087, + "step": 22261 + }, + { + "epoch": 0.67, + "learning_rate": 1.2924834909002698e-06, + "loss": 1.1514, + "step": 22262 + }, + { + "epoch": 0.67, + "learning_rate": 1.2922699161782126e-06, + "loss": 1.0674, + "step": 22263 + }, + { + "epoch": 0.67, + "learning_rate": 1.2920563529531632e-06, + "loss": 1.151, + "step": 22264 + }, + { + "epoch": 0.67, + "learning_rate": 1.2918428012271556e-06, + "loss": 1.1391, + "step": 22265 + }, + { + "epoch": 0.67, + "learning_rate": 1.291629261002223e-06, + "loss": 1.1081, + "step": 22266 + }, + { + "epoch": 0.67, + "learning_rate": 1.2914157322803983e-06, + "loss": 1.183, + "step": 22267 + }, + { + "epoch": 0.67, + "learning_rate": 1.2912022150637133e-06, + "loss": 1.1817, + "step": 22268 + }, + { + "epoch": 0.67, + "learning_rate": 1.2909887093542006e-06, + "loss": 1.1411, + "step": 22269 + }, + { + "epoch": 0.67, + "learning_rate": 1.2907752151538932e-06, + "loss": 1.1991, + "step": 22270 + }, + { + "epoch": 0.67, + "learning_rate": 1.2905617324648244e-06, + "loss": 1.1233, + "step": 22271 + }, + { + "epoch": 0.67, + "learning_rate": 1.2903482612890244e-06, + "loss": 1.1224, + "step": 22272 + }, + { + "epoch": 0.67, + "learning_rate": 1.2901348016285265e-06, + "loss": 1.0441, + "step": 22273 + }, + { + "epoch": 0.67, + "learning_rate": 1.2899213534853624e-06, + "loss": 1.1248, + "step": 22274 + }, + { + "epoch": 0.67, + "learning_rate": 1.2897079168615645e-06, + "loss": 1.167, + "step": 22275 + }, + { + "epoch": 0.67, + "learning_rate": 1.289494491759165e-06, + "loss": 1.1724, + "step": 22276 + }, + { + "epoch": 0.67, + "learning_rate": 1.289281078180194e-06, + "loss": 1.1559, + "step": 22277 + }, + { + "epoch": 0.67, + "learning_rate": 1.2890676761266843e-06, + "loss": 1.0523, + "step": 22278 + }, + { + "epoch": 0.67, + "learning_rate": 1.288854285600667e-06, + "loss": 1.0917, + "step": 22279 + }, + { + "epoch": 0.67, + "learning_rate": 1.2886409066041744e-06, + "loss": 0.9974, + "step": 22280 + }, + { + "epoch": 0.67, + "learning_rate": 1.2884275391392362e-06, + "loss": 1.0225, + "step": 22281 + }, + { + "epoch": 0.67, + "learning_rate": 1.2882141832078842e-06, + "loss": 1.1248, + "step": 22282 + }, + { + "epoch": 0.67, + "learning_rate": 1.2880008388121494e-06, + "loss": 1.1046, + "step": 22283 + }, + { + "epoch": 0.67, + "learning_rate": 1.2877875059540635e-06, + "loss": 1.0726, + "step": 22284 + }, + { + "epoch": 0.67, + "learning_rate": 1.287574184635656e-06, + "loss": 1.1389, + "step": 22285 + }, + { + "epoch": 0.67, + "learning_rate": 1.2873608748589589e-06, + "loss": 1.1449, + "step": 22286 + }, + { + "epoch": 0.67, + "learning_rate": 1.2871475766260017e-06, + "loss": 1.169, + "step": 22287 + }, + { + "epoch": 0.67, + "learning_rate": 1.286934289938816e-06, + "loss": 1.1645, + "step": 22288 + }, + { + "epoch": 0.67, + "learning_rate": 1.2867210147994321e-06, + "loss": 1.0855, + "step": 22289 + }, + { + "epoch": 0.67, + "learning_rate": 1.2865077512098788e-06, + "loss": 1.0854, + "step": 22290 + }, + { + "epoch": 0.67, + "learning_rate": 1.286294499172188e-06, + "loss": 1.1521, + "step": 22291 + }, + { + "epoch": 0.67, + "learning_rate": 1.2860812586883884e-06, + "loss": 1.0928, + "step": 22292 + }, + { + "epoch": 0.67, + "learning_rate": 1.2858680297605117e-06, + "loss": 1.2197, + "step": 22293 + }, + { + "epoch": 0.67, + "learning_rate": 1.2856548123905858e-06, + "loss": 1.1119, + "step": 22294 + }, + { + "epoch": 0.67, + "learning_rate": 1.2854416065806408e-06, + "loss": 1.0723, + "step": 22295 + }, + { + "epoch": 0.67, + "learning_rate": 1.2852284123327073e-06, + "loss": 1.1687, + "step": 22296 + }, + { + "epoch": 0.67, + "learning_rate": 1.285015229648815e-06, + "loss": 1.1152, + "step": 22297 + }, + { + "epoch": 0.67, + "learning_rate": 1.2848020585309912e-06, + "loss": 1.0977, + "step": 22298 + }, + { + "epoch": 0.67, + "learning_rate": 1.2845888989812673e-06, + "loss": 1.2162, + "step": 22299 + }, + { + "epoch": 0.67, + "learning_rate": 1.2843757510016712e-06, + "loss": 1.0663, + "step": 22300 + }, + { + "epoch": 0.67, + "learning_rate": 1.2841626145942326e-06, + "loss": 1.171, + "step": 22301 + }, + { + "epoch": 0.67, + "learning_rate": 1.2839494897609811e-06, + "loss": 1.0694, + "step": 22302 + }, + { + "epoch": 0.67, + "learning_rate": 1.283736376503944e-06, + "loss": 1.1304, + "step": 22303 + }, + { + "epoch": 0.67, + "learning_rate": 1.283523274825151e-06, + "loss": 1.152, + "step": 22304 + }, + { + "epoch": 0.67, + "learning_rate": 1.2833101847266305e-06, + "loss": 1.1376, + "step": 22305 + }, + { + "epoch": 0.67, + "learning_rate": 1.283097106210412e-06, + "loss": 1.2144, + "step": 22306 + }, + { + "epoch": 0.67, + "learning_rate": 1.2828840392785218e-06, + "loss": 1.1374, + "step": 22307 + }, + { + "epoch": 0.67, + "learning_rate": 1.2826709839329893e-06, + "loss": 1.0244, + "step": 22308 + }, + { + "epoch": 0.67, + "learning_rate": 1.282457940175843e-06, + "loss": 1.097, + "step": 22309 + }, + { + "epoch": 0.67, + "learning_rate": 1.2822449080091107e-06, + "loss": 1.1774, + "step": 22310 + }, + { + "epoch": 0.67, + "learning_rate": 1.2820318874348202e-06, + "loss": 1.2188, + "step": 22311 + }, + { + "epoch": 0.67, + "learning_rate": 1.2818188784549999e-06, + "loss": 1.2914, + "step": 22312 + }, + { + "epoch": 0.67, + "learning_rate": 1.281605881071677e-06, + "loss": 1.144, + "step": 22313 + }, + { + "epoch": 0.67, + "learning_rate": 1.2813928952868802e-06, + "loss": 1.0444, + "step": 22314 + }, + { + "epoch": 0.67, + "learning_rate": 1.2811799211026352e-06, + "loss": 1.0496, + "step": 22315 + }, + { + "epoch": 0.67, + "learning_rate": 1.2809669585209705e-06, + "loss": 1.0735, + "step": 22316 + }, + { + "epoch": 0.67, + "learning_rate": 1.280754007543913e-06, + "loss": 1.1067, + "step": 22317 + }, + { + "epoch": 0.67, + "learning_rate": 1.2805410681734903e-06, + "loss": 1.1324, + "step": 22318 + }, + { + "epoch": 0.67, + "learning_rate": 1.28032814041173e-06, + "loss": 1.0704, + "step": 22319 + }, + { + "epoch": 0.67, + "learning_rate": 1.2801152242606579e-06, + "loss": 1.0414, + "step": 22320 + }, + { + "epoch": 0.67, + "learning_rate": 1.2799023197223008e-06, + "loss": 1.115, + "step": 22321 + }, + { + "epoch": 0.67, + "learning_rate": 1.2796894267986864e-06, + "loss": 1.0399, + "step": 22322 + }, + { + "epoch": 0.67, + "learning_rate": 1.2794765454918417e-06, + "loss": 1.1897, + "step": 22323 + }, + { + "epoch": 0.67, + "learning_rate": 1.279263675803792e-06, + "loss": 1.1593, + "step": 22324 + }, + { + "epoch": 0.67, + "learning_rate": 1.2790508177365635e-06, + "loss": 1.0782, + "step": 22325 + }, + { + "epoch": 0.67, + "learning_rate": 1.2788379712921835e-06, + "loss": 1.1407, + "step": 22326 + }, + { + "epoch": 0.67, + "learning_rate": 1.2786251364726779e-06, + "loss": 1.0428, + "step": 22327 + }, + { + "epoch": 0.67, + "learning_rate": 1.2784123132800736e-06, + "loss": 1.1679, + "step": 22328 + }, + { + "epoch": 0.67, + "learning_rate": 1.2781995017163951e-06, + "loss": 1.2275, + "step": 22329 + }, + { + "epoch": 0.67, + "learning_rate": 1.2779867017836683e-06, + "loss": 1.2127, + "step": 22330 + }, + { + "epoch": 0.67, + "learning_rate": 1.27777391348392e-06, + "loss": 1.1552, + "step": 22331 + }, + { + "epoch": 0.67, + "learning_rate": 1.2775611368191765e-06, + "loss": 1.0325, + "step": 22332 + }, + { + "epoch": 0.67, + "learning_rate": 1.2773483717914609e-06, + "loss": 1.0562, + "step": 22333 + }, + { + "epoch": 0.67, + "learning_rate": 1.2771356184028e-06, + "loss": 1.1527, + "step": 22334 + }, + { + "epoch": 0.67, + "learning_rate": 1.2769228766552194e-06, + "loss": 1.1168, + "step": 22335 + }, + { + "epoch": 0.67, + "learning_rate": 1.2767101465507448e-06, + "loss": 1.0768, + "step": 22336 + }, + { + "epoch": 0.67, + "learning_rate": 1.276497428091399e-06, + "loss": 1.137, + "step": 22337 + }, + { + "epoch": 0.67, + "learning_rate": 1.276284721279209e-06, + "loss": 1.0021, + "step": 22338 + }, + { + "epoch": 0.67, + "learning_rate": 1.2760720261161988e-06, + "loss": 1.0533, + "step": 22339 + }, + { + "epoch": 0.67, + "learning_rate": 1.2758593426043936e-06, + "loss": 0.9745, + "step": 22340 + }, + { + "epoch": 0.67, + "learning_rate": 1.2756466707458176e-06, + "loss": 1.1995, + "step": 22341 + }, + { + "epoch": 0.67, + "learning_rate": 1.2754340105424962e-06, + "loss": 1.1643, + "step": 22342 + }, + { + "epoch": 0.67, + "learning_rate": 1.2752213619964527e-06, + "loss": 1.1633, + "step": 22343 + }, + { + "epoch": 0.67, + "learning_rate": 1.275008725109712e-06, + "loss": 1.0263, + "step": 22344 + }, + { + "epoch": 0.67, + "learning_rate": 1.2747960998842996e-06, + "loss": 1.1997, + "step": 22345 + }, + { + "epoch": 0.67, + "learning_rate": 1.2745834863222372e-06, + "loss": 1.0244, + "step": 22346 + }, + { + "epoch": 0.67, + "learning_rate": 1.2743708844255494e-06, + "loss": 1.0613, + "step": 22347 + }, + { + "epoch": 0.67, + "learning_rate": 1.274158294196261e-06, + "loss": 1.0489, + "step": 22348 + }, + { + "epoch": 0.67, + "learning_rate": 1.273945715636396e-06, + "loss": 1.019, + "step": 22349 + }, + { + "epoch": 0.67, + "learning_rate": 1.2737331487479764e-06, + "loss": 1.2011, + "step": 22350 + }, + { + "epoch": 0.67, + "learning_rate": 1.2735205935330264e-06, + "loss": 1.1447, + "step": 22351 + }, + { + "epoch": 0.67, + "learning_rate": 1.27330804999357e-06, + "loss": 1.1102, + "step": 22352 + }, + { + "epoch": 0.67, + "learning_rate": 1.2730955181316302e-06, + "loss": 1.0073, + "step": 22353 + }, + { + "epoch": 0.67, + "learning_rate": 1.2728829979492308e-06, + "loss": 1.1382, + "step": 22354 + }, + { + "epoch": 0.67, + "learning_rate": 1.2726704894483933e-06, + "loss": 1.0342, + "step": 22355 + }, + { + "epoch": 0.67, + "learning_rate": 1.272457992631142e-06, + "loss": 1.2133, + "step": 22356 + }, + { + "epoch": 0.67, + "learning_rate": 1.2722455074994988e-06, + "loss": 0.9846, + "step": 22357 + }, + { + "epoch": 0.67, + "learning_rate": 1.2720330340554887e-06, + "loss": 1.0847, + "step": 22358 + }, + { + "epoch": 0.67, + "learning_rate": 1.2718205723011311e-06, + "loss": 1.0427, + "step": 22359 + }, + { + "epoch": 0.67, + "learning_rate": 1.2716081222384508e-06, + "loss": 1.1266, + "step": 22360 + }, + { + "epoch": 0.67, + "learning_rate": 1.271395683869469e-06, + "loss": 1.0841, + "step": 22361 + }, + { + "epoch": 0.67, + "learning_rate": 1.2711832571962102e-06, + "loss": 1.1688, + "step": 22362 + }, + { + "epoch": 0.67, + "learning_rate": 1.2709708422206935e-06, + "loss": 0.9962, + "step": 22363 + }, + { + "epoch": 0.67, + "learning_rate": 1.2707584389449423e-06, + "loss": 1.0579, + "step": 22364 + }, + { + "epoch": 0.67, + "learning_rate": 1.270546047370979e-06, + "loss": 1.0505, + "step": 22365 + }, + { + "epoch": 0.67, + "learning_rate": 1.2703336675008254e-06, + "loss": 1.1349, + "step": 22366 + }, + { + "epoch": 0.67, + "learning_rate": 1.2701212993365029e-06, + "loss": 1.0925, + "step": 22367 + }, + { + "epoch": 0.67, + "learning_rate": 1.2699089428800333e-06, + "loss": 1.0722, + "step": 22368 + }, + { + "epoch": 0.67, + "learning_rate": 1.269696598133438e-06, + "loss": 1.0389, + "step": 22369 + }, + { + "epoch": 0.67, + "learning_rate": 1.2694842650987387e-06, + "loss": 1.1258, + "step": 22370 + }, + { + "epoch": 0.67, + "learning_rate": 1.2692719437779575e-06, + "loss": 1.0491, + "step": 22371 + }, + { + "epoch": 0.67, + "learning_rate": 1.2690596341731138e-06, + "loss": 1.0667, + "step": 22372 + }, + { + "epoch": 0.67, + "learning_rate": 1.2688473362862292e-06, + "loss": 1.1784, + "step": 22373 + }, + { + "epoch": 0.67, + "learning_rate": 1.268635050119325e-06, + "loss": 1.2067, + "step": 22374 + }, + { + "epoch": 0.67, + "learning_rate": 1.2684227756744232e-06, + "loss": 1.0261, + "step": 22375 + }, + { + "epoch": 0.67, + "learning_rate": 1.2682105129535427e-06, + "loss": 0.9966, + "step": 22376 + }, + { + "epoch": 0.67, + "learning_rate": 1.2679982619587048e-06, + "loss": 1.0653, + "step": 22377 + }, + { + "epoch": 0.67, + "learning_rate": 1.26778602269193e-06, + "loss": 1.0443, + "step": 22378 + }, + { + "epoch": 0.67, + "learning_rate": 1.2675737951552386e-06, + "loss": 1.0745, + "step": 22379 + }, + { + "epoch": 0.67, + "learning_rate": 1.2673615793506524e-06, + "loss": 1.1529, + "step": 22380 + }, + { + "epoch": 0.67, + "learning_rate": 1.2671493752801894e-06, + "loss": 1.1239, + "step": 22381 + }, + { + "epoch": 0.67, + "learning_rate": 1.2669371829458703e-06, + "loss": 1.0515, + "step": 22382 + }, + { + "epoch": 0.67, + "learning_rate": 1.2667250023497153e-06, + "loss": 1.0035, + "step": 22383 + }, + { + "epoch": 0.67, + "learning_rate": 1.2665128334937454e-06, + "loss": 1.0195, + "step": 22384 + }, + { + "epoch": 0.67, + "learning_rate": 1.2663006763799785e-06, + "loss": 1.1288, + "step": 22385 + }, + { + "epoch": 0.67, + "learning_rate": 1.2660885310104349e-06, + "loss": 1.1557, + "step": 22386 + }, + { + "epoch": 0.67, + "learning_rate": 1.2658763973871341e-06, + "loss": 1.0052, + "step": 22387 + }, + { + "epoch": 0.67, + "learning_rate": 1.2656642755120965e-06, + "loss": 1.0478, + "step": 22388 + }, + { + "epoch": 0.67, + "learning_rate": 1.2654521653873397e-06, + "loss": 1.1479, + "step": 22389 + }, + { + "epoch": 0.67, + "learning_rate": 1.2652400670148834e-06, + "loss": 1.1489, + "step": 22390 + }, + { + "epoch": 0.67, + "learning_rate": 1.2650279803967475e-06, + "loss": 1.1216, + "step": 22391 + }, + { + "epoch": 0.67, + "learning_rate": 1.2648159055349502e-06, + "loss": 1.1547, + "step": 22392 + }, + { + "epoch": 0.67, + "learning_rate": 1.2646038424315104e-06, + "loss": 1.1546, + "step": 22393 + }, + { + "epoch": 0.67, + "learning_rate": 1.2643917910884473e-06, + "loss": 1.0611, + "step": 22394 + }, + { + "epoch": 0.67, + "learning_rate": 1.2641797515077791e-06, + "loss": 1.0898, + "step": 22395 + }, + { + "epoch": 0.67, + "learning_rate": 1.263967723691525e-06, + "loss": 1.1392, + "step": 22396 + }, + { + "epoch": 0.67, + "learning_rate": 1.263755707641703e-06, + "loss": 1.0291, + "step": 22397 + }, + { + "epoch": 0.67, + "learning_rate": 1.2635437033603309e-06, + "loss": 1.2193, + "step": 22398 + }, + { + "epoch": 0.67, + "learning_rate": 1.263331710849427e-06, + "loss": 1.1814, + "step": 22399 + }, + { + "epoch": 0.67, + "learning_rate": 1.2631197301110098e-06, + "loss": 1.1661, + "step": 22400 + }, + { + "epoch": 0.67, + "learning_rate": 1.2629077611470978e-06, + "loss": 1.107, + "step": 22401 + }, + { + "epoch": 0.67, + "learning_rate": 1.262695803959707e-06, + "loss": 1.0596, + "step": 22402 + }, + { + "epoch": 0.67, + "learning_rate": 1.2624838585508567e-06, + "loss": 0.9703, + "step": 22403 + }, + { + "epoch": 0.67, + "learning_rate": 1.262271924922564e-06, + "loss": 1.091, + "step": 22404 + }, + { + "epoch": 0.67, + "learning_rate": 1.262060003076846e-06, + "loss": 1.1357, + "step": 22405 + }, + { + "epoch": 0.67, + "learning_rate": 1.261848093015722e-06, + "loss": 1.0426, + "step": 22406 + }, + { + "epoch": 0.68, + "learning_rate": 1.2616361947412065e-06, + "loss": 1.1805, + "step": 22407 + }, + { + "epoch": 0.68, + "learning_rate": 1.2614243082553184e-06, + "loss": 1.0908, + "step": 22408 + }, + { + "epoch": 0.68, + "learning_rate": 1.2612124335600743e-06, + "loss": 1.1237, + "step": 22409 + }, + { + "epoch": 0.68, + "learning_rate": 1.2610005706574918e-06, + "loss": 1.0723, + "step": 22410 + }, + { + "epoch": 0.68, + "learning_rate": 1.2607887195495866e-06, + "loss": 1.1862, + "step": 22411 + }, + { + "epoch": 0.68, + "learning_rate": 1.2605768802383754e-06, + "loss": 1.0884, + "step": 22412 + }, + { + "epoch": 0.68, + "learning_rate": 1.260365052725876e-06, + "loss": 1.0984, + "step": 22413 + }, + { + "epoch": 0.68, + "learning_rate": 1.2601532370141051e-06, + "loss": 1.0819, + "step": 22414 + }, + { + "epoch": 0.68, + "learning_rate": 1.2599414331050775e-06, + "loss": 1.0016, + "step": 22415 + }, + { + "epoch": 0.68, + "learning_rate": 1.2597296410008098e-06, + "loss": 1.0959, + "step": 22416 + }, + { + "epoch": 0.68, + "learning_rate": 1.2595178607033187e-06, + "loss": 1.0919, + "step": 22417 + }, + { + "epoch": 0.68, + "learning_rate": 1.25930609221462e-06, + "loss": 1.1732, + "step": 22418 + }, + { + "epoch": 0.68, + "learning_rate": 1.2590943355367307e-06, + "loss": 1.0515, + "step": 22419 + }, + { + "epoch": 0.68, + "learning_rate": 1.258882590671665e-06, + "loss": 1.1313, + "step": 22420 + }, + { + "epoch": 0.68, + "learning_rate": 1.258670857621439e-06, + "loss": 1.1244, + "step": 22421 + }, + { + "epoch": 0.68, + "learning_rate": 1.2584591363880689e-06, + "loss": 1.1128, + "step": 22422 + }, + { + "epoch": 0.68, + "learning_rate": 1.2582474269735697e-06, + "loss": 1.0789, + "step": 22423 + }, + { + "epoch": 0.68, + "learning_rate": 1.2580357293799571e-06, + "loss": 1.1168, + "step": 22424 + }, + { + "epoch": 0.68, + "learning_rate": 1.257824043609246e-06, + "loss": 1.1996, + "step": 22425 + }, + { + "epoch": 0.68, + "learning_rate": 1.2576123696634518e-06, + "loss": 1.0098, + "step": 22426 + }, + { + "epoch": 0.68, + "learning_rate": 1.2574007075445907e-06, + "loss": 1.0574, + "step": 22427 + }, + { + "epoch": 0.68, + "learning_rate": 1.2571890572546753e-06, + "loss": 1.1257, + "step": 22428 + }, + { + "epoch": 0.68, + "learning_rate": 1.2569774187957212e-06, + "loss": 1.0826, + "step": 22429 + }, + { + "epoch": 0.68, + "learning_rate": 1.2567657921697437e-06, + "loss": 1.1509, + "step": 22430 + }, + { + "epoch": 0.68, + "learning_rate": 1.256554177378757e-06, + "loss": 1.2027, + "step": 22431 + }, + { + "epoch": 0.68, + "learning_rate": 1.256342574424777e-06, + "loss": 1.1439, + "step": 22432 + }, + { + "epoch": 0.68, + "learning_rate": 1.2561309833098154e-06, + "loss": 1.2524, + "step": 22433 + }, + { + "epoch": 0.68, + "learning_rate": 1.255919404035888e-06, + "loss": 1.2092, + "step": 22434 + }, + { + "epoch": 0.68, + "learning_rate": 1.2557078366050085e-06, + "loss": 1.1979, + "step": 22435 + }, + { + "epoch": 0.68, + "learning_rate": 1.2554962810191917e-06, + "loss": 1.2656, + "step": 22436 + }, + { + "epoch": 0.68, + "learning_rate": 1.2552847372804506e-06, + "loss": 1.2827, + "step": 22437 + }, + { + "epoch": 0.68, + "learning_rate": 1.2550732053907991e-06, + "loss": 1.2135, + "step": 22438 + }, + { + "epoch": 0.68, + "learning_rate": 1.254861685352251e-06, + "loss": 1.1083, + "step": 22439 + }, + { + "epoch": 0.68, + "learning_rate": 1.2546501771668213e-06, + "loss": 1.0662, + "step": 22440 + }, + { + "epoch": 0.68, + "learning_rate": 1.2544386808365208e-06, + "loss": 1.1, + "step": 22441 + }, + { + "epoch": 0.68, + "learning_rate": 1.2542271963633646e-06, + "loss": 1.1137, + "step": 22442 + }, + { + "epoch": 0.68, + "learning_rate": 1.254015723749365e-06, + "loss": 1.1817, + "step": 22443 + }, + { + "epoch": 0.68, + "learning_rate": 1.253804262996537e-06, + "loss": 1.2043, + "step": 22444 + }, + { + "epoch": 0.68, + "learning_rate": 1.2535928141068908e-06, + "loss": 1.1085, + "step": 22445 + }, + { + "epoch": 0.68, + "learning_rate": 1.253381377082441e-06, + "loss": 1.1218, + "step": 22446 + }, + { + "epoch": 0.68, + "learning_rate": 1.2531699519252e-06, + "loss": 1.1373, + "step": 22447 + }, + { + "epoch": 0.68, + "learning_rate": 1.2529585386371806e-06, + "loss": 1.037, + "step": 22448 + }, + { + "epoch": 0.68, + "learning_rate": 1.2527471372203953e-06, + "loss": 1.2448, + "step": 22449 + }, + { + "epoch": 0.68, + "learning_rate": 1.2525357476768569e-06, + "loss": 1.0278, + "step": 22450 + }, + { + "epoch": 0.68, + "learning_rate": 1.2523243700085768e-06, + "loss": 1.0513, + "step": 22451 + }, + { + "epoch": 0.68, + "learning_rate": 1.2521130042175682e-06, + "loss": 1.0447, + "step": 22452 + }, + { + "epoch": 0.68, + "learning_rate": 1.251901650305844e-06, + "loss": 1.0433, + "step": 22453 + }, + { + "epoch": 0.68, + "learning_rate": 1.2516903082754134e-06, + "loss": 1.2138, + "step": 22454 + }, + { + "epoch": 0.68, + "learning_rate": 1.2514789781282901e-06, + "loss": 1.2064, + "step": 22455 + }, + { + "epoch": 0.68, + "learning_rate": 1.2512676598664858e-06, + "loss": 1.0774, + "step": 22456 + }, + { + "epoch": 0.68, + "learning_rate": 1.2510563534920128e-06, + "loss": 1.1293, + "step": 22457 + }, + { + "epoch": 0.68, + "learning_rate": 1.2508450590068807e-06, + "loss": 1.0903, + "step": 22458 + }, + { + "epoch": 0.68, + "learning_rate": 1.250633776413102e-06, + "loss": 1.0894, + "step": 22459 + }, + { + "epoch": 0.68, + "learning_rate": 1.2504225057126884e-06, + "loss": 1.0742, + "step": 22460 + }, + { + "epoch": 0.68, + "learning_rate": 1.2502112469076505e-06, + "loss": 1.0152, + "step": 22461 + }, + { + "epoch": 0.68, + "learning_rate": 1.2500000000000007e-06, + "loss": 1.3086, + "step": 22462 + }, + { + "epoch": 0.68, + "learning_rate": 1.2497887649917479e-06, + "loss": 0.9965, + "step": 22463 + }, + { + "epoch": 0.68, + "learning_rate": 1.2495775418849038e-06, + "loss": 1.0941, + "step": 22464 + }, + { + "epoch": 0.68, + "learning_rate": 1.249366330681479e-06, + "loss": 0.9777, + "step": 22465 + }, + { + "epoch": 0.68, + "learning_rate": 1.2491551313834857e-06, + "loss": 1.1506, + "step": 22466 + }, + { + "epoch": 0.68, + "learning_rate": 1.2489439439929323e-06, + "loss": 1.1647, + "step": 22467 + }, + { + "epoch": 0.68, + "learning_rate": 1.2487327685118297e-06, + "loss": 1.0942, + "step": 22468 + }, + { + "epoch": 0.68, + "learning_rate": 1.2485216049421888e-06, + "loss": 1.1649, + "step": 22469 + }, + { + "epoch": 0.68, + "learning_rate": 1.2483104532860205e-06, + "loss": 1.1071, + "step": 22470 + }, + { + "epoch": 0.68, + "learning_rate": 1.2480993135453326e-06, + "loss": 1.0986, + "step": 22471 + }, + { + "epoch": 0.68, + "learning_rate": 1.2478881857221364e-06, + "loss": 1.0969, + "step": 22472 + }, + { + "epoch": 0.68, + "learning_rate": 1.2476770698184418e-06, + "loss": 1.0773, + "step": 22473 + }, + { + "epoch": 0.68, + "learning_rate": 1.247465965836258e-06, + "loss": 1.142, + "step": 22474 + }, + { + "epoch": 0.68, + "learning_rate": 1.2472548737775953e-06, + "loss": 1.1619, + "step": 22475 + }, + { + "epoch": 0.68, + "learning_rate": 1.2470437936444627e-06, + "loss": 1.1449, + "step": 22476 + }, + { + "epoch": 0.68, + "learning_rate": 1.2468327254388699e-06, + "loss": 1.1125, + "step": 22477 + }, + { + "epoch": 0.68, + "learning_rate": 1.2466216691628258e-06, + "loss": 1.0253, + "step": 22478 + }, + { + "epoch": 0.68, + "learning_rate": 1.2464106248183408e-06, + "loss": 1.0981, + "step": 22479 + }, + { + "epoch": 0.68, + "learning_rate": 1.2461995924074218e-06, + "loss": 1.1323, + "step": 22480 + }, + { + "epoch": 0.68, + "learning_rate": 1.245988571932079e-06, + "loss": 1.2585, + "step": 22481 + }, + { + "epoch": 0.68, + "learning_rate": 1.2457775633943212e-06, + "loss": 1.0834, + "step": 22482 + }, + { + "epoch": 0.68, + "learning_rate": 1.2455665667961574e-06, + "loss": 1.1315, + "step": 22483 + }, + { + "epoch": 0.68, + "learning_rate": 1.2453555821395953e-06, + "loss": 1.1644, + "step": 22484 + }, + { + "epoch": 0.68, + "learning_rate": 1.2451446094266434e-06, + "loss": 1.0695, + "step": 22485 + }, + { + "epoch": 0.68, + "learning_rate": 1.2449336486593108e-06, + "loss": 1.1493, + "step": 22486 + }, + { + "epoch": 0.68, + "learning_rate": 1.2447226998396053e-06, + "loss": 1.231, + "step": 22487 + }, + { + "epoch": 0.68, + "learning_rate": 1.2445117629695362e-06, + "loss": 1.1914, + "step": 22488 + }, + { + "epoch": 0.68, + "learning_rate": 1.244300838051109e-06, + "loss": 1.0861, + "step": 22489 + }, + { + "epoch": 0.68, + "learning_rate": 1.2440899250863333e-06, + "loss": 1.0906, + "step": 22490 + }, + { + "epoch": 0.68, + "learning_rate": 1.243879024077217e-06, + "loss": 1.0978, + "step": 22491 + }, + { + "epoch": 0.68, + "learning_rate": 1.2436681350257682e-06, + "loss": 1.121, + "step": 22492 + }, + { + "epoch": 0.68, + "learning_rate": 1.2434572579339926e-06, + "loss": 1.1469, + "step": 22493 + }, + { + "epoch": 0.68, + "learning_rate": 1.2432463928038988e-06, + "loss": 1.0877, + "step": 22494 + }, + { + "epoch": 0.68, + "learning_rate": 1.2430355396374938e-06, + "loss": 1.0385, + "step": 22495 + }, + { + "epoch": 0.68, + "learning_rate": 1.2428246984367865e-06, + "loss": 1.1019, + "step": 22496 + }, + { + "epoch": 0.68, + "learning_rate": 1.2426138692037815e-06, + "loss": 1.0375, + "step": 22497 + }, + { + "epoch": 0.68, + "learning_rate": 1.2424030519404866e-06, + "loss": 1.114, + "step": 22498 + }, + { + "epoch": 0.68, + "learning_rate": 1.2421922466489092e-06, + "loss": 1.1953, + "step": 22499 + }, + { + "epoch": 0.68, + "learning_rate": 1.241981453331056e-06, + "loss": 1.152, + "step": 22500 + }, + { + "epoch": 0.68, + "learning_rate": 1.2417706719889342e-06, + "loss": 1.1515, + "step": 22501 + }, + { + "epoch": 0.68, + "learning_rate": 1.2415599026245486e-06, + "loss": 1.0394, + "step": 22502 + }, + { + "epoch": 0.68, + "learning_rate": 1.2413491452399068e-06, + "loss": 1.1287, + "step": 22503 + }, + { + "epoch": 0.68, + "learning_rate": 1.241138399837015e-06, + "loss": 1.0623, + "step": 22504 + }, + { + "epoch": 0.68, + "learning_rate": 1.240927666417879e-06, + "loss": 1.2261, + "step": 22505 + }, + { + "epoch": 0.68, + "learning_rate": 1.2407169449845054e-06, + "loss": 1.0241, + "step": 22506 + }, + { + "epoch": 0.68, + "learning_rate": 1.2405062355389002e-06, + "loss": 0.9746, + "step": 22507 + }, + { + "epoch": 0.68, + "learning_rate": 1.2402955380830689e-06, + "loss": 1.1019, + "step": 22508 + }, + { + "epoch": 0.68, + "learning_rate": 1.2400848526190186e-06, + "loss": 1.171, + "step": 22509 + }, + { + "epoch": 0.68, + "learning_rate": 1.2398741791487523e-06, + "loss": 1.0807, + "step": 22510 + }, + { + "epoch": 0.68, + "learning_rate": 1.2396635176742773e-06, + "loss": 1.106, + "step": 22511 + }, + { + "epoch": 0.68, + "learning_rate": 1.2394528681975985e-06, + "loss": 1.1535, + "step": 22512 + }, + { + "epoch": 0.68, + "learning_rate": 1.239242230720721e-06, + "loss": 1.1096, + "step": 22513 + }, + { + "epoch": 0.68, + "learning_rate": 1.2390316052456513e-06, + "loss": 1.0347, + "step": 22514 + }, + { + "epoch": 0.68, + "learning_rate": 1.238820991774393e-06, + "loss": 1.0245, + "step": 22515 + }, + { + "epoch": 0.68, + "learning_rate": 1.238610390308951e-06, + "loss": 1.0934, + "step": 22516 + }, + { + "epoch": 0.68, + "learning_rate": 1.2383998008513304e-06, + "loss": 1.21, + "step": 22517 + }, + { + "epoch": 0.68, + "learning_rate": 1.2381892234035373e-06, + "loss": 1.1783, + "step": 22518 + }, + { + "epoch": 0.68, + "learning_rate": 1.2379786579675742e-06, + "loss": 1.0234, + "step": 22519 + }, + { + "epoch": 0.68, + "learning_rate": 1.2377681045454462e-06, + "loss": 1.1915, + "step": 22520 + }, + { + "epoch": 0.68, + "learning_rate": 1.2375575631391581e-06, + "loss": 0.9986, + "step": 22521 + }, + { + "epoch": 0.68, + "learning_rate": 1.2373470337507152e-06, + "loss": 1.1127, + "step": 22522 + }, + { + "epoch": 0.68, + "learning_rate": 1.237136516382119e-06, + "loss": 1.215, + "step": 22523 + }, + { + "epoch": 0.68, + "learning_rate": 1.2369260110353753e-06, + "loss": 1.095, + "step": 22524 + }, + { + "epoch": 0.68, + "learning_rate": 1.2367155177124875e-06, + "loss": 1.1147, + "step": 22525 + }, + { + "epoch": 0.68, + "learning_rate": 1.2365050364154597e-06, + "loss": 1.0673, + "step": 22526 + }, + { + "epoch": 0.68, + "learning_rate": 1.2362945671462962e-06, + "loss": 1.1204, + "step": 22527 + }, + { + "epoch": 0.68, + "learning_rate": 1.236084109906999e-06, + "loss": 1.0313, + "step": 22528 + }, + { + "epoch": 0.68, + "learning_rate": 1.235873664699572e-06, + "loss": 1.0565, + "step": 22529 + }, + { + "epoch": 0.68, + "learning_rate": 1.2356632315260191e-06, + "loss": 1.0845, + "step": 22530 + }, + { + "epoch": 0.68, + "learning_rate": 1.2354528103883434e-06, + "loss": 1.0934, + "step": 22531 + }, + { + "epoch": 0.68, + "learning_rate": 1.2352424012885481e-06, + "loss": 1.1656, + "step": 22532 + }, + { + "epoch": 0.68, + "learning_rate": 1.2350320042286357e-06, + "loss": 1.1103, + "step": 22533 + }, + { + "epoch": 0.68, + "learning_rate": 1.2348216192106094e-06, + "loss": 1.0652, + "step": 22534 + }, + { + "epoch": 0.68, + "learning_rate": 1.234611246236473e-06, + "loss": 1.1824, + "step": 22535 + }, + { + "epoch": 0.68, + "learning_rate": 1.234400885308227e-06, + "loss": 1.0552, + "step": 22536 + }, + { + "epoch": 0.68, + "learning_rate": 1.2341905364278753e-06, + "loss": 1.1255, + "step": 22537 + }, + { + "epoch": 0.68, + "learning_rate": 1.23398019959742e-06, + "loss": 0.9319, + "step": 22538 + }, + { + "epoch": 0.68, + "learning_rate": 1.2337698748188633e-06, + "loss": 1.106, + "step": 22539 + }, + { + "epoch": 0.68, + "learning_rate": 1.2335595620942087e-06, + "loss": 1.0623, + "step": 22540 + }, + { + "epoch": 0.68, + "learning_rate": 1.2333492614254562e-06, + "loss": 1.1225, + "step": 22541 + }, + { + "epoch": 0.68, + "learning_rate": 1.2331389728146083e-06, + "loss": 1.1459, + "step": 22542 + }, + { + "epoch": 0.68, + "learning_rate": 1.2329286962636678e-06, + "loss": 0.9971, + "step": 22543 + }, + { + "epoch": 0.68, + "learning_rate": 1.2327184317746363e-06, + "loss": 1.0696, + "step": 22544 + }, + { + "epoch": 0.68, + "learning_rate": 1.2325081793495144e-06, + "loss": 1.1097, + "step": 22545 + }, + { + "epoch": 0.68, + "learning_rate": 1.2322979389903039e-06, + "loss": 1.0261, + "step": 22546 + }, + { + "epoch": 0.68, + "learning_rate": 1.2320877106990067e-06, + "loss": 1.0314, + "step": 22547 + }, + { + "epoch": 0.68, + "learning_rate": 1.2318774944776248e-06, + "loss": 1.2423, + "step": 22548 + }, + { + "epoch": 0.68, + "learning_rate": 1.2316672903281574e-06, + "loss": 0.9827, + "step": 22549 + }, + { + "epoch": 0.68, + "learning_rate": 1.2314570982526064e-06, + "loss": 1.1042, + "step": 22550 + }, + { + "epoch": 0.68, + "learning_rate": 1.2312469182529729e-06, + "loss": 1.1759, + "step": 22551 + }, + { + "epoch": 0.68, + "learning_rate": 1.231036750331258e-06, + "loss": 1.0851, + "step": 22552 + }, + { + "epoch": 0.68, + "learning_rate": 1.2308265944894627e-06, + "loss": 1.1198, + "step": 22553 + }, + { + "epoch": 0.68, + "learning_rate": 1.2306164507295862e-06, + "loss": 1.1305, + "step": 22554 + }, + { + "epoch": 0.68, + "learning_rate": 1.2304063190536297e-06, + "loss": 1.1689, + "step": 22555 + }, + { + "epoch": 0.68, + "learning_rate": 1.2301961994635936e-06, + "loss": 1.2688, + "step": 22556 + }, + { + "epoch": 0.68, + "learning_rate": 1.229986091961478e-06, + "loss": 1.1635, + "step": 22557 + }, + { + "epoch": 0.68, + "learning_rate": 1.229775996549283e-06, + "loss": 1.0063, + "step": 22558 + }, + { + "epoch": 0.68, + "learning_rate": 1.229565913229009e-06, + "loss": 1.1738, + "step": 22559 + }, + { + "epoch": 0.68, + "learning_rate": 1.2293558420026558e-06, + "loss": 1.122, + "step": 22560 + }, + { + "epoch": 0.68, + "learning_rate": 1.2291457828722236e-06, + "loss": 1.1284, + "step": 22561 + }, + { + "epoch": 0.68, + "learning_rate": 1.228935735839711e-06, + "loss": 1.1744, + "step": 22562 + }, + { + "epoch": 0.68, + "learning_rate": 1.2287257009071177e-06, + "loss": 1.0715, + "step": 22563 + }, + { + "epoch": 0.68, + "learning_rate": 1.2285156780764435e-06, + "loss": 1.1505, + "step": 22564 + }, + { + "epoch": 0.68, + "learning_rate": 1.2283056673496877e-06, + "loss": 1.1368, + "step": 22565 + }, + { + "epoch": 0.68, + "learning_rate": 1.2280956687288504e-06, + "loss": 1.1049, + "step": 22566 + }, + { + "epoch": 0.68, + "learning_rate": 1.2278856822159289e-06, + "loss": 1.1083, + "step": 22567 + }, + { + "epoch": 0.68, + "learning_rate": 1.227675707812923e-06, + "loss": 1.2144, + "step": 22568 + }, + { + "epoch": 0.68, + "learning_rate": 1.2274657455218314e-06, + "loss": 1.2405, + "step": 22569 + }, + { + "epoch": 0.68, + "learning_rate": 1.227255795344654e-06, + "loss": 1.0905, + "step": 22570 + }, + { + "epoch": 0.68, + "learning_rate": 1.2270458572833877e-06, + "loss": 0.9848, + "step": 22571 + }, + { + "epoch": 0.68, + "learning_rate": 1.2268359313400317e-06, + "loss": 1.0214, + "step": 22572 + }, + { + "epoch": 0.68, + "learning_rate": 1.2266260175165845e-06, + "loss": 1.1828, + "step": 22573 + }, + { + "epoch": 0.68, + "learning_rate": 1.2264161158150453e-06, + "loss": 1.1345, + "step": 22574 + }, + { + "epoch": 0.68, + "learning_rate": 1.2262062262374104e-06, + "loss": 1.0627, + "step": 22575 + }, + { + "epoch": 0.68, + "learning_rate": 1.2259963487856786e-06, + "loss": 1.1841, + "step": 22576 + }, + { + "epoch": 0.68, + "learning_rate": 1.225786483461848e-06, + "loss": 1.0357, + "step": 22577 + }, + { + "epoch": 0.68, + "learning_rate": 1.2255766302679162e-06, + "loss": 1.1101, + "step": 22578 + }, + { + "epoch": 0.68, + "learning_rate": 1.2253667892058824e-06, + "loss": 1.118, + "step": 22579 + }, + { + "epoch": 0.68, + "learning_rate": 1.2251569602777416e-06, + "loss": 1.0269, + "step": 22580 + }, + { + "epoch": 0.68, + "learning_rate": 1.224947143485493e-06, + "loss": 1.1613, + "step": 22581 + }, + { + "epoch": 0.68, + "learning_rate": 1.224737338831133e-06, + "loss": 1.1467, + "step": 22582 + }, + { + "epoch": 0.68, + "learning_rate": 1.2245275463166606e-06, + "loss": 1.2018, + "step": 22583 + }, + { + "epoch": 0.68, + "learning_rate": 1.2243177659440706e-06, + "loss": 1.0483, + "step": 22584 + }, + { + "epoch": 0.68, + "learning_rate": 1.224107997715361e-06, + "loss": 1.1957, + "step": 22585 + }, + { + "epoch": 0.68, + "learning_rate": 1.223898241632529e-06, + "loss": 1.0377, + "step": 22586 + }, + { + "epoch": 0.68, + "learning_rate": 1.2236884976975714e-06, + "loss": 1.1046, + "step": 22587 + }, + { + "epoch": 0.68, + "learning_rate": 1.2234787659124842e-06, + "loss": 1.2022, + "step": 22588 + }, + { + "epoch": 0.68, + "learning_rate": 1.2232690462792644e-06, + "loss": 1.1337, + "step": 22589 + }, + { + "epoch": 0.68, + "learning_rate": 1.2230593387999081e-06, + "loss": 1.1712, + "step": 22590 + }, + { + "epoch": 0.68, + "learning_rate": 1.2228496434764124e-06, + "loss": 0.9797, + "step": 22591 + }, + { + "epoch": 0.68, + "learning_rate": 1.222639960310774e-06, + "loss": 1.1265, + "step": 22592 + }, + { + "epoch": 0.68, + "learning_rate": 1.2224302893049867e-06, + "loss": 1.233, + "step": 22593 + }, + { + "epoch": 0.68, + "learning_rate": 1.2222206304610477e-06, + "loss": 1.0897, + "step": 22594 + }, + { + "epoch": 0.68, + "learning_rate": 1.222010983780953e-06, + "loss": 1.0353, + "step": 22595 + }, + { + "epoch": 0.68, + "learning_rate": 1.2218013492666991e-06, + "loss": 1.1172, + "step": 22596 + }, + { + "epoch": 0.68, + "learning_rate": 1.22159172692028e-06, + "loss": 1.0707, + "step": 22597 + }, + { + "epoch": 0.68, + "learning_rate": 1.2213821167436917e-06, + "loss": 1.0392, + "step": 22598 + }, + { + "epoch": 0.68, + "learning_rate": 1.2211725187389303e-06, + "loss": 1.1397, + "step": 22599 + }, + { + "epoch": 0.68, + "learning_rate": 1.2209629329079912e-06, + "loss": 1.1588, + "step": 22600 + }, + { + "epoch": 0.68, + "learning_rate": 1.220753359252868e-06, + "loss": 1.0983, + "step": 22601 + }, + { + "epoch": 0.68, + "learning_rate": 1.2205437977755569e-06, + "loss": 0.9987, + "step": 22602 + }, + { + "epoch": 0.68, + "learning_rate": 1.2203342484780526e-06, + "loss": 1.0859, + "step": 22603 + }, + { + "epoch": 0.68, + "learning_rate": 1.2201247113623498e-06, + "loss": 1.1967, + "step": 22604 + }, + { + "epoch": 0.68, + "learning_rate": 1.2199151864304446e-06, + "loss": 1.0253, + "step": 22605 + }, + { + "epoch": 0.68, + "learning_rate": 1.219705673684329e-06, + "loss": 1.1096, + "step": 22606 + }, + { + "epoch": 0.68, + "learning_rate": 1.219496173125999e-06, + "loss": 1.1962, + "step": 22607 + }, + { + "epoch": 0.68, + "learning_rate": 1.2192866847574485e-06, + "loss": 1.085, + "step": 22608 + }, + { + "epoch": 0.68, + "learning_rate": 1.2190772085806733e-06, + "loss": 1.1018, + "step": 22609 + }, + { + "epoch": 0.68, + "learning_rate": 1.218867744597665e-06, + "loss": 1.1282, + "step": 22610 + }, + { + "epoch": 0.68, + "learning_rate": 1.2186582928104184e-06, + "loss": 1.097, + "step": 22611 + }, + { + "epoch": 0.68, + "learning_rate": 1.2184488532209281e-06, + "loss": 1.205, + "step": 22612 + }, + { + "epoch": 0.68, + "learning_rate": 1.2182394258311875e-06, + "loss": 1.1625, + "step": 22613 + }, + { + "epoch": 0.68, + "learning_rate": 1.2180300106431903e-06, + "loss": 1.0773, + "step": 22614 + }, + { + "epoch": 0.68, + "learning_rate": 1.21782060765893e-06, + "loss": 1.0444, + "step": 22615 + }, + { + "epoch": 0.68, + "learning_rate": 1.2176112168803997e-06, + "loss": 1.1731, + "step": 22616 + }, + { + "epoch": 0.68, + "learning_rate": 1.2174018383095942e-06, + "loss": 1.0687, + "step": 22617 + }, + { + "epoch": 0.68, + "learning_rate": 1.2171924719485046e-06, + "loss": 1.214, + "step": 22618 + }, + { + "epoch": 0.68, + "learning_rate": 1.2169831177991246e-06, + "loss": 1.1079, + "step": 22619 + }, + { + "epoch": 0.68, + "learning_rate": 1.2167737758634474e-06, + "loss": 1.0651, + "step": 22620 + }, + { + "epoch": 0.68, + "learning_rate": 1.2165644461434661e-06, + "loss": 1.0511, + "step": 22621 + }, + { + "epoch": 0.68, + "learning_rate": 1.216355128641174e-06, + "loss": 1.0323, + "step": 22622 + }, + { + "epoch": 0.68, + "learning_rate": 1.2161458233585615e-06, + "loss": 1.1478, + "step": 22623 + }, + { + "epoch": 0.68, + "learning_rate": 1.215936530297623e-06, + "loss": 1.1133, + "step": 22624 + }, + { + "epoch": 0.68, + "learning_rate": 1.21572724946035e-06, + "loss": 1.0923, + "step": 22625 + }, + { + "epoch": 0.68, + "learning_rate": 1.2155179808487362e-06, + "loss": 1.069, + "step": 22626 + }, + { + "epoch": 0.68, + "learning_rate": 1.2153087244647716e-06, + "loss": 1.1007, + "step": 22627 + }, + { + "epoch": 0.68, + "learning_rate": 1.215099480310449e-06, + "loss": 1.0779, + "step": 22628 + }, + { + "epoch": 0.68, + "learning_rate": 1.2148902483877607e-06, + "loss": 1.1089, + "step": 22629 + }, + { + "epoch": 0.68, + "learning_rate": 1.2146810286986993e-06, + "loss": 1.0577, + "step": 22630 + }, + { + "epoch": 0.68, + "learning_rate": 1.2144718212452545e-06, + "loss": 1.1959, + "step": 22631 + }, + { + "epoch": 0.68, + "learning_rate": 1.2142626260294184e-06, + "loss": 1.136, + "step": 22632 + }, + { + "epoch": 0.68, + "learning_rate": 1.2140534430531834e-06, + "loss": 1.1366, + "step": 22633 + }, + { + "epoch": 0.68, + "learning_rate": 1.21384427231854e-06, + "loss": 1.0593, + "step": 22634 + }, + { + "epoch": 0.68, + "learning_rate": 1.213635113827481e-06, + "loss": 1.1342, + "step": 22635 + }, + { + "epoch": 0.68, + "learning_rate": 1.2134259675819948e-06, + "loss": 1.0806, + "step": 22636 + }, + { + "epoch": 0.68, + "learning_rate": 1.2132168335840742e-06, + "loss": 1.043, + "step": 22637 + }, + { + "epoch": 0.68, + "learning_rate": 1.2130077118357092e-06, + "loss": 1.292, + "step": 22638 + }, + { + "epoch": 0.68, + "learning_rate": 1.2127986023388914e-06, + "loss": 1.1632, + "step": 22639 + }, + { + "epoch": 0.68, + "learning_rate": 1.2125895050956105e-06, + "loss": 1.1118, + "step": 22640 + }, + { + "epoch": 0.68, + "learning_rate": 1.2123804201078575e-06, + "loss": 1.076, + "step": 22641 + }, + { + "epoch": 0.68, + "learning_rate": 1.2121713473776231e-06, + "loss": 1.2072, + "step": 22642 + }, + { + "epoch": 0.68, + "learning_rate": 1.2119622869068978e-06, + "loss": 0.9997, + "step": 22643 + }, + { + "epoch": 0.68, + "learning_rate": 1.2117532386976705e-06, + "loss": 1.0544, + "step": 22644 + }, + { + "epoch": 0.68, + "learning_rate": 1.211544202751932e-06, + "loss": 1.0667, + "step": 22645 + }, + { + "epoch": 0.68, + "learning_rate": 1.211335179071672e-06, + "loss": 1.0084, + "step": 22646 + }, + { + "epoch": 0.68, + "learning_rate": 1.2111261676588803e-06, + "loss": 1.1343, + "step": 22647 + }, + { + "epoch": 0.68, + "learning_rate": 1.210917168515548e-06, + "loss": 1.0624, + "step": 22648 + }, + { + "epoch": 0.68, + "learning_rate": 1.2107081816436623e-06, + "loss": 1.2512, + "step": 22649 + }, + { + "epoch": 0.68, + "learning_rate": 1.2104992070452136e-06, + "loss": 1.1233, + "step": 22650 + }, + { + "epoch": 0.68, + "learning_rate": 1.2102902447221918e-06, + "loss": 1.0925, + "step": 22651 + }, + { + "epoch": 0.68, + "learning_rate": 1.2100812946765864e-06, + "loss": 1.1942, + "step": 22652 + }, + { + "epoch": 0.68, + "learning_rate": 1.2098723569103848e-06, + "loss": 1.1337, + "step": 22653 + }, + { + "epoch": 0.68, + "learning_rate": 1.2096634314255774e-06, + "loss": 1.1227, + "step": 22654 + }, + { + "epoch": 0.68, + "learning_rate": 1.2094545182241524e-06, + "loss": 1.1507, + "step": 22655 + }, + { + "epoch": 0.68, + "learning_rate": 1.2092456173081e-06, + "loss": 1.1219, + "step": 22656 + }, + { + "epoch": 0.68, + "learning_rate": 1.2090367286794064e-06, + "loss": 1.1354, + "step": 22657 + }, + { + "epoch": 0.68, + "learning_rate": 1.2088278523400615e-06, + "loss": 1.0496, + "step": 22658 + }, + { + "epoch": 0.68, + "learning_rate": 1.2086189882920538e-06, + "loss": 1.064, + "step": 22659 + }, + { + "epoch": 0.68, + "learning_rate": 1.208410136537371e-06, + "loss": 1.1466, + "step": 22660 + }, + { + "epoch": 0.68, + "learning_rate": 1.208201297078003e-06, + "loss": 1.252, + "step": 22661 + }, + { + "epoch": 0.68, + "learning_rate": 1.2079924699159353e-06, + "loss": 1.1389, + "step": 22662 + }, + { + "epoch": 0.68, + "learning_rate": 1.2077836550531572e-06, + "loss": 1.053, + "step": 22663 + }, + { + "epoch": 0.68, + "learning_rate": 1.2075748524916562e-06, + "loss": 1.1266, + "step": 22664 + }, + { + "epoch": 0.68, + "learning_rate": 1.2073660622334203e-06, + "loss": 1.2312, + "step": 22665 + }, + { + "epoch": 0.68, + "learning_rate": 1.2071572842804377e-06, + "loss": 1.1094, + "step": 22666 + }, + { + "epoch": 0.68, + "learning_rate": 1.2069485186346943e-06, + "loss": 0.9984, + "step": 22667 + }, + { + "epoch": 0.68, + "learning_rate": 1.2067397652981782e-06, + "loss": 1.1288, + "step": 22668 + }, + { + "epoch": 0.68, + "learning_rate": 1.2065310242728766e-06, + "loss": 1.2271, + "step": 22669 + }, + { + "epoch": 0.68, + "learning_rate": 1.2063222955607768e-06, + "loss": 0.987, + "step": 22670 + }, + { + "epoch": 0.68, + "learning_rate": 1.2061135791638657e-06, + "loss": 1.0954, + "step": 22671 + }, + { + "epoch": 0.68, + "learning_rate": 1.20590487508413e-06, + "loss": 0.9567, + "step": 22672 + }, + { + "epoch": 0.68, + "learning_rate": 1.2056961833235566e-06, + "loss": 1.0903, + "step": 22673 + }, + { + "epoch": 0.68, + "learning_rate": 1.2054875038841334e-06, + "loss": 1.2444, + "step": 22674 + }, + { + "epoch": 0.68, + "learning_rate": 1.2052788367678447e-06, + "loss": 1.0435, + "step": 22675 + }, + { + "epoch": 0.68, + "learning_rate": 1.2050701819766777e-06, + "loss": 1.0778, + "step": 22676 + }, + { + "epoch": 0.68, + "learning_rate": 1.2048615395126193e-06, + "loss": 1.1714, + "step": 22677 + }, + { + "epoch": 0.68, + "learning_rate": 1.204652909377656e-06, + "loss": 1.1367, + "step": 22678 + }, + { + "epoch": 0.68, + "learning_rate": 1.2044442915737722e-06, + "loss": 1.1035, + "step": 22679 + }, + { + "epoch": 0.68, + "learning_rate": 1.2042356861029546e-06, + "loss": 1.2017, + "step": 22680 + }, + { + "epoch": 0.68, + "learning_rate": 1.2040270929671893e-06, + "loss": 1.2068, + "step": 22681 + }, + { + "epoch": 0.68, + "learning_rate": 1.203818512168463e-06, + "loss": 1.2084, + "step": 22682 + }, + { + "epoch": 0.68, + "learning_rate": 1.2036099437087592e-06, + "loss": 1.1945, + "step": 22683 + }, + { + "epoch": 0.68, + "learning_rate": 1.2034013875900644e-06, + "loss": 1.1397, + "step": 22684 + }, + { + "epoch": 0.68, + "learning_rate": 1.203192843814364e-06, + "loss": 1.0063, + "step": 22685 + }, + { + "epoch": 0.68, + "learning_rate": 1.2029843123836428e-06, + "loss": 1.0599, + "step": 22686 + }, + { + "epoch": 0.68, + "learning_rate": 1.2027757932998877e-06, + "loss": 1.1437, + "step": 22687 + }, + { + "epoch": 0.68, + "learning_rate": 1.2025672865650811e-06, + "loss": 1.0885, + "step": 22688 + }, + { + "epoch": 0.68, + "learning_rate": 1.202358792181209e-06, + "loss": 1.1793, + "step": 22689 + }, + { + "epoch": 0.68, + "learning_rate": 1.2021503101502563e-06, + "loss": 1.1274, + "step": 22690 + }, + { + "epoch": 0.68, + "learning_rate": 1.2019418404742087e-06, + "loss": 1.1143, + "step": 22691 + }, + { + "epoch": 0.68, + "learning_rate": 1.2017333831550485e-06, + "loss": 1.1778, + "step": 22692 + }, + { + "epoch": 0.68, + "learning_rate": 1.2015249381947614e-06, + "loss": 1.2859, + "step": 22693 + }, + { + "epoch": 0.68, + "learning_rate": 1.2013165055953313e-06, + "loss": 0.9488, + "step": 22694 + }, + { + "epoch": 0.68, + "learning_rate": 1.2011080853587426e-06, + "loss": 1.0458, + "step": 22695 + }, + { + "epoch": 0.68, + "learning_rate": 1.2008996774869794e-06, + "loss": 1.0501, + "step": 22696 + }, + { + "epoch": 0.68, + "learning_rate": 1.2006912819820255e-06, + "loss": 1.129, + "step": 22697 + }, + { + "epoch": 0.68, + "learning_rate": 1.200482898845865e-06, + "loss": 1.0911, + "step": 22698 + }, + { + "epoch": 0.68, + "learning_rate": 1.2002745280804814e-06, + "loss": 1.2592, + "step": 22699 + }, + { + "epoch": 0.68, + "learning_rate": 1.2000661696878593e-06, + "loss": 1.1779, + "step": 22700 + }, + { + "epoch": 0.68, + "learning_rate": 1.1998578236699801e-06, + "loss": 1.1556, + "step": 22701 + }, + { + "epoch": 0.68, + "learning_rate": 1.1996494900288282e-06, + "loss": 1.0976, + "step": 22702 + }, + { + "epoch": 0.68, + "learning_rate": 1.1994411687663873e-06, + "loss": 1.1224, + "step": 22703 + }, + { + "epoch": 0.68, + "learning_rate": 1.1992328598846405e-06, + "loss": 0.9883, + "step": 22704 + }, + { + "epoch": 0.68, + "learning_rate": 1.19902456338557e-06, + "loss": 1.1331, + "step": 22705 + }, + { + "epoch": 0.68, + "learning_rate": 1.198816279271159e-06, + "loss": 1.088, + "step": 22706 + }, + { + "epoch": 0.68, + "learning_rate": 1.19860800754339e-06, + "loss": 1.0504, + "step": 22707 + }, + { + "epoch": 0.68, + "learning_rate": 1.198399748204247e-06, + "loss": 1.0273, + "step": 22708 + }, + { + "epoch": 0.68, + "learning_rate": 1.1981915012557108e-06, + "loss": 1.1885, + "step": 22709 + }, + { + "epoch": 0.68, + "learning_rate": 1.1979832666997643e-06, + "loss": 1.1583, + "step": 22710 + }, + { + "epoch": 0.68, + "learning_rate": 1.1977750445383903e-06, + "loss": 1.1072, + "step": 22711 + }, + { + "epoch": 0.68, + "learning_rate": 1.1975668347735706e-06, + "loss": 1.0754, + "step": 22712 + }, + { + "epoch": 0.68, + "learning_rate": 1.1973586374072881e-06, + "loss": 1.1005, + "step": 22713 + }, + { + "epoch": 0.68, + "learning_rate": 1.1971504524415233e-06, + "loss": 1.0003, + "step": 22714 + }, + { + "epoch": 0.68, + "learning_rate": 1.1969422798782587e-06, + "loss": 1.1346, + "step": 22715 + }, + { + "epoch": 0.68, + "learning_rate": 1.196734119719476e-06, + "loss": 1.1511, + "step": 22716 + }, + { + "epoch": 0.68, + "learning_rate": 1.1965259719671577e-06, + "loss": 1.2469, + "step": 22717 + }, + { + "epoch": 0.68, + "learning_rate": 1.1963178366232833e-06, + "loss": 1.1502, + "step": 22718 + }, + { + "epoch": 0.68, + "learning_rate": 1.1961097136898353e-06, + "loss": 1.0547, + "step": 22719 + }, + { + "epoch": 0.68, + "learning_rate": 1.195901603168795e-06, + "loss": 1.1226, + "step": 22720 + }, + { + "epoch": 0.68, + "learning_rate": 1.1956935050621433e-06, + "loss": 1.041, + "step": 22721 + }, + { + "epoch": 0.68, + "learning_rate": 1.1954854193718612e-06, + "loss": 1.0456, + "step": 22722 + }, + { + "epoch": 0.68, + "learning_rate": 1.1952773460999298e-06, + "loss": 1.0991, + "step": 22723 + }, + { + "epoch": 0.68, + "learning_rate": 1.1950692852483296e-06, + "loss": 1.066, + "step": 22724 + }, + { + "epoch": 0.68, + "learning_rate": 1.1948612368190412e-06, + "loss": 1.1817, + "step": 22725 + }, + { + "epoch": 0.68, + "learning_rate": 1.1946532008140463e-06, + "loss": 1.2335, + "step": 22726 + }, + { + "epoch": 0.68, + "learning_rate": 1.1944451772353234e-06, + "loss": 1.0917, + "step": 22727 + }, + { + "epoch": 0.68, + "learning_rate": 1.1942371660848535e-06, + "loss": 1.0294, + "step": 22728 + }, + { + "epoch": 0.68, + "learning_rate": 1.1940291673646167e-06, + "loss": 1.0955, + "step": 22729 + }, + { + "epoch": 0.68, + "learning_rate": 1.1938211810765946e-06, + "loss": 1.1788, + "step": 22730 + }, + { + "epoch": 0.68, + "learning_rate": 1.1936132072227644e-06, + "loss": 1.0948, + "step": 22731 + }, + { + "epoch": 0.68, + "learning_rate": 1.1934052458051077e-06, + "loss": 1.1132, + "step": 22732 + }, + { + "epoch": 0.68, + "learning_rate": 1.1931972968256037e-06, + "loss": 1.0948, + "step": 22733 + }, + { + "epoch": 0.68, + "learning_rate": 1.1929893602862328e-06, + "loss": 1.0032, + "step": 22734 + }, + { + "epoch": 0.68, + "learning_rate": 1.1927814361889729e-06, + "loss": 1.1658, + "step": 22735 + }, + { + "epoch": 0.68, + "learning_rate": 1.1925735245358042e-06, + "loss": 1.0764, + "step": 22736 + }, + { + "epoch": 0.68, + "learning_rate": 1.1923656253287059e-06, + "loss": 1.1717, + "step": 22737 + }, + { + "epoch": 0.68, + "learning_rate": 1.1921577385696568e-06, + "loss": 1.1375, + "step": 22738 + }, + { + "epoch": 0.69, + "learning_rate": 1.1919498642606373e-06, + "loss": 1.0782, + "step": 22739 + }, + { + "epoch": 0.69, + "learning_rate": 1.1917420024036242e-06, + "loss": 1.1255, + "step": 22740 + }, + { + "epoch": 0.69, + "learning_rate": 1.191534153000597e-06, + "loss": 1.0474, + "step": 22741 + }, + { + "epoch": 0.69, + "learning_rate": 1.1913263160535347e-06, + "loss": 1.1663, + "step": 22742 + }, + { + "epoch": 0.69, + "learning_rate": 1.1911184915644161e-06, + "loss": 1.1495, + "step": 22743 + }, + { + "epoch": 0.69, + "learning_rate": 1.1909106795352185e-06, + "loss": 1.1445, + "step": 22744 + }, + { + "epoch": 0.69, + "learning_rate": 1.1907028799679207e-06, + "loss": 1.1182, + "step": 22745 + }, + { + "epoch": 0.69, + "learning_rate": 1.190495092864501e-06, + "loss": 1.0958, + "step": 22746 + }, + { + "epoch": 0.69, + "learning_rate": 1.1902873182269373e-06, + "loss": 1.0993, + "step": 22747 + }, + { + "epoch": 0.69, + "learning_rate": 1.1900795560572084e-06, + "loss": 1.078, + "step": 22748 + }, + { + "epoch": 0.69, + "learning_rate": 1.1898718063572904e-06, + "loss": 1.1324, + "step": 22749 + }, + { + "epoch": 0.69, + "learning_rate": 1.1896640691291617e-06, + "loss": 1.2276, + "step": 22750 + }, + { + "epoch": 0.69, + "learning_rate": 1.1894563443748e-06, + "loss": 1.0733, + "step": 22751 + }, + { + "epoch": 0.69, + "learning_rate": 1.189248632096183e-06, + "loss": 1.1494, + "step": 22752 + }, + { + "epoch": 0.69, + "learning_rate": 1.1890409322952873e-06, + "loss": 1.2439, + "step": 22753 + }, + { + "epoch": 0.69, + "learning_rate": 1.188833244974091e-06, + "loss": 1.1057, + "step": 22754 + }, + { + "epoch": 0.69, + "learning_rate": 1.1886255701345704e-06, + "loss": 1.1936, + "step": 22755 + }, + { + "epoch": 0.69, + "learning_rate": 1.1884179077787036e-06, + "loss": 1.0578, + "step": 22756 + }, + { + "epoch": 0.69, + "learning_rate": 1.188210257908466e-06, + "loss": 1.1356, + "step": 22757 + }, + { + "epoch": 0.69, + "learning_rate": 1.188002620525835e-06, + "loss": 1.1982, + "step": 22758 + }, + { + "epoch": 0.69, + "learning_rate": 1.187794995632787e-06, + "loss": 0.9805, + "step": 22759 + }, + { + "epoch": 0.69, + "learning_rate": 1.1875873832312994e-06, + "loss": 1.2053, + "step": 22760 + }, + { + "epoch": 0.69, + "learning_rate": 1.1873797833233475e-06, + "loss": 1.2534, + "step": 22761 + }, + { + "epoch": 0.69, + "learning_rate": 1.1871721959109076e-06, + "loss": 1.2576, + "step": 22762 + }, + { + "epoch": 0.69, + "learning_rate": 1.186964620995956e-06, + "loss": 1.067, + "step": 22763 + }, + { + "epoch": 0.69, + "learning_rate": 1.1867570585804688e-06, + "loss": 1.1039, + "step": 22764 + }, + { + "epoch": 0.69, + "learning_rate": 1.186549508666423e-06, + "loss": 1.1456, + "step": 22765 + }, + { + "epoch": 0.69, + "learning_rate": 1.1863419712557922e-06, + "loss": 1.0478, + "step": 22766 + }, + { + "epoch": 0.69, + "learning_rate": 1.1861344463505535e-06, + "loss": 1.0858, + "step": 22767 + }, + { + "epoch": 0.69, + "learning_rate": 1.1859269339526816e-06, + "loss": 1.1856, + "step": 22768 + }, + { + "epoch": 0.69, + "learning_rate": 1.1857194340641538e-06, + "loss": 1.2029, + "step": 22769 + }, + { + "epoch": 0.69, + "learning_rate": 1.1855119466869427e-06, + "loss": 1.1698, + "step": 22770 + }, + { + "epoch": 0.69, + "learning_rate": 1.185304471823025e-06, + "loss": 1.0986, + "step": 22771 + }, + { + "epoch": 0.69, + "learning_rate": 1.1850970094743754e-06, + "loss": 1.1597, + "step": 22772 + }, + { + "epoch": 0.69, + "learning_rate": 1.18488955964297e-06, + "loss": 1.1553, + "step": 22773 + }, + { + "epoch": 0.69, + "learning_rate": 1.1846821223307816e-06, + "loss": 1.038, + "step": 22774 + }, + { + "epoch": 0.69, + "learning_rate": 1.1844746975397862e-06, + "loss": 1.1433, + "step": 22775 + }, + { + "epoch": 0.69, + "learning_rate": 1.1842672852719578e-06, + "loss": 1.0987, + "step": 22776 + }, + { + "epoch": 0.69, + "learning_rate": 1.1840598855292714e-06, + "loss": 1.0115, + "step": 22777 + }, + { + "epoch": 0.69, + "learning_rate": 1.1838524983137008e-06, + "loss": 1.1685, + "step": 22778 + }, + { + "epoch": 0.69, + "learning_rate": 1.183645123627221e-06, + "loss": 1.0822, + "step": 22779 + }, + { + "epoch": 0.69, + "learning_rate": 1.1834377614718054e-06, + "loss": 1.1786, + "step": 22780 + }, + { + "epoch": 0.69, + "learning_rate": 1.1832304118494282e-06, + "loss": 1.1385, + "step": 22781 + }, + { + "epoch": 0.69, + "learning_rate": 1.183023074762064e-06, + "loss": 1.0818, + "step": 22782 + }, + { + "epoch": 0.69, + "learning_rate": 1.1828157502116855e-06, + "loss": 1.0616, + "step": 22783 + }, + { + "epoch": 0.69, + "learning_rate": 1.1826084382002661e-06, + "loss": 1.1642, + "step": 22784 + }, + { + "epoch": 0.69, + "learning_rate": 1.18240113872978e-06, + "loss": 1.0632, + "step": 22785 + }, + { + "epoch": 0.69, + "learning_rate": 1.182193851802202e-06, + "loss": 1.1525, + "step": 22786 + }, + { + "epoch": 0.69, + "learning_rate": 1.1819865774195022e-06, + "loss": 1.1597, + "step": 22787 + }, + { + "epoch": 0.69, + "learning_rate": 1.1817793155836558e-06, + "loss": 1.1375, + "step": 22788 + }, + { + "epoch": 0.69, + "learning_rate": 1.1815720662966353e-06, + "loss": 1.1437, + "step": 22789 + }, + { + "epoch": 0.69, + "learning_rate": 1.1813648295604138e-06, + "loss": 1.0305, + "step": 22790 + }, + { + "epoch": 0.69, + "learning_rate": 1.1811576053769649e-06, + "loss": 1.0784, + "step": 22791 + }, + { + "epoch": 0.69, + "learning_rate": 1.1809503937482595e-06, + "loss": 1.0317, + "step": 22792 + }, + { + "epoch": 0.69, + "learning_rate": 1.1807431946762713e-06, + "loss": 1.1945, + "step": 22793 + }, + { + "epoch": 0.69, + "learning_rate": 1.1805360081629722e-06, + "loss": 1.1537, + "step": 22794 + }, + { + "epoch": 0.69, + "learning_rate": 1.1803288342103358e-06, + "loss": 1.0803, + "step": 22795 + }, + { + "epoch": 0.69, + "learning_rate": 1.1801216728203323e-06, + "loss": 1.0811, + "step": 22796 + }, + { + "epoch": 0.69, + "learning_rate": 1.1799145239949353e-06, + "loss": 1.1616, + "step": 22797 + }, + { + "epoch": 0.69, + "learning_rate": 1.179707387736116e-06, + "loss": 1.1398, + "step": 22798 + }, + { + "epoch": 0.69, + "learning_rate": 1.1795002640458471e-06, + "loss": 1.0967, + "step": 22799 + }, + { + "epoch": 0.69, + "learning_rate": 1.1792931529260993e-06, + "loss": 1.1126, + "step": 22800 + }, + { + "epoch": 0.69, + "learning_rate": 1.179086054378844e-06, + "loss": 1.0954, + "step": 22801 + }, + { + "epoch": 0.69, + "learning_rate": 1.1788789684060538e-06, + "loss": 1.1449, + "step": 22802 + }, + { + "epoch": 0.69, + "learning_rate": 1.1786718950096992e-06, + "loss": 1.1887, + "step": 22803 + }, + { + "epoch": 0.69, + "learning_rate": 1.178464834191752e-06, + "loss": 1.1902, + "step": 22804 + }, + { + "epoch": 0.69, + "learning_rate": 1.1782577859541833e-06, + "loss": 1.1461, + "step": 22805 + }, + { + "epoch": 0.69, + "learning_rate": 1.1780507502989635e-06, + "loss": 1.0521, + "step": 22806 + }, + { + "epoch": 0.69, + "learning_rate": 1.1778437272280641e-06, + "loss": 1.1047, + "step": 22807 + }, + { + "epoch": 0.69, + "learning_rate": 1.1776367167434566e-06, + "loss": 1.1016, + "step": 22808 + }, + { + "epoch": 0.69, + "learning_rate": 1.1774297188471096e-06, + "loss": 1.1461, + "step": 22809 + }, + { + "epoch": 0.69, + "learning_rate": 1.177222733540995e-06, + "loss": 1.0208, + "step": 22810 + }, + { + "epoch": 0.69, + "learning_rate": 1.1770157608270827e-06, + "loss": 1.1963, + "step": 22811 + }, + { + "epoch": 0.69, + "learning_rate": 1.176808800707344e-06, + "loss": 1.1604, + "step": 22812 + }, + { + "epoch": 0.69, + "learning_rate": 1.1766018531837476e-06, + "loss": 1.134, + "step": 22813 + }, + { + "epoch": 0.69, + "learning_rate": 1.1763949182582638e-06, + "loss": 1.1664, + "step": 22814 + }, + { + "epoch": 0.69, + "learning_rate": 1.1761879959328633e-06, + "loss": 1.0682, + "step": 22815 + }, + { + "epoch": 0.69, + "learning_rate": 1.1759810862095162e-06, + "loss": 1.1165, + "step": 22816 + }, + { + "epoch": 0.69, + "learning_rate": 1.1757741890901905e-06, + "loss": 1.097, + "step": 22817 + }, + { + "epoch": 0.69, + "learning_rate": 1.175567304576857e-06, + "loss": 1.0695, + "step": 22818 + }, + { + "epoch": 0.69, + "learning_rate": 1.1753604326714848e-06, + "loss": 0.9506, + "step": 22819 + }, + { + "epoch": 0.69, + "learning_rate": 1.1751535733760433e-06, + "loss": 1.1279, + "step": 22820 + }, + { + "epoch": 0.69, + "learning_rate": 1.1749467266925024e-06, + "loss": 1.0765, + "step": 22821 + }, + { + "epoch": 0.69, + "learning_rate": 1.17473989262283e-06, + "loss": 1.0156, + "step": 22822 + }, + { + "epoch": 0.69, + "learning_rate": 1.1745330711689953e-06, + "loss": 1.0015, + "step": 22823 + }, + { + "epoch": 0.69, + "learning_rate": 1.1743262623329673e-06, + "loss": 1.0552, + "step": 22824 + }, + { + "epoch": 0.69, + "learning_rate": 1.174119466116716e-06, + "loss": 1.1899, + "step": 22825 + }, + { + "epoch": 0.69, + "learning_rate": 1.1739126825222078e-06, + "loss": 1.1135, + "step": 22826 + }, + { + "epoch": 0.69, + "learning_rate": 1.1737059115514121e-06, + "loss": 1.0741, + "step": 22827 + }, + { + "epoch": 0.69, + "learning_rate": 1.1734991532062975e-06, + "loss": 1.007, + "step": 22828 + }, + { + "epoch": 0.69, + "learning_rate": 1.173292407488832e-06, + "loss": 1.1264, + "step": 22829 + }, + { + "epoch": 0.69, + "learning_rate": 1.1730856744009847e-06, + "loss": 1.0992, + "step": 22830 + }, + { + "epoch": 0.69, + "learning_rate": 1.172878953944722e-06, + "loss": 1.0482, + "step": 22831 + }, + { + "epoch": 0.69, + "learning_rate": 1.1726722461220123e-06, + "loss": 1.1371, + "step": 22832 + }, + { + "epoch": 0.69, + "learning_rate": 1.1724655509348236e-06, + "loss": 1.0203, + "step": 22833 + }, + { + "epoch": 0.69, + "learning_rate": 1.1722588683851235e-06, + "loss": 1.0729, + "step": 22834 + }, + { + "epoch": 0.69, + "learning_rate": 1.1720521984748795e-06, + "loss": 0.9952, + "step": 22835 + }, + { + "epoch": 0.69, + "learning_rate": 1.1718455412060588e-06, + "loss": 1.0952, + "step": 22836 + }, + { + "epoch": 0.69, + "learning_rate": 1.1716388965806294e-06, + "loss": 1.0676, + "step": 22837 + }, + { + "epoch": 0.69, + "learning_rate": 1.1714322646005585e-06, + "loss": 0.9958, + "step": 22838 + }, + { + "epoch": 0.69, + "learning_rate": 1.1712256452678118e-06, + "loss": 1.1155, + "step": 22839 + }, + { + "epoch": 0.69, + "learning_rate": 1.171019038584357e-06, + "loss": 1.1099, + "step": 22840 + }, + { + "epoch": 0.69, + "learning_rate": 1.1708124445521608e-06, + "loss": 1.0485, + "step": 22841 + }, + { + "epoch": 0.69, + "learning_rate": 1.170605863173191e-06, + "loss": 1.0911, + "step": 22842 + }, + { + "epoch": 0.69, + "learning_rate": 1.170399294449412e-06, + "loss": 1.1838, + "step": 22843 + }, + { + "epoch": 0.69, + "learning_rate": 1.1701927383827913e-06, + "loss": 1.1445, + "step": 22844 + }, + { + "epoch": 0.69, + "learning_rate": 1.1699861949752955e-06, + "loss": 1.0352, + "step": 22845 + }, + { + "epoch": 0.69, + "learning_rate": 1.1697796642288905e-06, + "loss": 1.1772, + "step": 22846 + }, + { + "epoch": 0.69, + "learning_rate": 1.1695731461455433e-06, + "loss": 0.9816, + "step": 22847 + }, + { + "epoch": 0.69, + "learning_rate": 1.1693666407272183e-06, + "loss": 1.1833, + "step": 22848 + }, + { + "epoch": 0.69, + "learning_rate": 1.1691601479758818e-06, + "loss": 1.1541, + "step": 22849 + }, + { + "epoch": 0.69, + "learning_rate": 1.1689536678934998e-06, + "loss": 1.1066, + "step": 22850 + }, + { + "epoch": 0.69, + "learning_rate": 1.1687472004820389e-06, + "loss": 1.1317, + "step": 22851 + }, + { + "epoch": 0.69, + "learning_rate": 1.1685407457434624e-06, + "loss": 1.0861, + "step": 22852 + }, + { + "epoch": 0.69, + "learning_rate": 1.1683343036797369e-06, + "loss": 1.1577, + "step": 22853 + }, + { + "epoch": 0.69, + "learning_rate": 1.1681278742928273e-06, + "loss": 1.0695, + "step": 22854 + }, + { + "epoch": 0.69, + "learning_rate": 1.1679214575846997e-06, + "loss": 1.1675, + "step": 22855 + }, + { + "epoch": 0.69, + "learning_rate": 1.1677150535573175e-06, + "loss": 1.1644, + "step": 22856 + }, + { + "epoch": 0.69, + "learning_rate": 1.1675086622126463e-06, + "loss": 1.1314, + "step": 22857 + }, + { + "epoch": 0.69, + "learning_rate": 1.1673022835526513e-06, + "loss": 1.0789, + "step": 22858 + }, + { + "epoch": 0.69, + "learning_rate": 1.1670959175792961e-06, + "loss": 1.0992, + "step": 22859 + }, + { + "epoch": 0.69, + "learning_rate": 1.166889564294546e-06, + "loss": 1.0263, + "step": 22860 + }, + { + "epoch": 0.69, + "learning_rate": 1.1666832237003654e-06, + "loss": 1.0505, + "step": 22861 + }, + { + "epoch": 0.69, + "learning_rate": 1.1664768957987183e-06, + "loss": 1.1785, + "step": 22862 + }, + { + "epoch": 0.69, + "learning_rate": 1.1662705805915688e-06, + "loss": 1.0811, + "step": 22863 + }, + { + "epoch": 0.69, + "learning_rate": 1.166064278080882e-06, + "loss": 1.0875, + "step": 22864 + }, + { + "epoch": 0.69, + "learning_rate": 1.16585798826862e-06, + "loss": 0.9502, + "step": 22865 + }, + { + "epoch": 0.69, + "learning_rate": 1.1656517111567472e-06, + "loss": 1.0627, + "step": 22866 + }, + { + "epoch": 0.69, + "learning_rate": 1.1654454467472277e-06, + "loss": 1.042, + "step": 22867 + }, + { + "epoch": 0.69, + "learning_rate": 1.1652391950420256e-06, + "loss": 1.2622, + "step": 22868 + }, + { + "epoch": 0.69, + "learning_rate": 1.1650329560431025e-06, + "loss": 1.14, + "step": 22869 + }, + { + "epoch": 0.69, + "learning_rate": 1.1648267297524227e-06, + "loss": 1.098, + "step": 22870 + }, + { + "epoch": 0.69, + "learning_rate": 1.1646205161719495e-06, + "loss": 1.0938, + "step": 22871 + }, + { + "epoch": 0.69, + "learning_rate": 1.1644143153036458e-06, + "loss": 1.161, + "step": 22872 + }, + { + "epoch": 0.69, + "learning_rate": 1.1642081271494756e-06, + "loss": 1.0561, + "step": 22873 + }, + { + "epoch": 0.69, + "learning_rate": 1.1640019517113999e-06, + "loss": 1.1576, + "step": 22874 + }, + { + "epoch": 0.69, + "learning_rate": 1.1637957889913817e-06, + "loss": 1.1489, + "step": 22875 + }, + { + "epoch": 0.69, + "learning_rate": 1.1635896389913846e-06, + "loss": 1.106, + "step": 22876 + }, + { + "epoch": 0.69, + "learning_rate": 1.163383501713371e-06, + "loss": 1.078, + "step": 22877 + }, + { + "epoch": 0.69, + "learning_rate": 1.1631773771593018e-06, + "loss": 1.1799, + "step": 22878 + }, + { + "epoch": 0.69, + "learning_rate": 1.1629712653311407e-06, + "loss": 1.0885, + "step": 22879 + }, + { + "epoch": 0.69, + "learning_rate": 1.1627651662308486e-06, + "loss": 1.085, + "step": 22880 + }, + { + "epoch": 0.69, + "learning_rate": 1.1625590798603892e-06, + "loss": 1.1652, + "step": 22881 + }, + { + "epoch": 0.69, + "learning_rate": 1.1623530062217226e-06, + "loss": 1.0786, + "step": 22882 + }, + { + "epoch": 0.69, + "learning_rate": 1.1621469453168109e-06, + "loss": 1.0388, + "step": 22883 + }, + { + "epoch": 0.69, + "learning_rate": 1.1619408971476157e-06, + "loss": 1.0556, + "step": 22884 + }, + { + "epoch": 0.69, + "learning_rate": 1.161734861716099e-06, + "loss": 1.187, + "step": 22885 + }, + { + "epoch": 0.69, + "learning_rate": 1.1615288390242219e-06, + "loss": 1.1633, + "step": 22886 + }, + { + "epoch": 0.69, + "learning_rate": 1.1613228290739453e-06, + "loss": 0.9442, + "step": 22887 + }, + { + "epoch": 0.69, + "learning_rate": 1.161116831867231e-06, + "loss": 1.0792, + "step": 22888 + }, + { + "epoch": 0.69, + "learning_rate": 1.1609108474060397e-06, + "loss": 1.2335, + "step": 22889 + }, + { + "epoch": 0.69, + "learning_rate": 1.1607048756923327e-06, + "loss": 1.0561, + "step": 22890 + }, + { + "epoch": 0.69, + "learning_rate": 1.1604989167280697e-06, + "loss": 1.1212, + "step": 22891 + }, + { + "epoch": 0.69, + "learning_rate": 1.1602929705152119e-06, + "loss": 1.069, + "step": 22892 + }, + { + "epoch": 0.69, + "learning_rate": 1.1600870370557195e-06, + "loss": 1.1091, + "step": 22893 + }, + { + "epoch": 0.69, + "learning_rate": 1.1598811163515545e-06, + "loss": 1.0748, + "step": 22894 + }, + { + "epoch": 0.69, + "learning_rate": 1.1596752084046748e-06, + "loss": 1.0406, + "step": 22895 + }, + { + "epoch": 0.69, + "learning_rate": 1.1594693132170412e-06, + "loss": 1.1666, + "step": 22896 + }, + { + "epoch": 0.69, + "learning_rate": 1.1592634307906146e-06, + "loss": 1.0816, + "step": 22897 + }, + { + "epoch": 0.69, + "learning_rate": 1.159057561127354e-06, + "loss": 1.2244, + "step": 22898 + }, + { + "epoch": 0.69, + "learning_rate": 1.158851704229221e-06, + "loss": 1.0737, + "step": 22899 + }, + { + "epoch": 0.69, + "learning_rate": 1.1586458600981725e-06, + "loss": 0.9539, + "step": 22900 + }, + { + "epoch": 0.69, + "learning_rate": 1.1584400287361696e-06, + "loss": 1.1066, + "step": 22901 + }, + { + "epoch": 0.69, + "learning_rate": 1.1582342101451715e-06, + "loss": 1.023, + "step": 22902 + }, + { + "epoch": 0.69, + "learning_rate": 1.1580284043271386e-06, + "loss": 1.1501, + "step": 22903 + }, + { + "epoch": 0.69, + "learning_rate": 1.1578226112840279e-06, + "loss": 1.161, + "step": 22904 + }, + { + "epoch": 0.69, + "learning_rate": 1.1576168310177992e-06, + "loss": 1.166, + "step": 22905 + }, + { + "epoch": 0.69, + "learning_rate": 1.1574110635304122e-06, + "loss": 1.2509, + "step": 22906 + }, + { + "epoch": 0.69, + "learning_rate": 1.157205308823826e-06, + "loss": 1.0634, + "step": 22907 + }, + { + "epoch": 0.69, + "learning_rate": 1.1569995668999977e-06, + "loss": 1.1476, + "step": 22908 + }, + { + "epoch": 0.69, + "learning_rate": 1.1567938377608868e-06, + "loss": 1.0925, + "step": 22909 + }, + { + "epoch": 0.69, + "learning_rate": 1.1565881214084514e-06, + "loss": 1.0896, + "step": 22910 + }, + { + "epoch": 0.69, + "learning_rate": 1.1563824178446504e-06, + "loss": 1.1472, + "step": 22911 + }, + { + "epoch": 0.69, + "learning_rate": 1.1561767270714424e-06, + "loss": 1.059, + "step": 22912 + }, + { + "epoch": 0.69, + "learning_rate": 1.1559710490907839e-06, + "loss": 1.1555, + "step": 22913 + }, + { + "epoch": 0.69, + "learning_rate": 1.1557653839046334e-06, + "loss": 1.1237, + "step": 22914 + }, + { + "epoch": 0.69, + "learning_rate": 1.1555597315149494e-06, + "loss": 1.1214, + "step": 22915 + }, + { + "epoch": 0.69, + "learning_rate": 1.1553540919236892e-06, + "loss": 1.0948, + "step": 22916 + }, + { + "epoch": 0.69, + "learning_rate": 1.1551484651328102e-06, + "loss": 1.0657, + "step": 22917 + }, + { + "epoch": 0.69, + "learning_rate": 1.1549428511442703e-06, + "loss": 1.0936, + "step": 22918 + }, + { + "epoch": 0.69, + "learning_rate": 1.1547372499600268e-06, + "loss": 1.1206, + "step": 22919 + }, + { + "epoch": 0.69, + "learning_rate": 1.1545316615820373e-06, + "loss": 1.1166, + "step": 22920 + }, + { + "epoch": 0.69, + "learning_rate": 1.154326086012258e-06, + "loss": 1.1169, + "step": 22921 + }, + { + "epoch": 0.69, + "learning_rate": 1.1541205232526457e-06, + "loss": 1.1953, + "step": 22922 + }, + { + "epoch": 0.69, + "learning_rate": 1.153914973305158e-06, + "loss": 1.2251, + "step": 22923 + }, + { + "epoch": 0.69, + "learning_rate": 1.1537094361717516e-06, + "loss": 1.0798, + "step": 22924 + }, + { + "epoch": 0.69, + "learning_rate": 1.1535039118543839e-06, + "loss": 1.1884, + "step": 22925 + }, + { + "epoch": 0.69, + "learning_rate": 1.1532984003550092e-06, + "loss": 1.0313, + "step": 22926 + }, + { + "epoch": 0.69, + "learning_rate": 1.1530929016755856e-06, + "loss": 1.1276, + "step": 22927 + }, + { + "epoch": 0.69, + "learning_rate": 1.1528874158180689e-06, + "loss": 1.1467, + "step": 22928 + }, + { + "epoch": 0.69, + "learning_rate": 1.1526819427844157e-06, + "loss": 1.2216, + "step": 22929 + }, + { + "epoch": 0.69, + "learning_rate": 1.1524764825765808e-06, + "loss": 1.0931, + "step": 22930 + }, + { + "epoch": 0.69, + "learning_rate": 1.1522710351965208e-06, + "loss": 1.1932, + "step": 22931 + }, + { + "epoch": 0.69, + "learning_rate": 1.1520656006461916e-06, + "loss": 1.1066, + "step": 22932 + }, + { + "epoch": 0.69, + "learning_rate": 1.1518601789275495e-06, + "loss": 1.1347, + "step": 22933 + }, + { + "epoch": 0.69, + "learning_rate": 1.1516547700425481e-06, + "loss": 1.196, + "step": 22934 + }, + { + "epoch": 0.69, + "learning_rate": 1.1514493739931442e-06, + "loss": 0.9997, + "step": 22935 + }, + { + "epoch": 0.69, + "learning_rate": 1.1512439907812928e-06, + "loss": 1.1879, + "step": 22936 + }, + { + "epoch": 0.69, + "learning_rate": 1.1510386204089488e-06, + "loss": 1.2079, + "step": 22937 + }, + { + "epoch": 0.69, + "learning_rate": 1.1508332628780683e-06, + "loss": 1.2489, + "step": 22938 + }, + { + "epoch": 0.69, + "learning_rate": 1.1506279181906047e-06, + "loss": 1.1155, + "step": 22939 + }, + { + "epoch": 0.69, + "learning_rate": 1.1504225863485132e-06, + "loss": 1.0795, + "step": 22940 + }, + { + "epoch": 0.69, + "learning_rate": 1.150217267353749e-06, + "loss": 1.1756, + "step": 22941 + }, + { + "epoch": 0.69, + "learning_rate": 1.150011961208266e-06, + "loss": 1.2043, + "step": 22942 + }, + { + "epoch": 0.69, + "learning_rate": 1.149806667914019e-06, + "loss": 1.0837, + "step": 22943 + }, + { + "epoch": 0.69, + "learning_rate": 1.1496013874729625e-06, + "loss": 1.1207, + "step": 22944 + }, + { + "epoch": 0.69, + "learning_rate": 1.1493961198870503e-06, + "loss": 1.0466, + "step": 22945 + }, + { + "epoch": 0.69, + "learning_rate": 1.1491908651582376e-06, + "loss": 1.1177, + "step": 22946 + }, + { + "epoch": 0.69, + "learning_rate": 1.148985623288476e-06, + "loss": 1.103, + "step": 22947 + }, + { + "epoch": 0.69, + "learning_rate": 1.148780394279721e-06, + "loss": 1.2353, + "step": 22948 + }, + { + "epoch": 0.69, + "learning_rate": 1.1485751781339255e-06, + "loss": 1.1874, + "step": 22949 + }, + { + "epoch": 0.69, + "learning_rate": 1.148369974853044e-06, + "loss": 1.1366, + "step": 22950 + }, + { + "epoch": 0.69, + "learning_rate": 1.1481647844390297e-06, + "loss": 0.9914, + "step": 22951 + }, + { + "epoch": 0.69, + "learning_rate": 1.1479596068938348e-06, + "loss": 1.081, + "step": 22952 + }, + { + "epoch": 0.69, + "learning_rate": 1.1477544422194135e-06, + "loss": 1.0642, + "step": 22953 + }, + { + "epoch": 0.69, + "learning_rate": 1.1475492904177184e-06, + "loss": 1.0871, + "step": 22954 + }, + { + "epoch": 0.69, + "learning_rate": 1.1473441514907037e-06, + "loss": 1.0704, + "step": 22955 + }, + { + "epoch": 0.69, + "learning_rate": 1.1471390254403205e-06, + "loss": 1.1575, + "step": 22956 + }, + { + "epoch": 0.69, + "learning_rate": 1.146933912268522e-06, + "loss": 1.1195, + "step": 22957 + }, + { + "epoch": 0.69, + "learning_rate": 1.146728811977261e-06, + "loss": 1.0294, + "step": 22958 + }, + { + "epoch": 0.69, + "learning_rate": 1.146523724568491e-06, + "loss": 1.0947, + "step": 22959 + }, + { + "epoch": 0.69, + "learning_rate": 1.1463186500441622e-06, + "loss": 1.1874, + "step": 22960 + }, + { + "epoch": 0.69, + "learning_rate": 1.146113588406228e-06, + "loss": 1.1481, + "step": 22961 + }, + { + "epoch": 0.69, + "learning_rate": 1.1459085396566406e-06, + "loss": 1.046, + "step": 22962 + }, + { + "epoch": 0.69, + "learning_rate": 1.1457035037973513e-06, + "loss": 1.2051, + "step": 22963 + }, + { + "epoch": 0.69, + "learning_rate": 1.1454984808303134e-06, + "loss": 1.0955, + "step": 22964 + }, + { + "epoch": 0.69, + "learning_rate": 1.1452934707574769e-06, + "loss": 1.0308, + "step": 22965 + }, + { + "epoch": 0.69, + "learning_rate": 1.145088473580794e-06, + "loss": 1.1433, + "step": 22966 + }, + { + "epoch": 0.69, + "learning_rate": 1.1448834893022165e-06, + "loss": 1.0662, + "step": 22967 + }, + { + "epoch": 0.69, + "learning_rate": 1.1446785179236953e-06, + "loss": 0.9879, + "step": 22968 + }, + { + "epoch": 0.69, + "learning_rate": 1.1444735594471816e-06, + "loss": 1.0497, + "step": 22969 + }, + { + "epoch": 0.69, + "learning_rate": 1.1442686138746273e-06, + "loss": 1.1567, + "step": 22970 + }, + { + "epoch": 0.69, + "learning_rate": 1.1440636812079824e-06, + "loss": 1.0672, + "step": 22971 + }, + { + "epoch": 0.69, + "learning_rate": 1.1438587614491998e-06, + "loss": 1.1052, + "step": 22972 + }, + { + "epoch": 0.69, + "learning_rate": 1.143653854600227e-06, + "loss": 1.0743, + "step": 22973 + }, + { + "epoch": 0.69, + "learning_rate": 1.1434489606630166e-06, + "loss": 1.1331, + "step": 22974 + }, + { + "epoch": 0.69, + "learning_rate": 1.1432440796395188e-06, + "loss": 1.1921, + "step": 22975 + }, + { + "epoch": 0.69, + "learning_rate": 1.1430392115316838e-06, + "loss": 1.1365, + "step": 22976 + }, + { + "epoch": 0.69, + "learning_rate": 1.142834356341463e-06, + "loss": 1.0661, + "step": 22977 + }, + { + "epoch": 0.69, + "learning_rate": 1.1426295140708043e-06, + "loss": 1.0911, + "step": 22978 + }, + { + "epoch": 0.69, + "learning_rate": 1.1424246847216594e-06, + "loss": 1.1481, + "step": 22979 + }, + { + "epoch": 0.69, + "learning_rate": 1.1422198682959774e-06, + "loss": 1.1467, + "step": 22980 + }, + { + "epoch": 0.69, + "learning_rate": 1.142015064795709e-06, + "loss": 1.2308, + "step": 22981 + }, + { + "epoch": 0.69, + "learning_rate": 1.1418102742228027e-06, + "loss": 1.034, + "step": 22982 + }, + { + "epoch": 0.69, + "learning_rate": 1.1416054965792082e-06, + "loss": 1.006, + "step": 22983 + }, + { + "epoch": 0.69, + "learning_rate": 1.141400731866875e-06, + "loss": 1.1009, + "step": 22984 + }, + { + "epoch": 0.69, + "learning_rate": 1.1411959800877537e-06, + "loss": 1.1344, + "step": 22985 + }, + { + "epoch": 0.69, + "learning_rate": 1.1409912412437912e-06, + "loss": 1.1, + "step": 22986 + }, + { + "epoch": 0.69, + "learning_rate": 1.1407865153369375e-06, + "loss": 1.1772, + "step": 22987 + }, + { + "epoch": 0.69, + "learning_rate": 1.1405818023691418e-06, + "loss": 1.1681, + "step": 22988 + }, + { + "epoch": 0.69, + "learning_rate": 1.1403771023423532e-06, + "loss": 1.177, + "step": 22989 + }, + { + "epoch": 0.69, + "learning_rate": 1.1401724152585192e-06, + "loss": 1.0966, + "step": 22990 + }, + { + "epoch": 0.69, + "learning_rate": 1.1399677411195886e-06, + "loss": 1.0953, + "step": 22991 + }, + { + "epoch": 0.69, + "learning_rate": 1.1397630799275103e-06, + "loss": 1.0842, + "step": 22992 + }, + { + "epoch": 0.69, + "learning_rate": 1.1395584316842323e-06, + "loss": 1.0497, + "step": 22993 + }, + { + "epoch": 0.69, + "learning_rate": 1.1393537963917025e-06, + "loss": 1.1013, + "step": 22994 + }, + { + "epoch": 0.69, + "learning_rate": 1.1391491740518707e-06, + "loss": 0.9703, + "step": 22995 + }, + { + "epoch": 0.69, + "learning_rate": 1.1389445646666822e-06, + "loss": 1.0293, + "step": 22996 + }, + { + "epoch": 0.69, + "learning_rate": 1.1387399682380859e-06, + "loss": 1.0226, + "step": 22997 + }, + { + "epoch": 0.69, + "learning_rate": 1.1385353847680294e-06, + "loss": 1.2046, + "step": 22998 + }, + { + "epoch": 0.69, + "learning_rate": 1.1383308142584606e-06, + "loss": 1.1976, + "step": 22999 + }, + { + "epoch": 0.69, + "learning_rate": 1.1381262567113265e-06, + "loss": 1.1415, + "step": 23000 + }, + { + "epoch": 0.69, + "learning_rate": 1.1379217121285747e-06, + "loss": 1.1353, + "step": 23001 + }, + { + "epoch": 0.69, + "learning_rate": 1.137717180512153e-06, + "loss": 1.155, + "step": 23002 + }, + { + "epoch": 0.69, + "learning_rate": 1.1375126618640064e-06, + "loss": 1.0698, + "step": 23003 + }, + { + "epoch": 0.69, + "learning_rate": 1.1373081561860834e-06, + "loss": 1.164, + "step": 23004 + }, + { + "epoch": 0.69, + "learning_rate": 1.1371036634803307e-06, + "loss": 1.0325, + "step": 23005 + }, + { + "epoch": 0.69, + "learning_rate": 1.1368991837486943e-06, + "loss": 0.8745, + "step": 23006 + }, + { + "epoch": 0.69, + "learning_rate": 1.1366947169931222e-06, + "loss": 1.0761, + "step": 23007 + }, + { + "epoch": 0.69, + "learning_rate": 1.1364902632155589e-06, + "loss": 1.0606, + "step": 23008 + }, + { + "epoch": 0.69, + "learning_rate": 1.1362858224179515e-06, + "loss": 1.1002, + "step": 23009 + }, + { + "epoch": 0.69, + "learning_rate": 1.1360813946022466e-06, + "loss": 1.1667, + "step": 23010 + }, + { + "epoch": 0.69, + "learning_rate": 1.1358769797703905e-06, + "loss": 1.1119, + "step": 23011 + }, + { + "epoch": 0.69, + "learning_rate": 1.135672577924328e-06, + "loss": 1.0714, + "step": 23012 + }, + { + "epoch": 0.69, + "learning_rate": 1.1354681890660051e-06, + "loss": 1.2311, + "step": 23013 + }, + { + "epoch": 0.69, + "learning_rate": 1.135263813197368e-06, + "loss": 1.1195, + "step": 23014 + }, + { + "epoch": 0.69, + "learning_rate": 1.1350594503203633e-06, + "loss": 1.0573, + "step": 23015 + }, + { + "epoch": 0.69, + "learning_rate": 1.134855100436934e-06, + "loss": 1.022, + "step": 23016 + }, + { + "epoch": 0.69, + "learning_rate": 1.134650763549027e-06, + "loss": 1.1255, + "step": 23017 + }, + { + "epoch": 0.69, + "learning_rate": 1.1344464396585869e-06, + "loss": 1.1968, + "step": 23018 + }, + { + "epoch": 0.69, + "learning_rate": 1.134242128767559e-06, + "loss": 1.1351, + "step": 23019 + }, + { + "epoch": 0.69, + "learning_rate": 1.1340378308778894e-06, + "loss": 1.0957, + "step": 23020 + }, + { + "epoch": 0.69, + "learning_rate": 1.1338335459915205e-06, + "loss": 1.0001, + "step": 23021 + }, + { + "epoch": 0.69, + "learning_rate": 1.1336292741103986e-06, + "loss": 1.0195, + "step": 23022 + }, + { + "epoch": 0.69, + "learning_rate": 1.133425015236468e-06, + "loss": 1.0854, + "step": 23023 + }, + { + "epoch": 0.69, + "learning_rate": 1.1332207693716728e-06, + "loss": 1.2017, + "step": 23024 + }, + { + "epoch": 0.69, + "learning_rate": 1.1330165365179577e-06, + "loss": 1.2117, + "step": 23025 + }, + { + "epoch": 0.69, + "learning_rate": 1.132812316677267e-06, + "loss": 1.1221, + "step": 23026 + }, + { + "epoch": 0.69, + "learning_rate": 1.1326081098515443e-06, + "loss": 1.0789, + "step": 23027 + }, + { + "epoch": 0.69, + "learning_rate": 1.132403916042735e-06, + "loss": 1.0762, + "step": 23028 + }, + { + "epoch": 0.69, + "learning_rate": 1.1321997352527806e-06, + "loss": 1.2052, + "step": 23029 + }, + { + "epoch": 0.69, + "learning_rate": 1.1319955674836262e-06, + "loss": 1.2523, + "step": 23030 + }, + { + "epoch": 0.69, + "learning_rate": 1.131791412737215e-06, + "loss": 1.1703, + "step": 23031 + }, + { + "epoch": 0.69, + "learning_rate": 1.1315872710154907e-06, + "loss": 1.139, + "step": 23032 + }, + { + "epoch": 0.69, + "learning_rate": 1.1313831423203975e-06, + "loss": 1.1622, + "step": 23033 + }, + { + "epoch": 0.69, + "learning_rate": 1.1311790266538764e-06, + "loss": 1.1841, + "step": 23034 + }, + { + "epoch": 0.69, + "learning_rate": 1.130974924017872e-06, + "loss": 1.1314, + "step": 23035 + }, + { + "epoch": 0.69, + "learning_rate": 1.130770834414327e-06, + "loss": 1.1492, + "step": 23036 + }, + { + "epoch": 0.69, + "learning_rate": 1.1305667578451848e-06, + "loss": 1.0465, + "step": 23037 + }, + { + "epoch": 0.69, + "learning_rate": 1.1303626943123868e-06, + "loss": 1.2209, + "step": 23038 + }, + { + "epoch": 0.69, + "learning_rate": 1.1301586438178766e-06, + "loss": 1.035, + "step": 23039 + }, + { + "epoch": 0.69, + "learning_rate": 1.1299546063635962e-06, + "loss": 1.1209, + "step": 23040 + }, + { + "epoch": 0.69, + "learning_rate": 1.1297505819514886e-06, + "loss": 1.0679, + "step": 23041 + }, + { + "epoch": 0.69, + "learning_rate": 1.129546570583495e-06, + "loss": 1.1448, + "step": 23042 + }, + { + "epoch": 0.69, + "learning_rate": 1.129342572261558e-06, + "loss": 1.1782, + "step": 23043 + }, + { + "epoch": 0.69, + "learning_rate": 1.1291385869876198e-06, + "loss": 0.9553, + "step": 23044 + }, + { + "epoch": 0.69, + "learning_rate": 1.1289346147636215e-06, + "loss": 1.0898, + "step": 23045 + }, + { + "epoch": 0.69, + "learning_rate": 1.1287306555915068e-06, + "loss": 1.1477, + "step": 23046 + }, + { + "epoch": 0.69, + "learning_rate": 1.1285267094732143e-06, + "loss": 1.0404, + "step": 23047 + }, + { + "epoch": 0.69, + "learning_rate": 1.1283227764106876e-06, + "loss": 1.1172, + "step": 23048 + }, + { + "epoch": 0.69, + "learning_rate": 1.1281188564058673e-06, + "loss": 1.0636, + "step": 23049 + }, + { + "epoch": 0.69, + "learning_rate": 1.1279149494606944e-06, + "loss": 1.254, + "step": 23050 + }, + { + "epoch": 0.69, + "learning_rate": 1.1277110555771109e-06, + "loss": 0.9812, + "step": 23051 + }, + { + "epoch": 0.69, + "learning_rate": 1.1275071747570569e-06, + "loss": 1.0583, + "step": 23052 + }, + { + "epoch": 0.69, + "learning_rate": 1.1273033070024736e-06, + "loss": 1.0503, + "step": 23053 + }, + { + "epoch": 0.69, + "learning_rate": 1.1270994523153026e-06, + "loss": 1.1813, + "step": 23054 + }, + { + "epoch": 0.69, + "learning_rate": 1.1268956106974828e-06, + "loss": 1.0862, + "step": 23055 + }, + { + "epoch": 0.69, + "learning_rate": 1.1266917821509555e-06, + "loss": 1.3093, + "step": 23056 + }, + { + "epoch": 0.69, + "learning_rate": 1.126487966677661e-06, + "loss": 1.0377, + "step": 23057 + }, + { + "epoch": 0.69, + "learning_rate": 1.1262841642795394e-06, + "loss": 1.0746, + "step": 23058 + }, + { + "epoch": 0.69, + "learning_rate": 1.126080374958532e-06, + "loss": 1.0325, + "step": 23059 + }, + { + "epoch": 0.69, + "learning_rate": 1.1258765987165769e-06, + "loss": 1.2069, + "step": 23060 + }, + { + "epoch": 0.69, + "learning_rate": 1.1256728355556146e-06, + "loss": 1.0402, + "step": 23061 + }, + { + "epoch": 0.69, + "learning_rate": 1.125469085477585e-06, + "loss": 1.2758, + "step": 23062 + }, + { + "epoch": 0.69, + "learning_rate": 1.1252653484844287e-06, + "loss": 1.1415, + "step": 23063 + }, + { + "epoch": 0.69, + "learning_rate": 1.1250616245780832e-06, + "loss": 1.0547, + "step": 23064 + }, + { + "epoch": 0.69, + "learning_rate": 1.124857913760489e-06, + "loss": 1.0571, + "step": 23065 + }, + { + "epoch": 0.69, + "learning_rate": 1.124654216033585e-06, + "loss": 1.1682, + "step": 23066 + }, + { + "epoch": 0.69, + "learning_rate": 1.1244505313993115e-06, + "loss": 1.117, + "step": 23067 + }, + { + "epoch": 0.69, + "learning_rate": 1.1242468598596055e-06, + "loss": 1.2853, + "step": 23068 + }, + { + "epoch": 0.69, + "learning_rate": 1.1240432014164068e-06, + "loss": 1.1484, + "step": 23069 + }, + { + "epoch": 0.69, + "learning_rate": 1.1238395560716542e-06, + "loss": 1.0284, + "step": 23070 + }, + { + "epoch": 0.7, + "learning_rate": 1.1236359238272862e-06, + "loss": 1.0204, + "step": 23071 + }, + { + "epoch": 0.7, + "learning_rate": 1.1234323046852422e-06, + "loss": 1.0153, + "step": 23072 + }, + { + "epoch": 0.7, + "learning_rate": 1.1232286986474589e-06, + "loss": 1.0853, + "step": 23073 + }, + { + "epoch": 0.7, + "learning_rate": 1.123025105715875e-06, + "loss": 1.1029, + "step": 23074 + }, + { + "epoch": 0.7, + "learning_rate": 1.1228215258924294e-06, + "loss": 1.1163, + "step": 23075 + }, + { + "epoch": 0.7, + "learning_rate": 1.1226179591790593e-06, + "loss": 1.0836, + "step": 23076 + }, + { + "epoch": 0.7, + "learning_rate": 1.1224144055777037e-06, + "loss": 1.1028, + "step": 23077 + }, + { + "epoch": 0.7, + "learning_rate": 1.1222108650902987e-06, + "loss": 1.0689, + "step": 23078 + }, + { + "epoch": 0.7, + "learning_rate": 1.1220073377187827e-06, + "loss": 1.0294, + "step": 23079 + }, + { + "epoch": 0.7, + "learning_rate": 1.1218038234650933e-06, + "loss": 1.101, + "step": 23080 + }, + { + "epoch": 0.7, + "learning_rate": 1.1216003223311675e-06, + "loss": 1.0278, + "step": 23081 + }, + { + "epoch": 0.7, + "learning_rate": 1.1213968343189428e-06, + "loss": 1.2098, + "step": 23082 + }, + { + "epoch": 0.7, + "learning_rate": 1.1211933594303564e-06, + "loss": 1.0721, + "step": 23083 + }, + { + "epoch": 0.7, + "learning_rate": 1.120989897667345e-06, + "loss": 1.0491, + "step": 23084 + }, + { + "epoch": 0.7, + "learning_rate": 1.1207864490318467e-06, + "loss": 1.0632, + "step": 23085 + }, + { + "epoch": 0.7, + "learning_rate": 1.1205830135257961e-06, + "loss": 1.2452, + "step": 23086 + }, + { + "epoch": 0.7, + "learning_rate": 1.120379591151131e-06, + "loss": 1.0984, + "step": 23087 + }, + { + "epoch": 0.7, + "learning_rate": 1.120176181909788e-06, + "loss": 1.0287, + "step": 23088 + }, + { + "epoch": 0.7, + "learning_rate": 1.1199727858037035e-06, + "loss": 1.0284, + "step": 23089 + }, + { + "epoch": 0.7, + "learning_rate": 1.119769402834813e-06, + "loss": 0.9761, + "step": 23090 + }, + { + "epoch": 0.7, + "learning_rate": 1.119566033005053e-06, + "loss": 1.0588, + "step": 23091 + }, + { + "epoch": 0.7, + "learning_rate": 1.1193626763163593e-06, + "loss": 1.088, + "step": 23092 + }, + { + "epoch": 0.7, + "learning_rate": 1.119159332770669e-06, + "loss": 1.1542, + "step": 23093 + }, + { + "epoch": 0.7, + "learning_rate": 1.1189560023699159e-06, + "loss": 1.1822, + "step": 23094 + }, + { + "epoch": 0.7, + "learning_rate": 1.1187526851160365e-06, + "loss": 0.9824, + "step": 23095 + }, + { + "epoch": 0.7, + "learning_rate": 1.1185493810109664e-06, + "loss": 1.1064, + "step": 23096 + }, + { + "epoch": 0.7, + "learning_rate": 1.1183460900566407e-06, + "loss": 1.0474, + "step": 23097 + }, + { + "epoch": 0.7, + "learning_rate": 1.118142812254996e-06, + "loss": 1.1362, + "step": 23098 + }, + { + "epoch": 0.7, + "learning_rate": 1.117939547607965e-06, + "loss": 1.1454, + "step": 23099 + }, + { + "epoch": 0.7, + "learning_rate": 1.117736296117484e-06, + "loss": 1.1829, + "step": 23100 + }, + { + "epoch": 0.7, + "learning_rate": 1.1175330577854876e-06, + "loss": 1.061, + "step": 23101 + }, + { + "epoch": 0.7, + "learning_rate": 1.1173298326139118e-06, + "loss": 1.0728, + "step": 23102 + }, + { + "epoch": 0.7, + "learning_rate": 1.117126620604689e-06, + "loss": 1.0634, + "step": 23103 + }, + { + "epoch": 0.7, + "learning_rate": 1.1169234217597549e-06, + "loss": 1.072, + "step": 23104 + }, + { + "epoch": 0.7, + "learning_rate": 1.1167202360810437e-06, + "loss": 1.1802, + "step": 23105 + }, + { + "epoch": 0.7, + "learning_rate": 1.1165170635704894e-06, + "loss": 1.0425, + "step": 23106 + }, + { + "epoch": 0.7, + "learning_rate": 1.1163139042300267e-06, + "loss": 0.9874, + "step": 23107 + }, + { + "epoch": 0.7, + "learning_rate": 1.1161107580615887e-06, + "loss": 1.0184, + "step": 23108 + }, + { + "epoch": 0.7, + "learning_rate": 1.1159076250671102e-06, + "loss": 1.0765, + "step": 23109 + }, + { + "epoch": 0.7, + "learning_rate": 1.1157045052485247e-06, + "loss": 1.1082, + "step": 23110 + }, + { + "epoch": 0.7, + "learning_rate": 1.1155013986077662e-06, + "loss": 1.085, + "step": 23111 + }, + { + "epoch": 0.7, + "learning_rate": 1.1152983051467667e-06, + "loss": 1.1938, + "step": 23112 + }, + { + "epoch": 0.7, + "learning_rate": 1.1150952248674604e-06, + "loss": 1.1004, + "step": 23113 + }, + { + "epoch": 0.7, + "learning_rate": 1.1148921577717806e-06, + "loss": 1.1223, + "step": 23114 + }, + { + "epoch": 0.7, + "learning_rate": 1.1146891038616615e-06, + "loss": 1.0513, + "step": 23115 + }, + { + "epoch": 0.7, + "learning_rate": 1.1144860631390337e-06, + "loss": 1.0989, + "step": 23116 + }, + { + "epoch": 0.7, + "learning_rate": 1.1142830356058315e-06, + "loss": 1.0717, + "step": 23117 + }, + { + "epoch": 0.7, + "learning_rate": 1.1140800212639875e-06, + "loss": 1.0792, + "step": 23118 + }, + { + "epoch": 0.7, + "learning_rate": 1.1138770201154348e-06, + "loss": 1.2072, + "step": 23119 + }, + { + "epoch": 0.7, + "learning_rate": 1.1136740321621046e-06, + "loss": 1.0024, + "step": 23120 + }, + { + "epoch": 0.7, + "learning_rate": 1.11347105740593e-06, + "loss": 1.1379, + "step": 23121 + }, + { + "epoch": 0.7, + "learning_rate": 1.1132680958488428e-06, + "loss": 1.0991, + "step": 23122 + }, + { + "epoch": 0.7, + "learning_rate": 1.113065147492776e-06, + "loss": 1.127, + "step": 23123 + }, + { + "epoch": 0.7, + "learning_rate": 1.1128622123396616e-06, + "loss": 1.0203, + "step": 23124 + }, + { + "epoch": 0.7, + "learning_rate": 1.1126592903914299e-06, + "loss": 1.0831, + "step": 23125 + }, + { + "epoch": 0.7, + "learning_rate": 1.1124563816500137e-06, + "loss": 1.1544, + "step": 23126 + }, + { + "epoch": 0.7, + "learning_rate": 1.1122534861173445e-06, + "loss": 1.0595, + "step": 23127 + }, + { + "epoch": 0.7, + "learning_rate": 1.1120506037953546e-06, + "loss": 1.151, + "step": 23128 + }, + { + "epoch": 0.7, + "learning_rate": 1.1118477346859737e-06, + "loss": 1.0624, + "step": 23129 + }, + { + "epoch": 0.7, + "learning_rate": 1.1116448787911339e-06, + "loss": 1.1458, + "step": 23130 + }, + { + "epoch": 0.7, + "learning_rate": 1.111442036112766e-06, + "loss": 1.0674, + "step": 23131 + }, + { + "epoch": 0.7, + "learning_rate": 1.111239206652801e-06, + "loss": 1.0565, + "step": 23132 + }, + { + "epoch": 0.7, + "learning_rate": 1.11103639041317e-06, + "loss": 1.0894, + "step": 23133 + }, + { + "epoch": 0.7, + "learning_rate": 1.110833587395804e-06, + "loss": 0.9564, + "step": 23134 + }, + { + "epoch": 0.7, + "learning_rate": 1.1106307976026328e-06, + "loss": 1.0522, + "step": 23135 + }, + { + "epoch": 0.7, + "learning_rate": 1.1104280210355871e-06, + "loss": 1.2006, + "step": 23136 + }, + { + "epoch": 0.7, + "learning_rate": 1.1102252576965988e-06, + "loss": 1.0871, + "step": 23137 + }, + { + "epoch": 0.7, + "learning_rate": 1.1100225075875956e-06, + "loss": 1.1307, + "step": 23138 + }, + { + "epoch": 0.7, + "learning_rate": 1.1098197707105087e-06, + "loss": 1.1278, + "step": 23139 + }, + { + "epoch": 0.7, + "learning_rate": 1.109617047067268e-06, + "loss": 0.9947, + "step": 23140 + }, + { + "epoch": 0.7, + "learning_rate": 1.1094143366598042e-06, + "loss": 1.0858, + "step": 23141 + }, + { + "epoch": 0.7, + "learning_rate": 1.1092116394900457e-06, + "loss": 1.1146, + "step": 23142 + }, + { + "epoch": 0.7, + "learning_rate": 1.109008955559922e-06, + "loss": 1.1772, + "step": 23143 + }, + { + "epoch": 0.7, + "learning_rate": 1.1088062848713636e-06, + "loss": 1.0555, + "step": 23144 + }, + { + "epoch": 0.7, + "learning_rate": 1.1086036274262998e-06, + "loss": 1.1117, + "step": 23145 + }, + { + "epoch": 0.7, + "learning_rate": 1.1084009832266587e-06, + "loss": 1.0289, + "step": 23146 + }, + { + "epoch": 0.7, + "learning_rate": 1.10819835227437e-06, + "loss": 1.1471, + "step": 23147 + }, + { + "epoch": 0.7, + "learning_rate": 1.1079957345713627e-06, + "loss": 1.0048, + "step": 23148 + }, + { + "epoch": 0.7, + "learning_rate": 1.1077931301195658e-06, + "loss": 1.1194, + "step": 23149 + }, + { + "epoch": 0.7, + "learning_rate": 1.1075905389209082e-06, + "loss": 1.1056, + "step": 23150 + }, + { + "epoch": 0.7, + "learning_rate": 1.1073879609773175e-06, + "loss": 1.1258, + "step": 23151 + }, + { + "epoch": 0.7, + "learning_rate": 1.1071853962907226e-06, + "loss": 1.1428, + "step": 23152 + }, + { + "epoch": 0.7, + "learning_rate": 1.106982844863052e-06, + "loss": 1.0398, + "step": 23153 + }, + { + "epoch": 0.7, + "learning_rate": 1.1067803066962347e-06, + "loss": 1.022, + "step": 23154 + }, + { + "epoch": 0.7, + "learning_rate": 1.106577781792197e-06, + "loss": 1.1111, + "step": 23155 + }, + { + "epoch": 0.7, + "learning_rate": 1.1063752701528676e-06, + "loss": 1.05, + "step": 23156 + }, + { + "epoch": 0.7, + "learning_rate": 1.1061727717801746e-06, + "loss": 1.0698, + "step": 23157 + }, + { + "epoch": 0.7, + "learning_rate": 1.1059702866760452e-06, + "loss": 1.0977, + "step": 23158 + }, + { + "epoch": 0.7, + "learning_rate": 1.1057678148424086e-06, + "loss": 1.069, + "step": 23159 + }, + { + "epoch": 0.7, + "learning_rate": 1.1055653562811897e-06, + "loss": 0.9819, + "step": 23160 + }, + { + "epoch": 0.7, + "learning_rate": 1.1053629109943173e-06, + "loss": 1.1203, + "step": 23161 + }, + { + "epoch": 0.7, + "learning_rate": 1.105160478983718e-06, + "loss": 1.0517, + "step": 23162 + }, + { + "epoch": 0.7, + "learning_rate": 1.1049580602513192e-06, + "loss": 1.0976, + "step": 23163 + }, + { + "epoch": 0.7, + "learning_rate": 1.1047556547990482e-06, + "loss": 1.085, + "step": 23164 + }, + { + "epoch": 0.7, + "learning_rate": 1.104553262628831e-06, + "loss": 1.0063, + "step": 23165 + }, + { + "epoch": 0.7, + "learning_rate": 1.1043508837425948e-06, + "loss": 1.0366, + "step": 23166 + }, + { + "epoch": 0.7, + "learning_rate": 1.104148518142267e-06, + "loss": 0.9575, + "step": 23167 + }, + { + "epoch": 0.7, + "learning_rate": 1.103946165829772e-06, + "loss": 1.2103, + "step": 23168 + }, + { + "epoch": 0.7, + "learning_rate": 1.1037438268070372e-06, + "loss": 1.1337, + "step": 23169 + }, + { + "epoch": 0.7, + "learning_rate": 1.1035415010759886e-06, + "loss": 1.1536, + "step": 23170 + }, + { + "epoch": 0.7, + "learning_rate": 1.1033391886385533e-06, + "loss": 1.0427, + "step": 23171 + }, + { + "epoch": 0.7, + "learning_rate": 1.1031368894966554e-06, + "loss": 1.0988, + "step": 23172 + }, + { + "epoch": 0.7, + "learning_rate": 1.1029346036522214e-06, + "loss": 1.0406, + "step": 23173 + }, + { + "epoch": 0.7, + "learning_rate": 1.1027323311071775e-06, + "loss": 1.1959, + "step": 23174 + }, + { + "epoch": 0.7, + "learning_rate": 1.1025300718634497e-06, + "loss": 1.1653, + "step": 23175 + }, + { + "epoch": 0.7, + "learning_rate": 1.1023278259229615e-06, + "loss": 1.1497, + "step": 23176 + }, + { + "epoch": 0.7, + "learning_rate": 1.1021255932876392e-06, + "loss": 1.1265, + "step": 23177 + }, + { + "epoch": 0.7, + "learning_rate": 1.1019233739594081e-06, + "loss": 1.0702, + "step": 23178 + }, + { + "epoch": 0.7, + "learning_rate": 1.1017211679401932e-06, + "loss": 1.061, + "step": 23179 + }, + { + "epoch": 0.7, + "learning_rate": 1.10151897523192e-06, + "loss": 1.1485, + "step": 23180 + }, + { + "epoch": 0.7, + "learning_rate": 1.101316795836512e-06, + "loss": 1.1893, + "step": 23181 + }, + { + "epoch": 0.7, + "learning_rate": 1.1011146297558945e-06, + "loss": 1.0677, + "step": 23182 + }, + { + "epoch": 0.7, + "learning_rate": 1.100912476991992e-06, + "loss": 1.1249, + "step": 23183 + }, + { + "epoch": 0.7, + "learning_rate": 1.1007103375467293e-06, + "loss": 1.0903, + "step": 23184 + }, + { + "epoch": 0.7, + "learning_rate": 1.1005082114220296e-06, + "loss": 1.052, + "step": 23185 + }, + { + "epoch": 0.7, + "learning_rate": 1.100306098619818e-06, + "loss": 1.1368, + "step": 23186 + }, + { + "epoch": 0.7, + "learning_rate": 1.100103999142018e-06, + "loss": 1.2662, + "step": 23187 + }, + { + "epoch": 0.7, + "learning_rate": 1.0999019129905538e-06, + "loss": 1.132, + "step": 23188 + }, + { + "epoch": 0.7, + "learning_rate": 1.0996998401673492e-06, + "loss": 1.0578, + "step": 23189 + }, + { + "epoch": 0.7, + "learning_rate": 1.0994977806743276e-06, + "loss": 1.0809, + "step": 23190 + }, + { + "epoch": 0.7, + "learning_rate": 1.0992957345134125e-06, + "loss": 1.1045, + "step": 23191 + }, + { + "epoch": 0.7, + "learning_rate": 1.0990937016865275e-06, + "loss": 1.0834, + "step": 23192 + }, + { + "epoch": 0.7, + "learning_rate": 1.0988916821955967e-06, + "loss": 1.1629, + "step": 23193 + }, + { + "epoch": 0.7, + "learning_rate": 1.0986896760425414e-06, + "loss": 1.2087, + "step": 23194 + }, + { + "epoch": 0.7, + "learning_rate": 1.0984876832292853e-06, + "loss": 1.0912, + "step": 23195 + }, + { + "epoch": 0.7, + "learning_rate": 1.098285703757752e-06, + "loss": 1.1219, + "step": 23196 + }, + { + "epoch": 0.7, + "learning_rate": 1.098083737629864e-06, + "loss": 1.1106, + "step": 23197 + }, + { + "epoch": 0.7, + "learning_rate": 1.097881784847543e-06, + "loss": 1.1434, + "step": 23198 + }, + { + "epoch": 0.7, + "learning_rate": 1.097679845412712e-06, + "loss": 1.1579, + "step": 23199 + }, + { + "epoch": 0.7, + "learning_rate": 1.0974779193272937e-06, + "loss": 1.2173, + "step": 23200 + }, + { + "epoch": 0.7, + "learning_rate": 1.097276006593211e-06, + "loss": 1.1439, + "step": 23201 + }, + { + "epoch": 0.7, + "learning_rate": 1.0970741072123838e-06, + "loss": 1.0787, + "step": 23202 + }, + { + "epoch": 0.7, + "learning_rate": 1.0968722211867358e-06, + "loss": 1.1813, + "step": 23203 + }, + { + "epoch": 0.7, + "learning_rate": 1.0966703485181887e-06, + "loss": 1.0087, + "step": 23204 + }, + { + "epoch": 0.7, + "learning_rate": 1.0964684892086635e-06, + "loss": 1.1247, + "step": 23205 + }, + { + "epoch": 0.7, + "learning_rate": 1.0962666432600836e-06, + "loss": 1.1813, + "step": 23206 + }, + { + "epoch": 0.7, + "learning_rate": 1.0960648106743683e-06, + "loss": 1.1237, + "step": 23207 + }, + { + "epoch": 0.7, + "learning_rate": 1.0958629914534397e-06, + "loss": 1.1188, + "step": 23208 + }, + { + "epoch": 0.7, + "learning_rate": 1.0956611855992191e-06, + "loss": 1.1592, + "step": 23209 + }, + { + "epoch": 0.7, + "learning_rate": 1.0954593931136287e-06, + "loss": 1.0851, + "step": 23210 + }, + { + "epoch": 0.7, + "learning_rate": 1.0952576139985875e-06, + "loss": 1.0436, + "step": 23211 + }, + { + "epoch": 0.7, + "learning_rate": 1.0950558482560172e-06, + "loss": 1.1816, + "step": 23212 + }, + { + "epoch": 0.7, + "learning_rate": 1.0948540958878387e-06, + "loss": 1.221, + "step": 23213 + }, + { + "epoch": 0.7, + "learning_rate": 1.0946523568959724e-06, + "loss": 1.0831, + "step": 23214 + }, + { + "epoch": 0.7, + "learning_rate": 1.0944506312823388e-06, + "loss": 1.1783, + "step": 23215 + }, + { + "epoch": 0.7, + "learning_rate": 1.0942489190488583e-06, + "loss": 1.161, + "step": 23216 + }, + { + "epoch": 0.7, + "learning_rate": 1.0940472201974508e-06, + "loss": 1.145, + "step": 23217 + }, + { + "epoch": 0.7, + "learning_rate": 1.093845534730037e-06, + "loss": 1.056, + "step": 23218 + }, + { + "epoch": 0.7, + "learning_rate": 1.0936438626485374e-06, + "loss": 1.1945, + "step": 23219 + }, + { + "epoch": 0.7, + "learning_rate": 1.0934422039548699e-06, + "loss": 1.0659, + "step": 23220 + }, + { + "epoch": 0.7, + "learning_rate": 1.0932405586509551e-06, + "loss": 1.063, + "step": 23221 + }, + { + "epoch": 0.7, + "learning_rate": 1.0930389267387126e-06, + "loss": 0.9824, + "step": 23222 + }, + { + "epoch": 0.7, + "learning_rate": 1.092837308220063e-06, + "loss": 1.1447, + "step": 23223 + }, + { + "epoch": 0.7, + "learning_rate": 1.0926357030969234e-06, + "loss": 1.1447, + "step": 23224 + }, + { + "epoch": 0.7, + "learning_rate": 1.0924341113712142e-06, + "loss": 1.2352, + "step": 23225 + }, + { + "epoch": 0.7, + "learning_rate": 1.0922325330448545e-06, + "loss": 1.139, + "step": 23226 + }, + { + "epoch": 0.7, + "learning_rate": 1.0920309681197639e-06, + "loss": 1.1517, + "step": 23227 + }, + { + "epoch": 0.7, + "learning_rate": 1.0918294165978594e-06, + "loss": 0.9886, + "step": 23228 + }, + { + "epoch": 0.7, + "learning_rate": 1.0916278784810607e-06, + "loss": 1.0562, + "step": 23229 + }, + { + "epoch": 0.7, + "learning_rate": 1.0914263537712862e-06, + "loss": 1.1584, + "step": 23230 + }, + { + "epoch": 0.7, + "learning_rate": 1.0912248424704543e-06, + "loss": 1.0961, + "step": 23231 + }, + { + "epoch": 0.7, + "learning_rate": 1.0910233445804846e-06, + "loss": 1.075, + "step": 23232 + }, + { + "epoch": 0.7, + "learning_rate": 1.0908218601032932e-06, + "loss": 1.149, + "step": 23233 + }, + { + "epoch": 0.7, + "learning_rate": 1.090620389040799e-06, + "loss": 1.1226, + "step": 23234 + }, + { + "epoch": 0.7, + "learning_rate": 1.09041893139492e-06, + "loss": 1.1697, + "step": 23235 + }, + { + "epoch": 0.7, + "learning_rate": 1.0902174871675744e-06, + "loss": 1.0967, + "step": 23236 + }, + { + "epoch": 0.7, + "learning_rate": 1.0900160563606786e-06, + "loss": 1.1583, + "step": 23237 + }, + { + "epoch": 0.7, + "learning_rate": 1.0898146389761511e-06, + "loss": 1.1682, + "step": 23238 + }, + { + "epoch": 0.7, + "learning_rate": 1.089613235015909e-06, + "loss": 1.0896, + "step": 23239 + }, + { + "epoch": 0.7, + "learning_rate": 1.0894118444818693e-06, + "loss": 1.0851, + "step": 23240 + }, + { + "epoch": 0.7, + "learning_rate": 1.08921046737595e-06, + "loss": 1.1207, + "step": 23241 + }, + { + "epoch": 0.7, + "learning_rate": 1.089009103700068e-06, + "loss": 1.0463, + "step": 23242 + }, + { + "epoch": 0.7, + "learning_rate": 1.0888077534561392e-06, + "loss": 1.1697, + "step": 23243 + }, + { + "epoch": 0.7, + "learning_rate": 1.0886064166460808e-06, + "loss": 1.1617, + "step": 23244 + }, + { + "epoch": 0.7, + "learning_rate": 1.0884050932718097e-06, + "loss": 1.1864, + "step": 23245 + }, + { + "epoch": 0.7, + "learning_rate": 1.0882037833352417e-06, + "loss": 0.985, + "step": 23246 + }, + { + "epoch": 0.7, + "learning_rate": 1.0880024868382944e-06, + "loss": 1.0269, + "step": 23247 + }, + { + "epoch": 0.7, + "learning_rate": 1.0878012037828831e-06, + "loss": 1.175, + "step": 23248 + }, + { + "epoch": 0.7, + "learning_rate": 1.0875999341709253e-06, + "loss": 1.2622, + "step": 23249 + }, + { + "epoch": 0.7, + "learning_rate": 1.087398678004335e-06, + "loss": 1.092, + "step": 23250 + }, + { + "epoch": 0.7, + "learning_rate": 1.0871974352850288e-06, + "loss": 1.0773, + "step": 23251 + }, + { + "epoch": 0.7, + "learning_rate": 1.0869962060149225e-06, + "loss": 1.2125, + "step": 23252 + }, + { + "epoch": 0.7, + "learning_rate": 1.0867949901959326e-06, + "loss": 1.1725, + "step": 23253 + }, + { + "epoch": 0.7, + "learning_rate": 1.0865937878299732e-06, + "loss": 1.2433, + "step": 23254 + }, + { + "epoch": 0.7, + "learning_rate": 1.0863925989189602e-06, + "loss": 1.0915, + "step": 23255 + }, + { + "epoch": 0.7, + "learning_rate": 1.0861914234648085e-06, + "loss": 1.051, + "step": 23256 + }, + { + "epoch": 0.7, + "learning_rate": 1.085990261469434e-06, + "loss": 1.0469, + "step": 23257 + }, + { + "epoch": 0.7, + "learning_rate": 1.0857891129347516e-06, + "loss": 1.093, + "step": 23258 + }, + { + "epoch": 0.7, + "learning_rate": 1.0855879778626753e-06, + "loss": 1.1578, + "step": 23259 + }, + { + "epoch": 0.7, + "learning_rate": 1.0853868562551202e-06, + "loss": 1.1022, + "step": 23260 + }, + { + "epoch": 0.7, + "learning_rate": 1.0851857481140007e-06, + "loss": 1.0418, + "step": 23261 + }, + { + "epoch": 0.7, + "learning_rate": 1.0849846534412323e-06, + "loss": 1.0846, + "step": 23262 + }, + { + "epoch": 0.7, + "learning_rate": 1.0847835722387279e-06, + "loss": 1.0436, + "step": 23263 + }, + { + "epoch": 0.7, + "learning_rate": 1.0845825045084021e-06, + "loss": 1.0697, + "step": 23264 + }, + { + "epoch": 0.7, + "learning_rate": 1.0843814502521693e-06, + "loss": 1.1638, + "step": 23265 + }, + { + "epoch": 0.7, + "learning_rate": 1.084180409471944e-06, + "loss": 1.1063, + "step": 23266 + }, + { + "epoch": 0.7, + "learning_rate": 1.0839793821696388e-06, + "loss": 1.1982, + "step": 23267 + }, + { + "epoch": 0.7, + "learning_rate": 1.0837783683471675e-06, + "loss": 1.1529, + "step": 23268 + }, + { + "epoch": 0.7, + "learning_rate": 1.0835773680064444e-06, + "loss": 1.075, + "step": 23269 + }, + { + "epoch": 0.7, + "learning_rate": 1.0833763811493822e-06, + "loss": 0.9865, + "step": 23270 + }, + { + "epoch": 0.7, + "learning_rate": 1.0831754077778946e-06, + "loss": 1.0597, + "step": 23271 + }, + { + "epoch": 0.7, + "learning_rate": 1.082974447893895e-06, + "loss": 0.9672, + "step": 23272 + }, + { + "epoch": 0.7, + "learning_rate": 1.0827735014992962e-06, + "loss": 1.144, + "step": 23273 + }, + { + "epoch": 0.7, + "learning_rate": 1.0825725685960112e-06, + "loss": 1.1439, + "step": 23274 + }, + { + "epoch": 0.7, + "learning_rate": 1.0823716491859533e-06, + "loss": 1.1697, + "step": 23275 + }, + { + "epoch": 0.7, + "learning_rate": 1.0821707432710339e-06, + "loss": 1.1501, + "step": 23276 + }, + { + "epoch": 0.7, + "learning_rate": 1.081969850853166e-06, + "loss": 1.0356, + "step": 23277 + }, + { + "epoch": 0.7, + "learning_rate": 1.0817689719342623e-06, + "loss": 1.1794, + "step": 23278 + }, + { + "epoch": 0.7, + "learning_rate": 1.0815681065162355e-06, + "loss": 1.1574, + "step": 23279 + }, + { + "epoch": 0.7, + "learning_rate": 1.0813672546009967e-06, + "loss": 1.1833, + "step": 23280 + }, + { + "epoch": 0.7, + "learning_rate": 1.0811664161904584e-06, + "loss": 1.0623, + "step": 23281 + }, + { + "epoch": 0.7, + "learning_rate": 1.080965591286532e-06, + "loss": 1.122, + "step": 23282 + }, + { + "epoch": 0.7, + "learning_rate": 1.0807647798911302e-06, + "loss": 1.121, + "step": 23283 + }, + { + "epoch": 0.7, + "learning_rate": 1.080563982006165e-06, + "loss": 1.1375, + "step": 23284 + }, + { + "epoch": 0.7, + "learning_rate": 1.080363197633546e-06, + "loss": 1.0851, + "step": 23285 + }, + { + "epoch": 0.7, + "learning_rate": 1.0801624267751858e-06, + "loss": 1.1438, + "step": 23286 + }, + { + "epoch": 0.7, + "learning_rate": 1.0799616694329954e-06, + "loss": 0.9787, + "step": 23287 + }, + { + "epoch": 0.7, + "learning_rate": 1.079760925608887e-06, + "loss": 1.1509, + "step": 23288 + }, + { + "epoch": 0.7, + "learning_rate": 1.0795601953047696e-06, + "loss": 1.074, + "step": 23289 + }, + { + "epoch": 0.7, + "learning_rate": 1.079359478522555e-06, + "loss": 1.0218, + "step": 23290 + }, + { + "epoch": 0.7, + "learning_rate": 1.079158775264154e-06, + "loss": 1.1589, + "step": 23291 + }, + { + "epoch": 0.7, + "learning_rate": 1.0789580855314779e-06, + "loss": 1.1074, + "step": 23292 + }, + { + "epoch": 0.7, + "learning_rate": 1.0787574093264358e-06, + "loss": 1.1411, + "step": 23293 + }, + { + "epoch": 0.7, + "learning_rate": 1.0785567466509386e-06, + "loss": 1.0684, + "step": 23294 + }, + { + "epoch": 0.7, + "learning_rate": 1.0783560975068965e-06, + "loss": 1.1047, + "step": 23295 + }, + { + "epoch": 0.7, + "learning_rate": 1.0781554618962197e-06, + "loss": 1.0259, + "step": 23296 + }, + { + "epoch": 0.7, + "learning_rate": 1.0779548398208182e-06, + "loss": 1.035, + "step": 23297 + }, + { + "epoch": 0.7, + "learning_rate": 1.0777542312826017e-06, + "loss": 1.0641, + "step": 23298 + }, + { + "epoch": 0.7, + "learning_rate": 1.07755363628348e-06, + "loss": 1.163, + "step": 23299 + }, + { + "epoch": 0.7, + "learning_rate": 1.0773530548253623e-06, + "loss": 1.1041, + "step": 23300 + }, + { + "epoch": 0.7, + "learning_rate": 1.0771524869101594e-06, + "loss": 0.9713, + "step": 23301 + }, + { + "epoch": 0.7, + "learning_rate": 1.0769519325397787e-06, + "loss": 1.0789, + "step": 23302 + }, + { + "epoch": 0.7, + "learning_rate": 1.0767513917161303e-06, + "loss": 1.1328, + "step": 23303 + }, + { + "epoch": 0.7, + "learning_rate": 1.0765508644411232e-06, + "loss": 1.0689, + "step": 23304 + }, + { + "epoch": 0.7, + "learning_rate": 1.076350350716667e-06, + "loss": 1.1428, + "step": 23305 + }, + { + "epoch": 0.7, + "learning_rate": 1.076149850544669e-06, + "loss": 1.1218, + "step": 23306 + }, + { + "epoch": 0.7, + "learning_rate": 1.0759493639270388e-06, + "loss": 1.0497, + "step": 23307 + }, + { + "epoch": 0.7, + "learning_rate": 1.0757488908656849e-06, + "loss": 1.1609, + "step": 23308 + }, + { + "epoch": 0.7, + "learning_rate": 1.0755484313625152e-06, + "loss": 1.1219, + "step": 23309 + }, + { + "epoch": 0.7, + "learning_rate": 1.07534798541944e-06, + "loss": 1.1343, + "step": 23310 + }, + { + "epoch": 0.7, + "learning_rate": 1.0751475530383644e-06, + "loss": 1.1818, + "step": 23311 + }, + { + "epoch": 0.7, + "learning_rate": 1.0749471342211977e-06, + "loss": 1.1133, + "step": 23312 + }, + { + "epoch": 0.7, + "learning_rate": 1.0747467289698484e-06, + "loss": 0.9638, + "step": 23313 + }, + { + "epoch": 0.7, + "learning_rate": 1.0745463372862244e-06, + "loss": 1.1371, + "step": 23314 + }, + { + "epoch": 0.7, + "learning_rate": 1.074345959172232e-06, + "loss": 1.1194, + "step": 23315 + }, + { + "epoch": 0.7, + "learning_rate": 1.0741455946297796e-06, + "loss": 1.1097, + "step": 23316 + }, + { + "epoch": 0.7, + "learning_rate": 1.0739452436607741e-06, + "loss": 1.0234, + "step": 23317 + }, + { + "epoch": 0.7, + "learning_rate": 1.0737449062671244e-06, + "loss": 1.1505, + "step": 23318 + }, + { + "epoch": 0.7, + "learning_rate": 1.073544582450735e-06, + "loss": 1.079, + "step": 23319 + }, + { + "epoch": 0.7, + "learning_rate": 1.0733442722135144e-06, + "loss": 1.0415, + "step": 23320 + }, + { + "epoch": 0.7, + "learning_rate": 1.073143975557369e-06, + "loss": 1.0857, + "step": 23321 + }, + { + "epoch": 0.7, + "learning_rate": 1.0729436924842058e-06, + "loss": 1.0425, + "step": 23322 + }, + { + "epoch": 0.7, + "learning_rate": 1.0727434229959313e-06, + "loss": 1.1305, + "step": 23323 + }, + { + "epoch": 0.7, + "learning_rate": 1.072543167094453e-06, + "loss": 1.2446, + "step": 23324 + }, + { + "epoch": 0.7, + "learning_rate": 1.0723429247816754e-06, + "loss": 1.0834, + "step": 23325 + }, + { + "epoch": 0.7, + "learning_rate": 1.0721426960595057e-06, + "loss": 1.085, + "step": 23326 + }, + { + "epoch": 0.7, + "learning_rate": 1.0719424809298495e-06, + "loss": 1.0314, + "step": 23327 + }, + { + "epoch": 0.7, + "learning_rate": 1.0717422793946136e-06, + "loss": 1.0579, + "step": 23328 + }, + { + "epoch": 0.7, + "learning_rate": 1.0715420914557028e-06, + "loss": 1.0589, + "step": 23329 + }, + { + "epoch": 0.7, + "learning_rate": 1.0713419171150238e-06, + "loss": 1.142, + "step": 23330 + }, + { + "epoch": 0.7, + "learning_rate": 1.0711417563744822e-06, + "loss": 1.0801, + "step": 23331 + }, + { + "epoch": 0.7, + "learning_rate": 1.0709416092359824e-06, + "loss": 1.1315, + "step": 23332 + }, + { + "epoch": 0.7, + "learning_rate": 1.0707414757014299e-06, + "loss": 1.1127, + "step": 23333 + }, + { + "epoch": 0.7, + "learning_rate": 1.0705413557727303e-06, + "loss": 1.0547, + "step": 23334 + }, + { + "epoch": 0.7, + "learning_rate": 1.0703412494517885e-06, + "loss": 1.1158, + "step": 23335 + }, + { + "epoch": 0.7, + "learning_rate": 1.0701411567405104e-06, + "loss": 1.182, + "step": 23336 + }, + { + "epoch": 0.7, + "learning_rate": 1.069941077640799e-06, + "loss": 1.2079, + "step": 23337 + }, + { + "epoch": 0.7, + "learning_rate": 1.0697410121545596e-06, + "loss": 0.9655, + "step": 23338 + }, + { + "epoch": 0.7, + "learning_rate": 1.069540960283697e-06, + "loss": 1.1065, + "step": 23339 + }, + { + "epoch": 0.7, + "learning_rate": 1.0693409220301168e-06, + "loss": 1.1406, + "step": 23340 + }, + { + "epoch": 0.7, + "learning_rate": 1.0691408973957207e-06, + "loss": 1.1609, + "step": 23341 + }, + { + "epoch": 0.7, + "learning_rate": 1.0689408863824141e-06, + "loss": 1.0563, + "step": 23342 + }, + { + "epoch": 0.7, + "learning_rate": 1.068740888992101e-06, + "loss": 1.2198, + "step": 23343 + }, + { + "epoch": 0.7, + "learning_rate": 1.0685409052266866e-06, + "loss": 1.1319, + "step": 23344 + }, + { + "epoch": 0.7, + "learning_rate": 1.068340935088072e-06, + "loss": 1.0779, + "step": 23345 + }, + { + "epoch": 0.7, + "learning_rate": 1.0681409785781626e-06, + "loss": 1.0462, + "step": 23346 + }, + { + "epoch": 0.7, + "learning_rate": 1.0679410356988615e-06, + "loss": 1.0656, + "step": 23347 + }, + { + "epoch": 0.7, + "learning_rate": 1.0677411064520719e-06, + "loss": 1.1127, + "step": 23348 + }, + { + "epoch": 0.7, + "learning_rate": 1.067541190839698e-06, + "loss": 1.0733, + "step": 23349 + }, + { + "epoch": 0.7, + "learning_rate": 1.0673412888636411e-06, + "loss": 1.1926, + "step": 23350 + }, + { + "epoch": 0.7, + "learning_rate": 1.0671414005258052e-06, + "loss": 1.1609, + "step": 23351 + }, + { + "epoch": 0.7, + "learning_rate": 1.066941525828093e-06, + "loss": 1.1594, + "step": 23352 + }, + { + "epoch": 0.7, + "learning_rate": 1.0667416647724075e-06, + "loss": 1.0285, + "step": 23353 + }, + { + "epoch": 0.7, + "learning_rate": 1.066541817360651e-06, + "loss": 1.1921, + "step": 23354 + }, + { + "epoch": 0.7, + "learning_rate": 1.0663419835947258e-06, + "loss": 1.1053, + "step": 23355 + }, + { + "epoch": 0.7, + "learning_rate": 1.0661421634765348e-06, + "loss": 1.3097, + "step": 23356 + }, + { + "epoch": 0.7, + "learning_rate": 1.0659423570079806e-06, + "loss": 1.2325, + "step": 23357 + }, + { + "epoch": 0.7, + "learning_rate": 1.0657425641909636e-06, + "loss": 1.0502, + "step": 23358 + }, + { + "epoch": 0.7, + "learning_rate": 1.0655427850273864e-06, + "loss": 1.0055, + "step": 23359 + }, + { + "epoch": 0.7, + "learning_rate": 1.065343019519151e-06, + "loss": 1.1514, + "step": 23360 + }, + { + "epoch": 0.7, + "learning_rate": 1.0651432676681605e-06, + "loss": 1.0567, + "step": 23361 + }, + { + "epoch": 0.7, + "learning_rate": 1.064943529476314e-06, + "loss": 1.1303, + "step": 23362 + }, + { + "epoch": 0.7, + "learning_rate": 1.0647438049455137e-06, + "loss": 1.1095, + "step": 23363 + }, + { + "epoch": 0.7, + "learning_rate": 1.064544094077661e-06, + "loss": 1.0092, + "step": 23364 + }, + { + "epoch": 0.7, + "learning_rate": 1.0643443968746575e-06, + "loss": 1.1025, + "step": 23365 + }, + { + "epoch": 0.7, + "learning_rate": 1.0641447133384047e-06, + "loss": 1.1228, + "step": 23366 + }, + { + "epoch": 0.7, + "learning_rate": 1.0639450434708018e-06, + "loss": 1.0981, + "step": 23367 + }, + { + "epoch": 0.7, + "learning_rate": 1.0637453872737505e-06, + "loss": 1.1781, + "step": 23368 + }, + { + "epoch": 0.7, + "learning_rate": 1.0635457447491515e-06, + "loss": 1.0623, + "step": 23369 + }, + { + "epoch": 0.7, + "learning_rate": 1.0633461158989058e-06, + "loss": 1.0364, + "step": 23370 + }, + { + "epoch": 0.7, + "learning_rate": 1.0631465007249126e-06, + "loss": 1.1947, + "step": 23371 + }, + { + "epoch": 0.7, + "learning_rate": 1.0629468992290726e-06, + "loss": 1.084, + "step": 23372 + }, + { + "epoch": 0.7, + "learning_rate": 1.0627473114132858e-06, + "loss": 1.2218, + "step": 23373 + }, + { + "epoch": 0.7, + "learning_rate": 1.0625477372794536e-06, + "loss": 1.1915, + "step": 23374 + }, + { + "epoch": 0.7, + "learning_rate": 1.0623481768294734e-06, + "loss": 1.1951, + "step": 23375 + }, + { + "epoch": 0.7, + "learning_rate": 1.0621486300652465e-06, + "loss": 1.1279, + "step": 23376 + }, + { + "epoch": 0.7, + "learning_rate": 1.0619490969886716e-06, + "loss": 1.0981, + "step": 23377 + }, + { + "epoch": 0.7, + "learning_rate": 1.0617495776016493e-06, + "loss": 1.0385, + "step": 23378 + }, + { + "epoch": 0.7, + "learning_rate": 1.061550071906078e-06, + "loss": 1.0572, + "step": 23379 + }, + { + "epoch": 0.7, + "learning_rate": 1.0613505799038573e-06, + "loss": 1.142, + "step": 23380 + }, + { + "epoch": 0.7, + "learning_rate": 1.0611511015968864e-06, + "loss": 1.1304, + "step": 23381 + }, + { + "epoch": 0.7, + "learning_rate": 1.060951636987064e-06, + "loss": 1.0731, + "step": 23382 + }, + { + "epoch": 0.7, + "learning_rate": 1.0607521860762896e-06, + "loss": 1.0798, + "step": 23383 + }, + { + "epoch": 0.7, + "learning_rate": 1.0605527488664605e-06, + "loss": 1.0499, + "step": 23384 + }, + { + "epoch": 0.7, + "learning_rate": 1.0603533253594757e-06, + "loss": 1.1272, + "step": 23385 + }, + { + "epoch": 0.7, + "learning_rate": 1.0601539155572344e-06, + "loss": 1.0792, + "step": 23386 + }, + { + "epoch": 0.7, + "learning_rate": 1.0599545194616347e-06, + "loss": 1.1152, + "step": 23387 + }, + { + "epoch": 0.7, + "learning_rate": 1.059755137074574e-06, + "loss": 1.2581, + "step": 23388 + }, + { + "epoch": 0.7, + "learning_rate": 1.0595557683979505e-06, + "loss": 1.1027, + "step": 23389 + }, + { + "epoch": 0.7, + "learning_rate": 1.0593564134336626e-06, + "loss": 0.9985, + "step": 23390 + }, + { + "epoch": 0.7, + "learning_rate": 1.0591570721836076e-06, + "loss": 1.0909, + "step": 23391 + }, + { + "epoch": 0.7, + "learning_rate": 1.058957744649684e-06, + "loss": 1.0554, + "step": 23392 + }, + { + "epoch": 0.7, + "learning_rate": 1.058758430833788e-06, + "loss": 1.2074, + "step": 23393 + }, + { + "epoch": 0.7, + "learning_rate": 1.0585591307378177e-06, + "loss": 1.0688, + "step": 23394 + }, + { + "epoch": 0.7, + "learning_rate": 1.0583598443636703e-06, + "loss": 1.1241, + "step": 23395 + }, + { + "epoch": 0.7, + "learning_rate": 1.0581605717132434e-06, + "loss": 1.1271, + "step": 23396 + }, + { + "epoch": 0.7, + "learning_rate": 1.0579613127884328e-06, + "loss": 1.09, + "step": 23397 + }, + { + "epoch": 0.7, + "learning_rate": 1.057762067591136e-06, + "loss": 1.0529, + "step": 23398 + }, + { + "epoch": 0.7, + "learning_rate": 1.0575628361232496e-06, + "loss": 1.2007, + "step": 23399 + }, + { + "epoch": 0.7, + "learning_rate": 1.0573636183866714e-06, + "loss": 1.0645, + "step": 23400 + }, + { + "epoch": 0.7, + "learning_rate": 1.0571644143832956e-06, + "loss": 1.1383, + "step": 23401 + }, + { + "epoch": 0.7, + "learning_rate": 1.05696522411502e-06, + "loss": 1.0056, + "step": 23402 + }, + { + "epoch": 0.71, + "learning_rate": 1.0567660475837401e-06, + "loss": 1.0992, + "step": 23403 + }, + { + "epoch": 0.71, + "learning_rate": 1.0565668847913527e-06, + "loss": 1.1415, + "step": 23404 + }, + { + "epoch": 0.71, + "learning_rate": 1.0563677357397532e-06, + "loss": 1.1946, + "step": 23405 + }, + { + "epoch": 0.71, + "learning_rate": 1.0561686004308384e-06, + "loss": 1.2043, + "step": 23406 + }, + { + "epoch": 0.71, + "learning_rate": 1.0559694788665024e-06, + "loss": 1.1409, + "step": 23407 + }, + { + "epoch": 0.71, + "learning_rate": 1.0557703710486414e-06, + "loss": 1.15, + "step": 23408 + }, + { + "epoch": 0.71, + "learning_rate": 1.055571276979151e-06, + "loss": 1.1855, + "step": 23409 + }, + { + "epoch": 0.71, + "learning_rate": 1.0553721966599262e-06, + "loss": 1.0435, + "step": 23410 + }, + { + "epoch": 0.71, + "learning_rate": 1.0551731300928626e-06, + "loss": 1.1065, + "step": 23411 + }, + { + "epoch": 0.71, + "learning_rate": 1.0549740772798545e-06, + "loss": 1.1057, + "step": 23412 + }, + { + "epoch": 0.71, + "learning_rate": 1.0547750382227984e-06, + "loss": 1.2678, + "step": 23413 + }, + { + "epoch": 0.71, + "learning_rate": 1.0545760129235872e-06, + "loss": 1.1301, + "step": 23414 + }, + { + "epoch": 0.71, + "learning_rate": 1.054377001384116e-06, + "loss": 1.1827, + "step": 23415 + }, + { + "epoch": 0.71, + "learning_rate": 1.0541780036062792e-06, + "loss": 1.1328, + "step": 23416 + }, + { + "epoch": 0.71, + "learning_rate": 1.0539790195919723e-06, + "loss": 1.0148, + "step": 23417 + }, + { + "epoch": 0.71, + "learning_rate": 1.053780049343089e-06, + "loss": 1.1999, + "step": 23418 + }, + { + "epoch": 0.71, + "learning_rate": 1.0535810928615223e-06, + "loss": 1.1912, + "step": 23419 + }, + { + "epoch": 0.71, + "learning_rate": 1.053382150149167e-06, + "loss": 1.1136, + "step": 23420 + }, + { + "epoch": 0.71, + "learning_rate": 1.0531832212079169e-06, + "loss": 1.0878, + "step": 23421 + }, + { + "epoch": 0.71, + "learning_rate": 1.0529843060396667e-06, + "loss": 1.1458, + "step": 23422 + }, + { + "epoch": 0.71, + "learning_rate": 1.0527854046463078e-06, + "loss": 1.0258, + "step": 23423 + }, + { + "epoch": 0.71, + "learning_rate": 1.0525865170297353e-06, + "loss": 1.0298, + "step": 23424 + }, + { + "epoch": 0.71, + "learning_rate": 1.0523876431918418e-06, + "loss": 1.1337, + "step": 23425 + }, + { + "epoch": 0.71, + "learning_rate": 1.0521887831345217e-06, + "loss": 1.239, + "step": 23426 + }, + { + "epoch": 0.71, + "learning_rate": 1.0519899368596662e-06, + "loss": 1.0947, + "step": 23427 + }, + { + "epoch": 0.71, + "learning_rate": 1.0517911043691689e-06, + "loss": 1.1742, + "step": 23428 + }, + { + "epoch": 0.71, + "learning_rate": 1.051592285664923e-06, + "loss": 1.1415, + "step": 23429 + }, + { + "epoch": 0.71, + "learning_rate": 1.051393480748821e-06, + "loss": 1.1246, + "step": 23430 + }, + { + "epoch": 0.71, + "learning_rate": 1.0511946896227563e-06, + "loss": 1.1547, + "step": 23431 + }, + { + "epoch": 0.71, + "learning_rate": 1.0509959122886197e-06, + "loss": 1.0674, + "step": 23432 + }, + { + "epoch": 0.71, + "learning_rate": 1.0507971487483038e-06, + "loss": 1.0419, + "step": 23433 + }, + { + "epoch": 0.71, + "learning_rate": 1.050598399003701e-06, + "loss": 1.0256, + "step": 23434 + }, + { + "epoch": 0.71, + "learning_rate": 1.0503996630567036e-06, + "loss": 1.1, + "step": 23435 + }, + { + "epoch": 0.71, + "learning_rate": 1.0502009409092032e-06, + "loss": 1.1637, + "step": 23436 + }, + { + "epoch": 0.71, + "learning_rate": 1.0500022325630918e-06, + "loss": 1.1584, + "step": 23437 + }, + { + "epoch": 0.71, + "learning_rate": 1.0498035380202606e-06, + "loss": 1.1539, + "step": 23438 + }, + { + "epoch": 0.71, + "learning_rate": 1.049604857282602e-06, + "loss": 1.0374, + "step": 23439 + }, + { + "epoch": 0.71, + "learning_rate": 1.0494061903520062e-06, + "loss": 1.0859, + "step": 23440 + }, + { + "epoch": 0.71, + "learning_rate": 1.0492075372303646e-06, + "loss": 1.052, + "step": 23441 + }, + { + "epoch": 0.71, + "learning_rate": 1.0490088979195684e-06, + "loss": 1.2067, + "step": 23442 + }, + { + "epoch": 0.71, + "learning_rate": 1.0488102724215086e-06, + "loss": 1.0821, + "step": 23443 + }, + { + "epoch": 0.71, + "learning_rate": 1.0486116607380771e-06, + "loss": 1.1718, + "step": 23444 + }, + { + "epoch": 0.71, + "learning_rate": 1.0484130628711627e-06, + "loss": 1.1365, + "step": 23445 + }, + { + "epoch": 0.71, + "learning_rate": 1.048214478822657e-06, + "loss": 1.1672, + "step": 23446 + }, + { + "epoch": 0.71, + "learning_rate": 1.04801590859445e-06, + "loss": 1.122, + "step": 23447 + }, + { + "epoch": 0.71, + "learning_rate": 1.0478173521884333e-06, + "loss": 1.09, + "step": 23448 + }, + { + "epoch": 0.71, + "learning_rate": 1.0476188096064952e-06, + "loss": 1.1216, + "step": 23449 + }, + { + "epoch": 0.71, + "learning_rate": 1.0474202808505263e-06, + "loss": 1.1671, + "step": 23450 + }, + { + "epoch": 0.71, + "learning_rate": 1.0472217659224167e-06, + "loss": 0.9888, + "step": 23451 + }, + { + "epoch": 0.71, + "learning_rate": 1.0470232648240574e-06, + "loss": 1.0866, + "step": 23452 + }, + { + "epoch": 0.71, + "learning_rate": 1.0468247775573359e-06, + "loss": 1.1267, + "step": 23453 + }, + { + "epoch": 0.71, + "learning_rate": 1.0466263041241426e-06, + "loss": 1.0219, + "step": 23454 + }, + { + "epoch": 0.71, + "learning_rate": 1.0464278445263667e-06, + "loss": 1.1815, + "step": 23455 + }, + { + "epoch": 0.71, + "learning_rate": 1.0462293987658977e-06, + "loss": 1.0685, + "step": 23456 + }, + { + "epoch": 0.71, + "learning_rate": 1.0460309668446258e-06, + "loss": 1.077, + "step": 23457 + }, + { + "epoch": 0.71, + "learning_rate": 1.0458325487644378e-06, + "loss": 1.0848, + "step": 23458 + }, + { + "epoch": 0.71, + "learning_rate": 1.0456341445272236e-06, + "loss": 1.0789, + "step": 23459 + }, + { + "epoch": 0.71, + "learning_rate": 1.045435754134872e-06, + "loss": 1.1421, + "step": 23460 + }, + { + "epoch": 0.71, + "learning_rate": 1.0452373775892712e-06, + "loss": 1.2532, + "step": 23461 + }, + { + "epoch": 0.71, + "learning_rate": 1.0450390148923103e-06, + "loss": 1.0635, + "step": 23462 + }, + { + "epoch": 0.71, + "learning_rate": 1.044840666045877e-06, + "loss": 1.0537, + "step": 23463 + }, + { + "epoch": 0.71, + "learning_rate": 1.0446423310518596e-06, + "loss": 1.1188, + "step": 23464 + }, + { + "epoch": 0.71, + "learning_rate": 1.0444440099121475e-06, + "loss": 1.1512, + "step": 23465 + }, + { + "epoch": 0.71, + "learning_rate": 1.0442457026286264e-06, + "loss": 1.1042, + "step": 23466 + }, + { + "epoch": 0.71, + "learning_rate": 1.0440474092031852e-06, + "loss": 1.1791, + "step": 23467 + }, + { + "epoch": 0.71, + "learning_rate": 1.0438491296377113e-06, + "loss": 1.0431, + "step": 23468 + }, + { + "epoch": 0.71, + "learning_rate": 1.0436508639340923e-06, + "loss": 1.1453, + "step": 23469 + }, + { + "epoch": 0.71, + "learning_rate": 1.0434526120942168e-06, + "loss": 1.1777, + "step": 23470 + }, + { + "epoch": 0.71, + "learning_rate": 1.0432543741199698e-06, + "loss": 1.0029, + "step": 23471 + }, + { + "epoch": 0.71, + "learning_rate": 1.0430561500132397e-06, + "loss": 1.1893, + "step": 23472 + }, + { + "epoch": 0.71, + "learning_rate": 1.0428579397759133e-06, + "loss": 1.0161, + "step": 23473 + }, + { + "epoch": 0.71, + "learning_rate": 1.0426597434098784e-06, + "loss": 1.1451, + "step": 23474 + }, + { + "epoch": 0.71, + "learning_rate": 1.0424615609170202e-06, + "loss": 1.0479, + "step": 23475 + }, + { + "epoch": 0.71, + "learning_rate": 1.0422633922992255e-06, + "loss": 1.1328, + "step": 23476 + }, + { + "epoch": 0.71, + "learning_rate": 1.0420652375583816e-06, + "loss": 1.0363, + "step": 23477 + }, + { + "epoch": 0.71, + "learning_rate": 1.0418670966963756e-06, + "loss": 1.0656, + "step": 23478 + }, + { + "epoch": 0.71, + "learning_rate": 1.0416689697150914e-06, + "loss": 1.0886, + "step": 23479 + }, + { + "epoch": 0.71, + "learning_rate": 1.0414708566164162e-06, + "loss": 1.0592, + "step": 23480 + }, + { + "epoch": 0.71, + "learning_rate": 1.041272757402236e-06, + "loss": 1.1847, + "step": 23481 + }, + { + "epoch": 0.71, + "learning_rate": 1.0410746720744367e-06, + "loss": 1.0926, + "step": 23482 + }, + { + "epoch": 0.71, + "learning_rate": 1.0408766006349047e-06, + "loss": 1.1165, + "step": 23483 + }, + { + "epoch": 0.71, + "learning_rate": 1.0406785430855237e-06, + "loss": 1.0848, + "step": 23484 + }, + { + "epoch": 0.71, + "learning_rate": 1.0404804994281804e-06, + "loss": 1.0798, + "step": 23485 + }, + { + "epoch": 0.71, + "learning_rate": 1.0402824696647596e-06, + "loss": 1.1263, + "step": 23486 + }, + { + "epoch": 0.71, + "learning_rate": 1.040084453797147e-06, + "loss": 0.9749, + "step": 23487 + }, + { + "epoch": 0.71, + "learning_rate": 1.0398864518272266e-06, + "loss": 1.0593, + "step": 23488 + }, + { + "epoch": 0.71, + "learning_rate": 1.0396884637568855e-06, + "loss": 1.2388, + "step": 23489 + }, + { + "epoch": 0.71, + "learning_rate": 1.039490489588006e-06, + "loss": 1.0173, + "step": 23490 + }, + { + "epoch": 0.71, + "learning_rate": 1.0392925293224731e-06, + "loss": 1.0393, + "step": 23491 + }, + { + "epoch": 0.71, + "learning_rate": 1.0390945829621724e-06, + "loss": 1.1631, + "step": 23492 + }, + { + "epoch": 0.71, + "learning_rate": 1.0388966505089872e-06, + "loss": 1.1199, + "step": 23493 + }, + { + "epoch": 0.71, + "learning_rate": 1.0386987319648026e-06, + "loss": 0.9772, + "step": 23494 + }, + { + "epoch": 0.71, + "learning_rate": 1.0385008273315022e-06, + "loss": 1.059, + "step": 23495 + }, + { + "epoch": 0.71, + "learning_rate": 1.038302936610971e-06, + "loss": 1.0353, + "step": 23496 + }, + { + "epoch": 0.71, + "learning_rate": 1.0381050598050907e-06, + "loss": 1.1812, + "step": 23497 + }, + { + "epoch": 0.71, + "learning_rate": 1.037907196915746e-06, + "loss": 1.1795, + "step": 23498 + }, + { + "epoch": 0.71, + "learning_rate": 1.0377093479448212e-06, + "loss": 1.095, + "step": 23499 + }, + { + "epoch": 0.71, + "learning_rate": 1.0375115128941998e-06, + "loss": 1.1221, + "step": 23500 + }, + { + "epoch": 0.71, + "learning_rate": 1.0373136917657633e-06, + "loss": 0.9778, + "step": 23501 + }, + { + "epoch": 0.71, + "learning_rate": 1.0371158845613963e-06, + "loss": 1.0742, + "step": 23502 + }, + { + "epoch": 0.71, + "learning_rate": 1.0369180912829815e-06, + "loss": 1.0689, + "step": 23503 + }, + { + "epoch": 0.71, + "learning_rate": 1.0367203119324027e-06, + "loss": 1.0995, + "step": 23504 + }, + { + "epoch": 0.71, + "learning_rate": 1.0365225465115408e-06, + "loss": 1.0917, + "step": 23505 + }, + { + "epoch": 0.71, + "learning_rate": 1.0363247950222793e-06, + "loss": 1.1385, + "step": 23506 + }, + { + "epoch": 0.71, + "learning_rate": 1.0361270574665012e-06, + "loss": 0.9894, + "step": 23507 + }, + { + "epoch": 0.71, + "learning_rate": 1.0359293338460882e-06, + "loss": 1.0681, + "step": 23508 + }, + { + "epoch": 0.71, + "learning_rate": 1.0357316241629236e-06, + "loss": 1.0623, + "step": 23509 + }, + { + "epoch": 0.71, + "learning_rate": 1.0355339284188882e-06, + "loss": 1.1713, + "step": 23510 + }, + { + "epoch": 0.71, + "learning_rate": 1.0353362466158641e-06, + "loss": 1.0629, + "step": 23511 + }, + { + "epoch": 0.71, + "learning_rate": 1.0351385787557338e-06, + "loss": 1.1627, + "step": 23512 + }, + { + "epoch": 0.71, + "learning_rate": 1.0349409248403798e-06, + "loss": 1.1127, + "step": 23513 + }, + { + "epoch": 0.71, + "learning_rate": 1.0347432848716813e-06, + "loss": 1.2274, + "step": 23514 + }, + { + "epoch": 0.71, + "learning_rate": 1.0345456588515212e-06, + "loss": 0.9919, + "step": 23515 + }, + { + "epoch": 0.71, + "learning_rate": 1.0343480467817807e-06, + "loss": 1.1545, + "step": 23516 + }, + { + "epoch": 0.71, + "learning_rate": 1.0341504486643409e-06, + "loss": 1.0677, + "step": 23517 + }, + { + "epoch": 0.71, + "learning_rate": 1.0339528645010828e-06, + "loss": 1.0381, + "step": 23518 + }, + { + "epoch": 0.71, + "learning_rate": 1.0337552942938872e-06, + "loss": 1.1685, + "step": 23519 + }, + { + "epoch": 0.71, + "learning_rate": 1.0335577380446352e-06, + "loss": 1.0829, + "step": 23520 + }, + { + "epoch": 0.71, + "learning_rate": 1.0333601957552072e-06, + "loss": 1.03, + "step": 23521 + }, + { + "epoch": 0.71, + "learning_rate": 1.0331626674274847e-06, + "loss": 1.0574, + "step": 23522 + }, + { + "epoch": 0.71, + "learning_rate": 1.0329651530633464e-06, + "loss": 1.1439, + "step": 23523 + }, + { + "epoch": 0.71, + "learning_rate": 1.0327676526646732e-06, + "loss": 0.999, + "step": 23524 + }, + { + "epoch": 0.71, + "learning_rate": 1.0325701662333451e-06, + "loss": 1.0104, + "step": 23525 + }, + { + "epoch": 0.71, + "learning_rate": 1.0323726937712436e-06, + "loss": 1.0654, + "step": 23526 + }, + { + "epoch": 0.71, + "learning_rate": 1.032175235280246e-06, + "loss": 1.0747, + "step": 23527 + }, + { + "epoch": 0.71, + "learning_rate": 1.0319777907622332e-06, + "loss": 1.1288, + "step": 23528 + }, + { + "epoch": 0.71, + "learning_rate": 1.0317803602190852e-06, + "loss": 1.0201, + "step": 23529 + }, + { + "epoch": 0.71, + "learning_rate": 1.0315829436526815e-06, + "loss": 1.1627, + "step": 23530 + }, + { + "epoch": 0.71, + "learning_rate": 1.0313855410649e-06, + "loss": 1.0585, + "step": 23531 + }, + { + "epoch": 0.71, + "learning_rate": 1.0311881524576214e-06, + "loss": 1.1069, + "step": 23532 + }, + { + "epoch": 0.71, + "learning_rate": 1.0309907778327239e-06, + "loss": 1.1361, + "step": 23533 + }, + { + "epoch": 0.71, + "learning_rate": 1.0307934171920866e-06, + "loss": 1.0051, + "step": 23534 + }, + { + "epoch": 0.71, + "learning_rate": 1.0305960705375892e-06, + "loss": 1.107, + "step": 23535 + }, + { + "epoch": 0.71, + "learning_rate": 1.0303987378711089e-06, + "loss": 1.1726, + "step": 23536 + }, + { + "epoch": 0.71, + "learning_rate": 1.0302014191945246e-06, + "loss": 1.1594, + "step": 23537 + }, + { + "epoch": 0.71, + "learning_rate": 1.030004114509715e-06, + "loss": 1.069, + "step": 23538 + }, + { + "epoch": 0.71, + "learning_rate": 1.029806823818559e-06, + "loss": 1.1646, + "step": 23539 + }, + { + "epoch": 0.71, + "learning_rate": 1.0296095471229333e-06, + "loss": 1.1015, + "step": 23540 + }, + { + "epoch": 0.71, + "learning_rate": 1.0294122844247164e-06, + "loss": 1.0965, + "step": 23541 + }, + { + "epoch": 0.71, + "learning_rate": 1.0292150357257866e-06, + "loss": 1.1506, + "step": 23542 + }, + { + "epoch": 0.71, + "learning_rate": 1.029017801028021e-06, + "loss": 1.2209, + "step": 23543 + }, + { + "epoch": 0.71, + "learning_rate": 1.0288205803332976e-06, + "loss": 1.1109, + "step": 23544 + }, + { + "epoch": 0.71, + "learning_rate": 1.0286233736434936e-06, + "loss": 1.1701, + "step": 23545 + }, + { + "epoch": 0.71, + "learning_rate": 1.0284261809604865e-06, + "loss": 1.0919, + "step": 23546 + }, + { + "epoch": 0.71, + "learning_rate": 1.0282290022861543e-06, + "loss": 1.082, + "step": 23547 + }, + { + "epoch": 0.71, + "learning_rate": 1.0280318376223724e-06, + "loss": 1.2153, + "step": 23548 + }, + { + "epoch": 0.71, + "learning_rate": 1.0278346869710184e-06, + "loss": 1.1623, + "step": 23549 + }, + { + "epoch": 0.71, + "learning_rate": 1.0276375503339692e-06, + "loss": 1.0772, + "step": 23550 + }, + { + "epoch": 0.71, + "learning_rate": 1.0274404277131015e-06, + "loss": 1.1295, + "step": 23551 + }, + { + "epoch": 0.71, + "learning_rate": 1.0272433191102924e-06, + "loss": 1.152, + "step": 23552 + }, + { + "epoch": 0.71, + "learning_rate": 1.0270462245274165e-06, + "loss": 0.974, + "step": 23553 + }, + { + "epoch": 0.71, + "learning_rate": 1.0268491439663516e-06, + "loss": 0.975, + "step": 23554 + }, + { + "epoch": 0.71, + "learning_rate": 1.0266520774289732e-06, + "loss": 1.0199, + "step": 23555 + }, + { + "epoch": 0.71, + "learning_rate": 1.0264550249171581e-06, + "loss": 1.2222, + "step": 23556 + }, + { + "epoch": 0.71, + "learning_rate": 1.026257986432781e-06, + "loss": 1.1206, + "step": 23557 + }, + { + "epoch": 0.71, + "learning_rate": 1.0260609619777178e-06, + "loss": 1.0941, + "step": 23558 + }, + { + "epoch": 0.71, + "learning_rate": 1.0258639515538446e-06, + "loss": 1.0639, + "step": 23559 + }, + { + "epoch": 0.71, + "learning_rate": 1.0256669551630372e-06, + "loss": 1.1079, + "step": 23560 + }, + { + "epoch": 0.71, + "learning_rate": 1.0254699728071696e-06, + "loss": 1.1489, + "step": 23561 + }, + { + "epoch": 0.71, + "learning_rate": 1.0252730044881178e-06, + "loss": 1.1057, + "step": 23562 + }, + { + "epoch": 0.71, + "learning_rate": 1.0250760502077567e-06, + "loss": 0.9813, + "step": 23563 + }, + { + "epoch": 0.71, + "learning_rate": 1.0248791099679611e-06, + "loss": 1.1553, + "step": 23564 + }, + { + "epoch": 0.71, + "learning_rate": 1.024682183770607e-06, + "loss": 1.0409, + "step": 23565 + }, + { + "epoch": 0.71, + "learning_rate": 1.0244852716175668e-06, + "loss": 1.0739, + "step": 23566 + }, + { + "epoch": 0.71, + "learning_rate": 1.0242883735107166e-06, + "loss": 1.2073, + "step": 23567 + }, + { + "epoch": 0.71, + "learning_rate": 1.02409148945193e-06, + "loss": 1.1441, + "step": 23568 + }, + { + "epoch": 0.71, + "learning_rate": 1.0238946194430818e-06, + "loss": 1.106, + "step": 23569 + }, + { + "epoch": 0.71, + "learning_rate": 1.0236977634860456e-06, + "loss": 1.1781, + "step": 23570 + }, + { + "epoch": 0.71, + "learning_rate": 1.023500921582697e-06, + "loss": 1.2273, + "step": 23571 + }, + { + "epoch": 0.71, + "learning_rate": 1.0233040937349073e-06, + "loss": 1.0632, + "step": 23572 + }, + { + "epoch": 0.71, + "learning_rate": 1.0231072799445519e-06, + "loss": 1.1107, + "step": 23573 + }, + { + "epoch": 0.71, + "learning_rate": 1.0229104802135034e-06, + "loss": 1.1623, + "step": 23574 + }, + { + "epoch": 0.71, + "learning_rate": 1.0227136945436358e-06, + "loss": 1.0522, + "step": 23575 + }, + { + "epoch": 0.71, + "learning_rate": 1.0225169229368226e-06, + "loss": 1.1224, + "step": 23576 + }, + { + "epoch": 0.71, + "learning_rate": 1.0223201653949362e-06, + "loss": 1.0068, + "step": 23577 + }, + { + "epoch": 0.71, + "learning_rate": 1.0221234219198516e-06, + "loss": 1.0579, + "step": 23578 + }, + { + "epoch": 0.71, + "learning_rate": 1.0219266925134391e-06, + "loss": 1.2471, + "step": 23579 + }, + { + "epoch": 0.71, + "learning_rate": 1.021729977177573e-06, + "loss": 1.134, + "step": 23580 + }, + { + "epoch": 0.71, + "learning_rate": 1.021533275914125e-06, + "loss": 1.0911, + "step": 23581 + }, + { + "epoch": 0.71, + "learning_rate": 1.0213365887249694e-06, + "loss": 1.1682, + "step": 23582 + }, + { + "epoch": 0.71, + "learning_rate": 1.0211399156119763e-06, + "loss": 1.0493, + "step": 23583 + }, + { + "epoch": 0.71, + "learning_rate": 1.0209432565770188e-06, + "loss": 1.0312, + "step": 23584 + }, + { + "epoch": 0.71, + "learning_rate": 1.0207466116219693e-06, + "loss": 1.1511, + "step": 23585 + }, + { + "epoch": 0.71, + "learning_rate": 1.0205499807487007e-06, + "loss": 1.1259, + "step": 23586 + }, + { + "epoch": 0.71, + "learning_rate": 1.0203533639590828e-06, + "loss": 1.1055, + "step": 23587 + }, + { + "epoch": 0.71, + "learning_rate": 1.0201567612549882e-06, + "loss": 1.0787, + "step": 23588 + }, + { + "epoch": 0.71, + "learning_rate": 1.0199601726382886e-06, + "loss": 1.1356, + "step": 23589 + }, + { + "epoch": 0.71, + "learning_rate": 1.019763598110855e-06, + "loss": 1.0585, + "step": 23590 + }, + { + "epoch": 0.71, + "learning_rate": 1.0195670376745604e-06, + "loss": 1.1307, + "step": 23591 + }, + { + "epoch": 0.71, + "learning_rate": 1.0193704913312735e-06, + "loss": 1.1716, + "step": 23592 + }, + { + "epoch": 0.71, + "learning_rate": 1.0191739590828665e-06, + "loss": 1.1762, + "step": 23593 + }, + { + "epoch": 0.71, + "learning_rate": 1.01897744093121e-06, + "loss": 1.1147, + "step": 23594 + }, + { + "epoch": 0.71, + "learning_rate": 1.018780936878176e-06, + "loss": 1.0769, + "step": 23595 + }, + { + "epoch": 0.71, + "learning_rate": 1.0185844469256331e-06, + "loss": 1.1097, + "step": 23596 + }, + { + "epoch": 0.71, + "learning_rate": 1.018387971075453e-06, + "loss": 0.9634, + "step": 23597 + }, + { + "epoch": 0.71, + "learning_rate": 1.0181915093295056e-06, + "loss": 1.1552, + "step": 23598 + }, + { + "epoch": 0.71, + "learning_rate": 1.0179950616896617e-06, + "loss": 1.0605, + "step": 23599 + }, + { + "epoch": 0.71, + "learning_rate": 1.0177986281577907e-06, + "loss": 1.0333, + "step": 23600 + }, + { + "epoch": 0.71, + "learning_rate": 1.017602208735763e-06, + "loss": 1.0353, + "step": 23601 + }, + { + "epoch": 0.71, + "learning_rate": 1.0174058034254485e-06, + "loss": 1.1469, + "step": 23602 + }, + { + "epoch": 0.71, + "learning_rate": 1.0172094122287165e-06, + "loss": 1.1588, + "step": 23603 + }, + { + "epoch": 0.71, + "learning_rate": 1.0170130351474379e-06, + "loss": 1.1187, + "step": 23604 + }, + { + "epoch": 0.71, + "learning_rate": 1.01681667218348e-06, + "loss": 1.1302, + "step": 23605 + }, + { + "epoch": 0.71, + "learning_rate": 1.0166203233387129e-06, + "loss": 1.1318, + "step": 23606 + }, + { + "epoch": 0.71, + "learning_rate": 1.016423988615006e-06, + "loss": 1.1232, + "step": 23607 + }, + { + "epoch": 0.71, + "learning_rate": 1.0162276680142292e-06, + "loss": 1.0939, + "step": 23608 + }, + { + "epoch": 0.71, + "learning_rate": 1.0160313615382495e-06, + "loss": 1.0452, + "step": 23609 + }, + { + "epoch": 0.71, + "learning_rate": 1.0158350691889363e-06, + "loss": 1.0868, + "step": 23610 + }, + { + "epoch": 0.71, + "learning_rate": 1.0156387909681586e-06, + "loss": 1.1671, + "step": 23611 + }, + { + "epoch": 0.71, + "learning_rate": 1.0154425268777857e-06, + "loss": 1.1816, + "step": 23612 + }, + { + "epoch": 0.71, + "learning_rate": 1.0152462769196838e-06, + "loss": 1.0854, + "step": 23613 + }, + { + "epoch": 0.71, + "learning_rate": 1.0150500410957223e-06, + "loss": 1.1558, + "step": 23614 + }, + { + "epoch": 0.71, + "learning_rate": 1.0148538194077696e-06, + "loss": 1.1177, + "step": 23615 + }, + { + "epoch": 0.71, + "learning_rate": 1.014657611857693e-06, + "loss": 1.175, + "step": 23616 + }, + { + "epoch": 0.71, + "learning_rate": 1.0144614184473613e-06, + "loss": 1.0275, + "step": 23617 + }, + { + "epoch": 0.71, + "learning_rate": 1.014265239178641e-06, + "loss": 1.2281, + "step": 23618 + }, + { + "epoch": 0.71, + "learning_rate": 1.0140690740533995e-06, + "loss": 1.2523, + "step": 23619 + }, + { + "epoch": 0.71, + "learning_rate": 1.013872923073505e-06, + "loss": 1.1443, + "step": 23620 + }, + { + "epoch": 0.71, + "learning_rate": 1.0136767862408257e-06, + "loss": 1.1525, + "step": 23621 + }, + { + "epoch": 0.71, + "learning_rate": 1.0134806635572263e-06, + "loss": 1.0048, + "step": 23622 + }, + { + "epoch": 0.71, + "learning_rate": 1.0132845550245755e-06, + "loss": 1.0773, + "step": 23623 + }, + { + "epoch": 0.71, + "learning_rate": 1.0130884606447392e-06, + "loss": 1.3239, + "step": 23624 + }, + { + "epoch": 0.71, + "learning_rate": 1.0128923804195847e-06, + "loss": 1.1398, + "step": 23625 + }, + { + "epoch": 0.71, + "learning_rate": 1.0126963143509787e-06, + "loss": 1.0593, + "step": 23626 + }, + { + "epoch": 0.71, + "learning_rate": 1.0125002624407876e-06, + "loss": 1.155, + "step": 23627 + }, + { + "epoch": 0.71, + "learning_rate": 1.0123042246908774e-06, + "loss": 1.1263, + "step": 23628 + }, + { + "epoch": 0.71, + "learning_rate": 1.0121082011031144e-06, + "loss": 1.0592, + "step": 23629 + }, + { + "epoch": 0.71, + "learning_rate": 1.0119121916793658e-06, + "loss": 1.4125, + "step": 23630 + }, + { + "epoch": 0.71, + "learning_rate": 1.0117161964214955e-06, + "loss": 1.2554, + "step": 23631 + }, + { + "epoch": 0.71, + "learning_rate": 1.0115202153313702e-06, + "loss": 1.0433, + "step": 23632 + }, + { + "epoch": 0.71, + "learning_rate": 1.0113242484108557e-06, + "loss": 1.1638, + "step": 23633 + }, + { + "epoch": 0.71, + "learning_rate": 1.0111282956618182e-06, + "loss": 1.1559, + "step": 23634 + }, + { + "epoch": 0.71, + "learning_rate": 1.0109323570861213e-06, + "loss": 1.1687, + "step": 23635 + }, + { + "epoch": 0.71, + "learning_rate": 1.0107364326856312e-06, + "loss": 1.1348, + "step": 23636 + }, + { + "epoch": 0.71, + "learning_rate": 1.010540522462213e-06, + "loss": 0.9702, + "step": 23637 + }, + { + "epoch": 0.71, + "learning_rate": 1.0103446264177327e-06, + "loss": 1.0425, + "step": 23638 + }, + { + "epoch": 0.71, + "learning_rate": 1.010148744554053e-06, + "loss": 1.1664, + "step": 23639 + }, + { + "epoch": 0.71, + "learning_rate": 1.0099528768730398e-06, + "loss": 1.0812, + "step": 23640 + }, + { + "epoch": 0.71, + "learning_rate": 1.0097570233765577e-06, + "loss": 1.0308, + "step": 23641 + }, + { + "epoch": 0.71, + "learning_rate": 1.009561184066471e-06, + "loss": 0.9604, + "step": 23642 + }, + { + "epoch": 0.71, + "learning_rate": 1.0093653589446447e-06, + "loss": 1.1519, + "step": 23643 + }, + { + "epoch": 0.71, + "learning_rate": 1.009169548012942e-06, + "loss": 1.1882, + "step": 23644 + }, + { + "epoch": 0.71, + "learning_rate": 1.0089737512732265e-06, + "loss": 1.0898, + "step": 23645 + }, + { + "epoch": 0.71, + "learning_rate": 1.008777968727363e-06, + "loss": 1.0419, + "step": 23646 + }, + { + "epoch": 0.71, + "learning_rate": 1.0085822003772157e-06, + "loss": 1.106, + "step": 23647 + }, + { + "epoch": 0.71, + "learning_rate": 1.008386446224647e-06, + "loss": 1.0358, + "step": 23648 + }, + { + "epoch": 0.71, + "learning_rate": 1.008190706271521e-06, + "loss": 1.0561, + "step": 23649 + }, + { + "epoch": 0.71, + "learning_rate": 1.007994980519701e-06, + "loss": 1.0525, + "step": 23650 + }, + { + "epoch": 0.71, + "learning_rate": 1.0077992689710498e-06, + "loss": 1.167, + "step": 23651 + }, + { + "epoch": 0.71, + "learning_rate": 1.0076035716274312e-06, + "loss": 1.0029, + "step": 23652 + }, + { + "epoch": 0.71, + "learning_rate": 1.0074078884907087e-06, + "loss": 1.0712, + "step": 23653 + }, + { + "epoch": 0.71, + "learning_rate": 1.0072122195627435e-06, + "loss": 1.1158, + "step": 23654 + }, + { + "epoch": 0.71, + "learning_rate": 1.0070165648453986e-06, + "loss": 1.1033, + "step": 23655 + }, + { + "epoch": 0.71, + "learning_rate": 1.0068209243405372e-06, + "loss": 1.1296, + "step": 23656 + }, + { + "epoch": 0.71, + "learning_rate": 1.0066252980500216e-06, + "loss": 0.9584, + "step": 23657 + }, + { + "epoch": 0.71, + "learning_rate": 1.0064296859757138e-06, + "loss": 1.1628, + "step": 23658 + }, + { + "epoch": 0.71, + "learning_rate": 1.0062340881194759e-06, + "loss": 1.152, + "step": 23659 + }, + { + "epoch": 0.71, + "learning_rate": 1.006038504483171e-06, + "loss": 1.15, + "step": 23660 + }, + { + "epoch": 0.71, + "learning_rate": 1.0058429350686594e-06, + "loss": 1.1748, + "step": 23661 + }, + { + "epoch": 0.71, + "learning_rate": 1.0056473798778033e-06, + "loss": 1.1317, + "step": 23662 + }, + { + "epoch": 0.71, + "learning_rate": 1.0054518389124645e-06, + "loss": 1.1209, + "step": 23663 + }, + { + "epoch": 0.71, + "learning_rate": 1.0052563121745052e-06, + "loss": 1.062, + "step": 23664 + }, + { + "epoch": 0.71, + "learning_rate": 1.005060799665785e-06, + "loss": 1.1199, + "step": 23665 + }, + { + "epoch": 0.71, + "learning_rate": 1.004865301388166e-06, + "loss": 1.1119, + "step": 23666 + }, + { + "epoch": 0.71, + "learning_rate": 1.0046698173435093e-06, + "loss": 1.114, + "step": 23667 + }, + { + "epoch": 0.71, + "learning_rate": 1.0044743475336757e-06, + "loss": 1.119, + "step": 23668 + }, + { + "epoch": 0.71, + "learning_rate": 1.004278891960527e-06, + "loss": 1.1812, + "step": 23669 + }, + { + "epoch": 0.71, + "learning_rate": 1.004083450625922e-06, + "loss": 1.1054, + "step": 23670 + }, + { + "epoch": 0.71, + "learning_rate": 1.0038880235317223e-06, + "loss": 1.0406, + "step": 23671 + }, + { + "epoch": 0.71, + "learning_rate": 1.0036926106797877e-06, + "loss": 1.0864, + "step": 23672 + }, + { + "epoch": 0.71, + "learning_rate": 1.0034972120719796e-06, + "loss": 1.1399, + "step": 23673 + }, + { + "epoch": 0.71, + "learning_rate": 1.0033018277101566e-06, + "loss": 1.103, + "step": 23674 + }, + { + "epoch": 0.71, + "learning_rate": 1.0031064575961797e-06, + "loss": 1.1234, + "step": 23675 + }, + { + "epoch": 0.71, + "learning_rate": 1.002911101731908e-06, + "loss": 1.0983, + "step": 23676 + }, + { + "epoch": 0.71, + "learning_rate": 1.0027157601192025e-06, + "loss": 1.1908, + "step": 23677 + }, + { + "epoch": 0.71, + "learning_rate": 1.002520432759921e-06, + "loss": 1.012, + "step": 23678 + }, + { + "epoch": 0.71, + "learning_rate": 1.002325119655924e-06, + "loss": 1.1711, + "step": 23679 + }, + { + "epoch": 0.71, + "learning_rate": 1.0021298208090703e-06, + "loss": 0.9832, + "step": 23680 + }, + { + "epoch": 0.71, + "learning_rate": 1.0019345362212194e-06, + "loss": 1.1702, + "step": 23681 + }, + { + "epoch": 0.71, + "learning_rate": 1.0017392658942302e-06, + "loss": 1.0213, + "step": 23682 + }, + { + "epoch": 0.71, + "learning_rate": 1.0015440098299614e-06, + "loss": 1.1469, + "step": 23683 + }, + { + "epoch": 0.71, + "learning_rate": 1.0013487680302723e-06, + "loss": 1.1097, + "step": 23684 + }, + { + "epoch": 0.71, + "learning_rate": 1.0011535404970208e-06, + "loss": 1.1985, + "step": 23685 + }, + { + "epoch": 0.71, + "learning_rate": 1.0009583272320669e-06, + "loss": 1.0478, + "step": 23686 + }, + { + "epoch": 0.71, + "learning_rate": 1.0007631282372667e-06, + "loss": 1.0923, + "step": 23687 + }, + { + "epoch": 0.71, + "learning_rate": 1.0005679435144794e-06, + "loss": 1.2186, + "step": 23688 + }, + { + "epoch": 0.71, + "learning_rate": 1.0003727730655633e-06, + "loss": 1.1172, + "step": 23689 + }, + { + "epoch": 0.71, + "learning_rate": 1.000177616892377e-06, + "loss": 1.0956, + "step": 23690 + }, + { + "epoch": 0.71, + "learning_rate": 9.999824749967766e-07, + "loss": 1.1519, + "step": 23691 + }, + { + "epoch": 0.71, + "learning_rate": 9.997873473806205e-07, + "loss": 1.1171, + "step": 23692 + }, + { + "epoch": 0.71, + "learning_rate": 9.995922340457664e-07, + "loss": 1.1385, + "step": 23693 + }, + { + "epoch": 0.71, + "learning_rate": 9.993971349940718e-07, + "loss": 0.9581, + "step": 23694 + }, + { + "epoch": 0.71, + "learning_rate": 9.992020502273944e-07, + "loss": 1.013, + "step": 23695 + }, + { + "epoch": 0.71, + "learning_rate": 9.990069797475897e-07, + "loss": 1.0994, + "step": 23696 + }, + { + "epoch": 0.71, + "learning_rate": 9.988119235565157e-07, + "loss": 1.1201, + "step": 23697 + }, + { + "epoch": 0.71, + "learning_rate": 9.986168816560293e-07, + "loss": 1.2239, + "step": 23698 + }, + { + "epoch": 0.71, + "learning_rate": 9.984218540479881e-07, + "loss": 1.2667, + "step": 23699 + }, + { + "epoch": 0.71, + "learning_rate": 9.982268407342467e-07, + "loss": 1.1249, + "step": 23700 + }, + { + "epoch": 0.71, + "learning_rate": 9.980318417166623e-07, + "loss": 1.1387, + "step": 23701 + }, + { + "epoch": 0.71, + "learning_rate": 9.978368569970915e-07, + "loss": 1.0662, + "step": 23702 + }, + { + "epoch": 0.71, + "learning_rate": 9.976418865773913e-07, + "loss": 1.074, + "step": 23703 + }, + { + "epoch": 0.71, + "learning_rate": 9.974469304594158e-07, + "loss": 1.1099, + "step": 23704 + }, + { + "epoch": 0.71, + "learning_rate": 9.972519886450218e-07, + "loss": 1.0884, + "step": 23705 + }, + { + "epoch": 0.71, + "learning_rate": 9.970570611360656e-07, + "loss": 0.9838, + "step": 23706 + }, + { + "epoch": 0.71, + "learning_rate": 9.968621479344018e-07, + "loss": 0.9453, + "step": 23707 + }, + { + "epoch": 0.71, + "learning_rate": 9.966672490418866e-07, + "loss": 1.038, + "step": 23708 + }, + { + "epoch": 0.71, + "learning_rate": 9.964723644603751e-07, + "loss": 0.9315, + "step": 23709 + }, + { + "epoch": 0.71, + "learning_rate": 9.962774941917227e-07, + "loss": 1.0395, + "step": 23710 + }, + { + "epoch": 0.71, + "learning_rate": 9.960826382377842e-07, + "loss": 1.1429, + "step": 23711 + }, + { + "epoch": 0.71, + "learning_rate": 9.958877966004158e-07, + "loss": 1.2808, + "step": 23712 + }, + { + "epoch": 0.71, + "learning_rate": 9.956929692814698e-07, + "loss": 1.1006, + "step": 23713 + }, + { + "epoch": 0.71, + "learning_rate": 9.954981562828026e-07, + "loss": 1.0888, + "step": 23714 + }, + { + "epoch": 0.71, + "learning_rate": 9.953033576062685e-07, + "loss": 1.0793, + "step": 23715 + }, + { + "epoch": 0.71, + "learning_rate": 9.951085732537222e-07, + "loss": 1.1275, + "step": 23716 + }, + { + "epoch": 0.71, + "learning_rate": 9.949138032270169e-07, + "loss": 1.0974, + "step": 23717 + }, + { + "epoch": 0.71, + "learning_rate": 9.947190475280072e-07, + "loss": 1.1371, + "step": 23718 + }, + { + "epoch": 0.71, + "learning_rate": 9.945243061585475e-07, + "loss": 1.1113, + "step": 23719 + }, + { + "epoch": 0.71, + "learning_rate": 9.94329579120492e-07, + "loss": 1.1683, + "step": 23720 + }, + { + "epoch": 0.71, + "learning_rate": 9.941348664156926e-07, + "loss": 1.173, + "step": 23721 + }, + { + "epoch": 0.71, + "learning_rate": 9.939401680460044e-07, + "loss": 1.1129, + "step": 23722 + }, + { + "epoch": 0.71, + "learning_rate": 9.937454840132804e-07, + "loss": 1.1395, + "step": 23723 + }, + { + "epoch": 0.71, + "learning_rate": 9.93550814319374e-07, + "loss": 1.1565, + "step": 23724 + }, + { + "epoch": 0.71, + "learning_rate": 9.93356158966139e-07, + "loss": 1.0679, + "step": 23725 + }, + { + "epoch": 0.71, + "learning_rate": 9.931615179554268e-07, + "loss": 1.1533, + "step": 23726 + }, + { + "epoch": 0.71, + "learning_rate": 9.929668912890916e-07, + "loss": 0.952, + "step": 23727 + }, + { + "epoch": 0.71, + "learning_rate": 9.927722789689856e-07, + "loss": 1.0813, + "step": 23728 + }, + { + "epoch": 0.71, + "learning_rate": 9.925776809969622e-07, + "loss": 1.0745, + "step": 23729 + }, + { + "epoch": 0.71, + "learning_rate": 9.923830973748726e-07, + "loss": 1.0531, + "step": 23730 + }, + { + "epoch": 0.71, + "learning_rate": 9.921885281045701e-07, + "loss": 1.1324, + "step": 23731 + }, + { + "epoch": 0.71, + "learning_rate": 9.919939731879063e-07, + "loss": 0.9481, + "step": 23732 + }, + { + "epoch": 0.71, + "learning_rate": 9.917994326267335e-07, + "loss": 1.0092, + "step": 23733 + }, + { + "epoch": 0.71, + "learning_rate": 9.91604906422904e-07, + "loss": 1.1572, + "step": 23734 + }, + { + "epoch": 0.72, + "learning_rate": 9.914103945782693e-07, + "loss": 0.9927, + "step": 23735 + }, + { + "epoch": 0.72, + "learning_rate": 9.912158970946819e-07, + "loss": 1.0968, + "step": 23736 + }, + { + "epoch": 0.72, + "learning_rate": 9.910214139739915e-07, + "loss": 1.1196, + "step": 23737 + }, + { + "epoch": 0.72, + "learning_rate": 9.908269452180508e-07, + "loss": 1.0112, + "step": 23738 + }, + { + "epoch": 0.72, + "learning_rate": 9.906324908287104e-07, + "loss": 1.1281, + "step": 23739 + }, + { + "epoch": 0.72, + "learning_rate": 9.904380508078221e-07, + "loss": 1.1495, + "step": 23740 + }, + { + "epoch": 0.72, + "learning_rate": 9.902436251572362e-07, + "loss": 1.1946, + "step": 23741 + }, + { + "epoch": 0.72, + "learning_rate": 9.900492138788049e-07, + "loss": 1.1575, + "step": 23742 + }, + { + "epoch": 0.72, + "learning_rate": 9.898548169743768e-07, + "loss": 1.1998, + "step": 23743 + }, + { + "epoch": 0.72, + "learning_rate": 9.896604344458039e-07, + "loss": 1.1612, + "step": 23744 + }, + { + "epoch": 0.72, + "learning_rate": 9.89466066294936e-07, + "loss": 1.0616, + "step": 23745 + }, + { + "epoch": 0.72, + "learning_rate": 9.892717125236246e-07, + "loss": 1.0905, + "step": 23746 + }, + { + "epoch": 0.72, + "learning_rate": 9.89077373133718e-07, + "loss": 1.069, + "step": 23747 + }, + { + "epoch": 0.72, + "learning_rate": 9.88883048127067e-07, + "loss": 1.2089, + "step": 23748 + }, + { + "epoch": 0.72, + "learning_rate": 9.886887375055218e-07, + "loss": 1.1626, + "step": 23749 + }, + { + "epoch": 0.72, + "learning_rate": 9.88494441270932e-07, + "loss": 1.0533, + "step": 23750 + }, + { + "epoch": 0.72, + "learning_rate": 9.883001594251478e-07, + "loss": 1.0909, + "step": 23751 + }, + { + "epoch": 0.72, + "learning_rate": 9.881058919700173e-07, + "loss": 1.048, + "step": 23752 + }, + { + "epoch": 0.72, + "learning_rate": 9.879116389073906e-07, + "loss": 0.9765, + "step": 23753 + }, + { + "epoch": 0.72, + "learning_rate": 9.877174002391167e-07, + "loss": 1.0945, + "step": 23754 + }, + { + "epoch": 0.72, + "learning_rate": 9.875231759670456e-07, + "loss": 1.1637, + "step": 23755 + }, + { + "epoch": 0.72, + "learning_rate": 9.873289660930249e-07, + "loss": 1.2693, + "step": 23756 + }, + { + "epoch": 0.72, + "learning_rate": 9.871347706189036e-07, + "loss": 1.0656, + "step": 23757 + }, + { + "epoch": 0.72, + "learning_rate": 9.869405895465308e-07, + "loss": 1.0799, + "step": 23758 + }, + { + "epoch": 0.72, + "learning_rate": 9.867464228777557e-07, + "loss": 0.9847, + "step": 23759 + }, + { + "epoch": 0.72, + "learning_rate": 9.86552270614425e-07, + "loss": 1.1434, + "step": 23760 + }, + { + "epoch": 0.72, + "learning_rate": 9.863581327583877e-07, + "loss": 1.1978, + "step": 23761 + }, + { + "epoch": 0.72, + "learning_rate": 9.86164009311492e-07, + "loss": 1.1388, + "step": 23762 + }, + { + "epoch": 0.72, + "learning_rate": 9.85969900275586e-07, + "loss": 1.1425, + "step": 23763 + }, + { + "epoch": 0.72, + "learning_rate": 9.857758056525175e-07, + "loss": 1.0347, + "step": 23764 + }, + { + "epoch": 0.72, + "learning_rate": 9.855817254441335e-07, + "loss": 1.0932, + "step": 23765 + }, + { + "epoch": 0.72, + "learning_rate": 9.853876596522826e-07, + "loss": 1.2066, + "step": 23766 + }, + { + "epoch": 0.72, + "learning_rate": 9.851936082788117e-07, + "loss": 1.1162, + "step": 23767 + }, + { + "epoch": 0.72, + "learning_rate": 9.849995713255687e-07, + "loss": 1.1041, + "step": 23768 + }, + { + "epoch": 0.72, + "learning_rate": 9.848055487943995e-07, + "loss": 1.1454, + "step": 23769 + }, + { + "epoch": 0.72, + "learning_rate": 9.846115406871515e-07, + "loss": 1.0428, + "step": 23770 + }, + { + "epoch": 0.72, + "learning_rate": 9.844175470056718e-07, + "loss": 1.1536, + "step": 23771 + }, + { + "epoch": 0.72, + "learning_rate": 9.84223567751808e-07, + "loss": 1.0558, + "step": 23772 + }, + { + "epoch": 0.72, + "learning_rate": 9.840296029274052e-07, + "loss": 1.0891, + "step": 23773 + }, + { + "epoch": 0.72, + "learning_rate": 9.8383565253431e-07, + "loss": 1.0204, + "step": 23774 + }, + { + "epoch": 0.72, + "learning_rate": 9.836417165743698e-07, + "loss": 1.0525, + "step": 23775 + }, + { + "epoch": 0.72, + "learning_rate": 9.834477950494297e-07, + "loss": 1.11, + "step": 23776 + }, + { + "epoch": 0.72, + "learning_rate": 9.832538879613374e-07, + "loss": 1.1151, + "step": 23777 + }, + { + "epoch": 0.72, + "learning_rate": 9.830599953119364e-07, + "loss": 1.1135, + "step": 23778 + }, + { + "epoch": 0.72, + "learning_rate": 9.828661171030737e-07, + "loss": 1.0287, + "step": 23779 + }, + { + "epoch": 0.72, + "learning_rate": 9.826722533365952e-07, + "loss": 1.1299, + "step": 23780 + }, + { + "epoch": 0.72, + "learning_rate": 9.824784040143468e-07, + "loss": 1.2086, + "step": 23781 + }, + { + "epoch": 0.72, + "learning_rate": 9.82284569138172e-07, + "loss": 1.0612, + "step": 23782 + }, + { + "epoch": 0.72, + "learning_rate": 9.820907487099174e-07, + "loss": 1.0988, + "step": 23783 + }, + { + "epoch": 0.72, + "learning_rate": 9.818969427314276e-07, + "loss": 1.0797, + "step": 23784 + }, + { + "epoch": 0.72, + "learning_rate": 9.817031512045489e-07, + "loss": 1.0542, + "step": 23785 + }, + { + "epoch": 0.72, + "learning_rate": 9.81509374131124e-07, + "loss": 1.0469, + "step": 23786 + }, + { + "epoch": 0.72, + "learning_rate": 9.813156115129985e-07, + "loss": 1.1118, + "step": 23787 + }, + { + "epoch": 0.72, + "learning_rate": 9.81121863352017e-07, + "loss": 1.0419, + "step": 23788 + }, + { + "epoch": 0.72, + "learning_rate": 9.809281296500237e-07, + "loss": 1.1415, + "step": 23789 + }, + { + "epoch": 0.72, + "learning_rate": 9.80734410408863e-07, + "loss": 1.0787, + "step": 23790 + }, + { + "epoch": 0.72, + "learning_rate": 9.805407056303792e-07, + "loss": 1.1349, + "step": 23791 + }, + { + "epoch": 0.72, + "learning_rate": 9.80347015316416e-07, + "loss": 1.1937, + "step": 23792 + }, + { + "epoch": 0.72, + "learning_rate": 9.801533394688173e-07, + "loss": 1.1207, + "step": 23793 + }, + { + "epoch": 0.72, + "learning_rate": 9.799596780894276e-07, + "loss": 1.0194, + "step": 23794 + }, + { + "epoch": 0.72, + "learning_rate": 9.797660311800892e-07, + "loss": 1.1754, + "step": 23795 + }, + { + "epoch": 0.72, + "learning_rate": 9.795723987426456e-07, + "loss": 1.1268, + "step": 23796 + }, + { + "epoch": 0.72, + "learning_rate": 9.793787807789406e-07, + "loss": 1.1639, + "step": 23797 + }, + { + "epoch": 0.72, + "learning_rate": 9.791851772908182e-07, + "loss": 1.1062, + "step": 23798 + }, + { + "epoch": 0.72, + "learning_rate": 9.789915882801196e-07, + "loss": 1.1361, + "step": 23799 + }, + { + "epoch": 0.72, + "learning_rate": 9.787980137486886e-07, + "loss": 1.0821, + "step": 23800 + }, + { + "epoch": 0.72, + "learning_rate": 9.786044536983676e-07, + "loss": 1.1869, + "step": 23801 + }, + { + "epoch": 0.72, + "learning_rate": 9.784109081309998e-07, + "loss": 1.0593, + "step": 23802 + }, + { + "epoch": 0.72, + "learning_rate": 9.782173770484279e-07, + "loss": 1.0964, + "step": 23803 + }, + { + "epoch": 0.72, + "learning_rate": 9.78023860452493e-07, + "loss": 1.1116, + "step": 23804 + }, + { + "epoch": 0.72, + "learning_rate": 9.77830358345038e-07, + "loss": 1.129, + "step": 23805 + }, + { + "epoch": 0.72, + "learning_rate": 9.776368707279046e-07, + "loss": 1.2009, + "step": 23806 + }, + { + "epoch": 0.72, + "learning_rate": 9.77443397602936e-07, + "loss": 1.1437, + "step": 23807 + }, + { + "epoch": 0.72, + "learning_rate": 9.772499389719722e-07, + "loss": 1.043, + "step": 23808 + }, + { + "epoch": 0.72, + "learning_rate": 9.770564948368555e-07, + "loss": 1.0917, + "step": 23809 + }, + { + "epoch": 0.72, + "learning_rate": 9.768630651994274e-07, + "loss": 1.1315, + "step": 23810 + }, + { + "epoch": 0.72, + "learning_rate": 9.766696500615305e-07, + "loss": 1.0987, + "step": 23811 + }, + { + "epoch": 0.72, + "learning_rate": 9.764762494250039e-07, + "loss": 1.1215, + "step": 23812 + }, + { + "epoch": 0.72, + "learning_rate": 9.762828632916894e-07, + "loss": 1.1405, + "step": 23813 + }, + { + "epoch": 0.72, + "learning_rate": 9.760894916634283e-07, + "loss": 1.1593, + "step": 23814 + }, + { + "epoch": 0.72, + "learning_rate": 9.758961345420615e-07, + "loss": 1.1445, + "step": 23815 + }, + { + "epoch": 0.72, + "learning_rate": 9.757027919294292e-07, + "loss": 1.1339, + "step": 23816 + }, + { + "epoch": 0.72, + "learning_rate": 9.755094638273724e-07, + "loss": 1.0607, + "step": 23817 + }, + { + "epoch": 0.72, + "learning_rate": 9.75316150237732e-07, + "loss": 1.2789, + "step": 23818 + }, + { + "epoch": 0.72, + "learning_rate": 9.75122851162347e-07, + "loss": 1.1679, + "step": 23819 + }, + { + "epoch": 0.72, + "learning_rate": 9.749295666030579e-07, + "loss": 1.2177, + "step": 23820 + }, + { + "epoch": 0.72, + "learning_rate": 9.747362965617047e-07, + "loss": 1.1142, + "step": 23821 + }, + { + "epoch": 0.72, + "learning_rate": 9.745430410401272e-07, + "loss": 1.096, + "step": 23822 + }, + { + "epoch": 0.72, + "learning_rate": 9.743498000401654e-07, + "loss": 1.2077, + "step": 23823 + }, + { + "epoch": 0.72, + "learning_rate": 9.741565735636598e-07, + "loss": 1.1057, + "step": 23824 + }, + { + "epoch": 0.72, + "learning_rate": 9.739633616124477e-07, + "loss": 1.1566, + "step": 23825 + }, + { + "epoch": 0.72, + "learning_rate": 9.737701641883696e-07, + "loss": 1.1545, + "step": 23826 + }, + { + "epoch": 0.72, + "learning_rate": 9.735769812932641e-07, + "loss": 1.0376, + "step": 23827 + }, + { + "epoch": 0.72, + "learning_rate": 9.733838129289711e-07, + "loss": 1.0365, + "step": 23828 + }, + { + "epoch": 0.72, + "learning_rate": 9.731906590973295e-07, + "loss": 1.0284, + "step": 23829 + }, + { + "epoch": 0.72, + "learning_rate": 9.729975198001764e-07, + "loss": 1.0607, + "step": 23830 + }, + { + "epoch": 0.72, + "learning_rate": 9.72804395039352e-07, + "loss": 1.1256, + "step": 23831 + }, + { + "epoch": 0.72, + "learning_rate": 9.72611284816694e-07, + "loss": 1.1748, + "step": 23832 + }, + { + "epoch": 0.72, + "learning_rate": 9.724181891340417e-07, + "loss": 1.0765, + "step": 23833 + }, + { + "epoch": 0.72, + "learning_rate": 9.722251079932318e-07, + "loss": 1.0203, + "step": 23834 + }, + { + "epoch": 0.72, + "learning_rate": 9.720320413961031e-07, + "loss": 1.0692, + "step": 23835 + }, + { + "epoch": 0.72, + "learning_rate": 9.718389893444934e-07, + "loss": 1.066, + "step": 23836 + }, + { + "epoch": 0.72, + "learning_rate": 9.716459518402415e-07, + "loss": 1.1594, + "step": 23837 + }, + { + "epoch": 0.72, + "learning_rate": 9.714529288851832e-07, + "loss": 1.1533, + "step": 23838 + }, + { + "epoch": 0.72, + "learning_rate": 9.712599204811569e-07, + "loss": 1.0523, + "step": 23839 + }, + { + "epoch": 0.72, + "learning_rate": 9.710669266299996e-07, + "loss": 1.0262, + "step": 23840 + }, + { + "epoch": 0.72, + "learning_rate": 9.708739473335488e-07, + "loss": 1.0824, + "step": 23841 + }, + { + "epoch": 0.72, + "learning_rate": 9.706809825936427e-07, + "loss": 1.0878, + "step": 23842 + }, + { + "epoch": 0.72, + "learning_rate": 9.704880324121161e-07, + "loss": 1.2216, + "step": 23843 + }, + { + "epoch": 0.72, + "learning_rate": 9.702950967908067e-07, + "loss": 1.1667, + "step": 23844 + }, + { + "epoch": 0.72, + "learning_rate": 9.701021757315514e-07, + "loss": 1.0847, + "step": 23845 + }, + { + "epoch": 0.72, + "learning_rate": 9.699092692361867e-07, + "loss": 1.1254, + "step": 23846 + }, + { + "epoch": 0.72, + "learning_rate": 9.697163773065484e-07, + "loss": 1.0761, + "step": 23847 + }, + { + "epoch": 0.72, + "learning_rate": 9.695234999444735e-07, + "loss": 1.1628, + "step": 23848 + }, + { + "epoch": 0.72, + "learning_rate": 9.693306371517977e-07, + "loss": 1.0703, + "step": 23849 + }, + { + "epoch": 0.72, + "learning_rate": 9.69137788930358e-07, + "loss": 1.176, + "step": 23850 + }, + { + "epoch": 0.72, + "learning_rate": 9.689449552819881e-07, + "loss": 1.0416, + "step": 23851 + }, + { + "epoch": 0.72, + "learning_rate": 9.687521362085253e-07, + "loss": 1.1237, + "step": 23852 + }, + { + "epoch": 0.72, + "learning_rate": 9.685593317118044e-07, + "loss": 1.1196, + "step": 23853 + }, + { + "epoch": 0.72, + "learning_rate": 9.683665417936614e-07, + "loss": 1.0607, + "step": 23854 + }, + { + "epoch": 0.72, + "learning_rate": 9.681737664559318e-07, + "loss": 1.1573, + "step": 23855 + }, + { + "epoch": 0.72, + "learning_rate": 9.679810057004494e-07, + "loss": 1.1243, + "step": 23856 + }, + { + "epoch": 0.72, + "learning_rate": 9.6778825952905e-07, + "loss": 1.0934, + "step": 23857 + }, + { + "epoch": 0.72, + "learning_rate": 9.675955279435683e-07, + "loss": 1.0911, + "step": 23858 + }, + { + "epoch": 0.72, + "learning_rate": 9.674028109458403e-07, + "loss": 1.2061, + "step": 23859 + }, + { + "epoch": 0.72, + "learning_rate": 9.67210108537698e-07, + "loss": 1.2046, + "step": 23860 + }, + { + "epoch": 0.72, + "learning_rate": 9.670174207209778e-07, + "loss": 1.165, + "step": 23861 + }, + { + "epoch": 0.72, + "learning_rate": 9.668247474975134e-07, + "loss": 1.0321, + "step": 23862 + }, + { + "epoch": 0.72, + "learning_rate": 9.666320888691396e-07, + "loss": 1.106, + "step": 23863 + }, + { + "epoch": 0.72, + "learning_rate": 9.66439444837689e-07, + "loss": 1.2202, + "step": 23864 + }, + { + "epoch": 0.72, + "learning_rate": 9.662468154049964e-07, + "loss": 1.0917, + "step": 23865 + }, + { + "epoch": 0.72, + "learning_rate": 9.660542005728954e-07, + "loss": 1.1539, + "step": 23866 + }, + { + "epoch": 0.72, + "learning_rate": 9.658616003432198e-07, + "loss": 1.2776, + "step": 23867 + }, + { + "epoch": 0.72, + "learning_rate": 9.656690147178036e-07, + "loss": 1.1431, + "step": 23868 + }, + { + "epoch": 0.72, + "learning_rate": 9.654764436984787e-07, + "loss": 1.1946, + "step": 23869 + }, + { + "epoch": 0.72, + "learning_rate": 9.652838872870787e-07, + "loss": 1.0553, + "step": 23870 + }, + { + "epoch": 0.72, + "learning_rate": 9.65091345485437e-07, + "loss": 1.1232, + "step": 23871 + }, + { + "epoch": 0.72, + "learning_rate": 9.648988182953867e-07, + "loss": 0.9994, + "step": 23872 + }, + { + "epoch": 0.72, + "learning_rate": 9.647063057187603e-07, + "loss": 1.1211, + "step": 23873 + }, + { + "epoch": 0.72, + "learning_rate": 9.645138077573904e-07, + "loss": 1.1555, + "step": 23874 + }, + { + "epoch": 0.72, + "learning_rate": 9.643213244131095e-07, + "loss": 1.036, + "step": 23875 + }, + { + "epoch": 0.72, + "learning_rate": 9.641288556877507e-07, + "loss": 1.1652, + "step": 23876 + }, + { + "epoch": 0.72, + "learning_rate": 9.63936401583145e-07, + "loss": 1.0464, + "step": 23877 + }, + { + "epoch": 0.72, + "learning_rate": 9.637439621011243e-07, + "loss": 1.0198, + "step": 23878 + }, + { + "epoch": 0.72, + "learning_rate": 9.635515372435216e-07, + "loss": 1.1317, + "step": 23879 + }, + { + "epoch": 0.72, + "learning_rate": 9.633591270121683e-07, + "loss": 1.1442, + "step": 23880 + }, + { + "epoch": 0.72, + "learning_rate": 9.631667314088972e-07, + "loss": 1.1216, + "step": 23881 + }, + { + "epoch": 0.72, + "learning_rate": 9.629743504355374e-07, + "loss": 1.1048, + "step": 23882 + }, + { + "epoch": 0.72, + "learning_rate": 9.627819840939218e-07, + "loss": 1.0464, + "step": 23883 + }, + { + "epoch": 0.72, + "learning_rate": 9.62589632385881e-07, + "loss": 1.1092, + "step": 23884 + }, + { + "epoch": 0.72, + "learning_rate": 9.623972953132477e-07, + "loss": 1.1306, + "step": 23885 + }, + { + "epoch": 0.72, + "learning_rate": 9.622049728778505e-07, + "loss": 1.1881, + "step": 23886 + }, + { + "epoch": 0.72, + "learning_rate": 9.620126650815212e-07, + "loss": 1.115, + "step": 23887 + }, + { + "epoch": 0.72, + "learning_rate": 9.618203719260907e-07, + "loss": 0.9645, + "step": 23888 + }, + { + "epoch": 0.72, + "learning_rate": 9.616280934133906e-07, + "loss": 1.1031, + "step": 23889 + }, + { + "epoch": 0.72, + "learning_rate": 9.614358295452492e-07, + "loss": 1.0917, + "step": 23890 + }, + { + "epoch": 0.72, + "learning_rate": 9.612435803234972e-07, + "loss": 1.1267, + "step": 23891 + }, + { + "epoch": 0.72, + "learning_rate": 9.61051345749966e-07, + "loss": 1.131, + "step": 23892 + }, + { + "epoch": 0.72, + "learning_rate": 9.608591258264844e-07, + "loss": 1.1497, + "step": 23893 + }, + { + "epoch": 0.72, + "learning_rate": 9.606669205548835e-07, + "loss": 1.0727, + "step": 23894 + }, + { + "epoch": 0.72, + "learning_rate": 9.604747299369913e-07, + "loss": 1.0363, + "step": 23895 + }, + { + "epoch": 0.72, + "learning_rate": 9.602825539746383e-07, + "loss": 1.0604, + "step": 23896 + }, + { + "epoch": 0.72, + "learning_rate": 9.600903926696537e-07, + "loss": 1.0261, + "step": 23897 + }, + { + "epoch": 0.72, + "learning_rate": 9.598982460238667e-07, + "loss": 1.0427, + "step": 23898 + }, + { + "epoch": 0.72, + "learning_rate": 9.59706114039107e-07, + "loss": 1.1592, + "step": 23899 + }, + { + "epoch": 0.72, + "learning_rate": 9.595139967172042e-07, + "loss": 1.1979, + "step": 23900 + }, + { + "epoch": 0.72, + "learning_rate": 9.593218940599853e-07, + "loss": 1.0121, + "step": 23901 + }, + { + "epoch": 0.72, + "learning_rate": 9.591298060692796e-07, + "loss": 1.1774, + "step": 23902 + }, + { + "epoch": 0.72, + "learning_rate": 9.589377327469165e-07, + "loss": 1.1171, + "step": 23903 + }, + { + "epoch": 0.72, + "learning_rate": 9.587456740947238e-07, + "loss": 1.1619, + "step": 23904 + }, + { + "epoch": 0.72, + "learning_rate": 9.5855363011453e-07, + "loss": 1.0967, + "step": 23905 + }, + { + "epoch": 0.72, + "learning_rate": 9.583616008081641e-07, + "loss": 1.2237, + "step": 23906 + }, + { + "epoch": 0.72, + "learning_rate": 9.581695861774523e-07, + "loss": 1.0556, + "step": 23907 + }, + { + "epoch": 0.72, + "learning_rate": 9.579775862242238e-07, + "loss": 1.0763, + "step": 23908 + }, + { + "epoch": 0.72, + "learning_rate": 9.577856009503056e-07, + "loss": 1.0258, + "step": 23909 + }, + { + "epoch": 0.72, + "learning_rate": 9.575936303575262e-07, + "loss": 1.0667, + "step": 23910 + }, + { + "epoch": 0.72, + "learning_rate": 9.574016744477129e-07, + "loss": 1.1476, + "step": 23911 + }, + { + "epoch": 0.72, + "learning_rate": 9.572097332226923e-07, + "loss": 1.1307, + "step": 23912 + }, + { + "epoch": 0.72, + "learning_rate": 9.57017806684292e-07, + "loss": 1.2097, + "step": 23913 + }, + { + "epoch": 0.72, + "learning_rate": 9.568258948343387e-07, + "loss": 1.1494, + "step": 23914 + }, + { + "epoch": 0.72, + "learning_rate": 9.566339976746607e-07, + "loss": 1.0492, + "step": 23915 + }, + { + "epoch": 0.72, + "learning_rate": 9.564421152070829e-07, + "loss": 0.9939, + "step": 23916 + }, + { + "epoch": 0.72, + "learning_rate": 9.562502474334328e-07, + "loss": 1.2317, + "step": 23917 + }, + { + "epoch": 0.72, + "learning_rate": 9.560583943555369e-07, + "loss": 1.1129, + "step": 23918 + }, + { + "epoch": 0.72, + "learning_rate": 9.558665559752222e-07, + "loss": 1.1301, + "step": 23919 + }, + { + "epoch": 0.72, + "learning_rate": 9.556747322943133e-07, + "loss": 1.1495, + "step": 23920 + }, + { + "epoch": 0.72, + "learning_rate": 9.554829233146374e-07, + "loss": 1.0057, + "step": 23921 + }, + { + "epoch": 0.72, + "learning_rate": 9.552911290380202e-07, + "loss": 1.067, + "step": 23922 + }, + { + "epoch": 0.72, + "learning_rate": 9.550993494662872e-07, + "loss": 1.1074, + "step": 23923 + }, + { + "epoch": 0.72, + "learning_rate": 9.549075846012654e-07, + "loss": 1.0966, + "step": 23924 + }, + { + "epoch": 0.72, + "learning_rate": 9.547158344447785e-07, + "loss": 1.0963, + "step": 23925 + }, + { + "epoch": 0.72, + "learning_rate": 9.545240989986524e-07, + "loss": 1.1088, + "step": 23926 + }, + { + "epoch": 0.72, + "learning_rate": 9.543323782647127e-07, + "loss": 1.1437, + "step": 23927 + }, + { + "epoch": 0.72, + "learning_rate": 9.541406722447843e-07, + "loss": 1.032, + "step": 23928 + }, + { + "epoch": 0.72, + "learning_rate": 9.53948980940692e-07, + "loss": 1.1111, + "step": 23929 + }, + { + "epoch": 0.72, + "learning_rate": 9.537573043542612e-07, + "loss": 1.0997, + "step": 23930 + }, + { + "epoch": 0.72, + "learning_rate": 9.53565642487316e-07, + "loss": 1.084, + "step": 23931 + }, + { + "epoch": 0.72, + "learning_rate": 9.533739953416818e-07, + "loss": 1.0665, + "step": 23932 + }, + { + "epoch": 0.72, + "learning_rate": 9.531823629191816e-07, + "loss": 1.162, + "step": 23933 + }, + { + "epoch": 0.72, + "learning_rate": 9.529907452216403e-07, + "loss": 1.084, + "step": 23934 + }, + { + "epoch": 0.72, + "learning_rate": 9.52799142250882e-07, + "loss": 0.9495, + "step": 23935 + }, + { + "epoch": 0.72, + "learning_rate": 9.526075540087307e-07, + "loss": 1.2548, + "step": 23936 + }, + { + "epoch": 0.72, + "learning_rate": 9.524159804970109e-07, + "loss": 1.1524, + "step": 23937 + }, + { + "epoch": 0.72, + "learning_rate": 9.522244217175449e-07, + "loss": 1.1098, + "step": 23938 + }, + { + "epoch": 0.72, + "learning_rate": 9.520328776721572e-07, + "loss": 1.0559, + "step": 23939 + }, + { + "epoch": 0.72, + "learning_rate": 9.518413483626709e-07, + "loss": 1.0495, + "step": 23940 + }, + { + "epoch": 0.72, + "learning_rate": 9.5164983379091e-07, + "loss": 1.0886, + "step": 23941 + }, + { + "epoch": 0.72, + "learning_rate": 9.514583339586963e-07, + "loss": 1.1843, + "step": 23942 + }, + { + "epoch": 0.72, + "learning_rate": 9.512668488678534e-07, + "loss": 1.0851, + "step": 23943 + }, + { + "epoch": 0.72, + "learning_rate": 9.510753785202043e-07, + "loss": 1.0381, + "step": 23944 + }, + { + "epoch": 0.72, + "learning_rate": 9.508839229175724e-07, + "loss": 1.0623, + "step": 23945 + }, + { + "epoch": 0.72, + "learning_rate": 9.506924820617786e-07, + "loss": 1.0067, + "step": 23946 + }, + { + "epoch": 0.72, + "learning_rate": 9.50501055954646e-07, + "loss": 1.193, + "step": 23947 + }, + { + "epoch": 0.72, + "learning_rate": 9.503096445979973e-07, + "loss": 1.0692, + "step": 23948 + }, + { + "epoch": 0.72, + "learning_rate": 9.501182479936544e-07, + "loss": 1.1329, + "step": 23949 + }, + { + "epoch": 0.72, + "learning_rate": 9.499268661434402e-07, + "loss": 1.1351, + "step": 23950 + }, + { + "epoch": 0.72, + "learning_rate": 9.497354990491747e-07, + "loss": 1.091, + "step": 23951 + }, + { + "epoch": 0.72, + "learning_rate": 9.495441467126806e-07, + "loss": 1.1376, + "step": 23952 + }, + { + "epoch": 0.72, + "learning_rate": 9.493528091357798e-07, + "loss": 1.1678, + "step": 23953 + }, + { + "epoch": 0.72, + "learning_rate": 9.491614863202933e-07, + "loss": 1.1826, + "step": 23954 + }, + { + "epoch": 0.72, + "learning_rate": 9.489701782680425e-07, + "loss": 1.11, + "step": 23955 + }, + { + "epoch": 0.72, + "learning_rate": 9.487788849808486e-07, + "loss": 1.1581, + "step": 23956 + }, + { + "epoch": 0.72, + "learning_rate": 9.485876064605326e-07, + "loss": 1.0583, + "step": 23957 + }, + { + "epoch": 0.72, + "learning_rate": 9.483963427089162e-07, + "loss": 1.1206, + "step": 23958 + }, + { + "epoch": 0.72, + "learning_rate": 9.482050937278187e-07, + "loss": 1.0605, + "step": 23959 + }, + { + "epoch": 0.72, + "learning_rate": 9.480138595190611e-07, + "loss": 1.1865, + "step": 23960 + }, + { + "epoch": 0.72, + "learning_rate": 9.478226400844642e-07, + "loss": 1.0717, + "step": 23961 + }, + { + "epoch": 0.72, + "learning_rate": 9.476314354258481e-07, + "loss": 0.9777, + "step": 23962 + }, + { + "epoch": 0.72, + "learning_rate": 9.47440245545034e-07, + "loss": 1.1663, + "step": 23963 + }, + { + "epoch": 0.72, + "learning_rate": 9.472490704438403e-07, + "loss": 1.0408, + "step": 23964 + }, + { + "epoch": 0.72, + "learning_rate": 9.470579101240876e-07, + "loss": 1.0328, + "step": 23965 + }, + { + "epoch": 0.72, + "learning_rate": 9.468667645875957e-07, + "loss": 1.1213, + "step": 23966 + }, + { + "epoch": 0.72, + "learning_rate": 9.466756338361849e-07, + "loss": 1.1242, + "step": 23967 + }, + { + "epoch": 0.72, + "learning_rate": 9.46484517871673e-07, + "loss": 1.1331, + "step": 23968 + }, + { + "epoch": 0.72, + "learning_rate": 9.462934166958806e-07, + "loss": 1.0668, + "step": 23969 + }, + { + "epoch": 0.72, + "learning_rate": 9.461023303106265e-07, + "loss": 1.2331, + "step": 23970 + }, + { + "epoch": 0.72, + "learning_rate": 9.459112587177305e-07, + "loss": 1.0651, + "step": 23971 + }, + { + "epoch": 0.72, + "learning_rate": 9.457202019190101e-07, + "loss": 1.0629, + "step": 23972 + }, + { + "epoch": 0.72, + "learning_rate": 9.45529159916285e-07, + "loss": 1.0604, + "step": 23973 + }, + { + "epoch": 0.72, + "learning_rate": 9.453381327113733e-07, + "loss": 1.0289, + "step": 23974 + }, + { + "epoch": 0.72, + "learning_rate": 9.451471203060941e-07, + "loss": 1.0992, + "step": 23975 + }, + { + "epoch": 0.72, + "learning_rate": 9.449561227022664e-07, + "loss": 1.118, + "step": 23976 + }, + { + "epoch": 0.72, + "learning_rate": 9.447651399017063e-07, + "loss": 1.0693, + "step": 23977 + }, + { + "epoch": 0.72, + "learning_rate": 9.445741719062332e-07, + "loss": 1.2012, + "step": 23978 + }, + { + "epoch": 0.72, + "learning_rate": 9.443832187176647e-07, + "loss": 1.11, + "step": 23979 + }, + { + "epoch": 0.72, + "learning_rate": 9.441922803378189e-07, + "loss": 1.11, + "step": 23980 + }, + { + "epoch": 0.72, + "learning_rate": 9.440013567685132e-07, + "loss": 1.0829, + "step": 23981 + }, + { + "epoch": 0.72, + "learning_rate": 9.438104480115662e-07, + "loss": 1.1224, + "step": 23982 + }, + { + "epoch": 0.72, + "learning_rate": 9.436195540687934e-07, + "loss": 0.9775, + "step": 23983 + }, + { + "epoch": 0.72, + "learning_rate": 9.434286749420126e-07, + "loss": 0.9801, + "step": 23984 + }, + { + "epoch": 0.72, + "learning_rate": 9.432378106330415e-07, + "loss": 1.1703, + "step": 23985 + }, + { + "epoch": 0.72, + "learning_rate": 9.430469611436965e-07, + "loss": 1.1444, + "step": 23986 + }, + { + "epoch": 0.72, + "learning_rate": 9.428561264757946e-07, + "loss": 1.183, + "step": 23987 + }, + { + "epoch": 0.72, + "learning_rate": 9.426653066311522e-07, + "loss": 1.0477, + "step": 23988 + }, + { + "epoch": 0.72, + "learning_rate": 9.424745016115871e-07, + "loss": 1.1205, + "step": 23989 + }, + { + "epoch": 0.72, + "learning_rate": 9.42283711418914e-07, + "loss": 1.0231, + "step": 23990 + }, + { + "epoch": 0.72, + "learning_rate": 9.420929360549494e-07, + "loss": 1.0942, + "step": 23991 + }, + { + "epoch": 0.72, + "learning_rate": 9.419021755215099e-07, + "loss": 1.1479, + "step": 23992 + }, + { + "epoch": 0.72, + "learning_rate": 9.417114298204122e-07, + "loss": 1.0361, + "step": 23993 + }, + { + "epoch": 0.72, + "learning_rate": 9.415206989534701e-07, + "loss": 1.1526, + "step": 23994 + }, + { + "epoch": 0.72, + "learning_rate": 9.413299829225003e-07, + "loss": 1.0489, + "step": 23995 + }, + { + "epoch": 0.72, + "learning_rate": 9.411392817293188e-07, + "loss": 1.1144, + "step": 23996 + }, + { + "epoch": 0.72, + "learning_rate": 9.409485953757411e-07, + "loss": 1.1225, + "step": 23997 + }, + { + "epoch": 0.72, + "learning_rate": 9.407579238635811e-07, + "loss": 1.1457, + "step": 23998 + }, + { + "epoch": 0.72, + "learning_rate": 9.405672671946547e-07, + "loss": 1.158, + "step": 23999 + }, + { + "epoch": 0.72, + "learning_rate": 9.403766253707769e-07, + "loss": 1.0867, + "step": 24000 + }, + { + "epoch": 0.72, + "learning_rate": 9.401859983937625e-07, + "loss": 1.0768, + "step": 24001 + }, + { + "epoch": 0.72, + "learning_rate": 9.399953862654271e-07, + "loss": 1.1613, + "step": 24002 + }, + { + "epoch": 0.72, + "learning_rate": 9.398047889875833e-07, + "loss": 1.0943, + "step": 24003 + }, + { + "epoch": 0.72, + "learning_rate": 9.396142065620467e-07, + "loss": 1.1418, + "step": 24004 + }, + { + "epoch": 0.72, + "learning_rate": 9.394236389906311e-07, + "loss": 1.0984, + "step": 24005 + }, + { + "epoch": 0.72, + "learning_rate": 9.392330862751517e-07, + "loss": 1.0609, + "step": 24006 + }, + { + "epoch": 0.72, + "learning_rate": 9.390425484174209e-07, + "loss": 1.0391, + "step": 24007 + }, + { + "epoch": 0.72, + "learning_rate": 9.388520254192532e-07, + "loss": 1.0977, + "step": 24008 + }, + { + "epoch": 0.72, + "learning_rate": 9.386615172824626e-07, + "loss": 1.1066, + "step": 24009 + }, + { + "epoch": 0.72, + "learning_rate": 9.384710240088621e-07, + "loss": 1.2231, + "step": 24010 + }, + { + "epoch": 0.72, + "learning_rate": 9.382805456002656e-07, + "loss": 0.9826, + "step": 24011 + }, + { + "epoch": 0.72, + "learning_rate": 9.380900820584859e-07, + "loss": 1.2366, + "step": 24012 + }, + { + "epoch": 0.72, + "learning_rate": 9.378996333853362e-07, + "loss": 1.1273, + "step": 24013 + }, + { + "epoch": 0.72, + "learning_rate": 9.377091995826301e-07, + "loss": 1.043, + "step": 24014 + }, + { + "epoch": 0.72, + "learning_rate": 9.375187806521807e-07, + "loss": 1.0423, + "step": 24015 + }, + { + "epoch": 0.72, + "learning_rate": 9.373283765957991e-07, + "loss": 1.0191, + "step": 24016 + }, + { + "epoch": 0.72, + "learning_rate": 9.371379874152989e-07, + "loss": 1.11, + "step": 24017 + }, + { + "epoch": 0.72, + "learning_rate": 9.369476131124921e-07, + "loss": 1.0978, + "step": 24018 + }, + { + "epoch": 0.72, + "learning_rate": 9.367572536891922e-07, + "loss": 1.2517, + "step": 24019 + }, + { + "epoch": 0.72, + "learning_rate": 9.365669091472097e-07, + "loss": 1.1354, + "step": 24020 + }, + { + "epoch": 0.72, + "learning_rate": 9.36376579488357e-07, + "loss": 1.0607, + "step": 24021 + }, + { + "epoch": 0.72, + "learning_rate": 9.361862647144462e-07, + "loss": 1.138, + "step": 24022 + }, + { + "epoch": 0.72, + "learning_rate": 9.359959648272901e-07, + "loss": 1.2424, + "step": 24023 + }, + { + "epoch": 0.72, + "learning_rate": 9.358056798286982e-07, + "loss": 1.0884, + "step": 24024 + }, + { + "epoch": 0.72, + "learning_rate": 9.356154097204828e-07, + "loss": 1.1171, + "step": 24025 + }, + { + "epoch": 0.72, + "learning_rate": 9.354251545044554e-07, + "loss": 1.0686, + "step": 24026 + }, + { + "epoch": 0.72, + "learning_rate": 9.352349141824268e-07, + "loss": 1.0282, + "step": 24027 + }, + { + "epoch": 0.72, + "learning_rate": 9.350446887562093e-07, + "loss": 1.0237, + "step": 24028 + }, + { + "epoch": 0.72, + "learning_rate": 9.348544782276115e-07, + "loss": 1.1126, + "step": 24029 + }, + { + "epoch": 0.72, + "learning_rate": 9.346642825984453e-07, + "loss": 1.0557, + "step": 24030 + }, + { + "epoch": 0.72, + "learning_rate": 9.344741018705214e-07, + "loss": 1.1635, + "step": 24031 + }, + { + "epoch": 0.72, + "learning_rate": 9.34283936045651e-07, + "loss": 1.1729, + "step": 24032 + }, + { + "epoch": 0.72, + "learning_rate": 9.340937851256424e-07, + "loss": 1.1623, + "step": 24033 + }, + { + "epoch": 0.72, + "learning_rate": 9.339036491123069e-07, + "loss": 1.0178, + "step": 24034 + }, + { + "epoch": 0.72, + "learning_rate": 9.337135280074544e-07, + "loss": 1.0614, + "step": 24035 + }, + { + "epoch": 0.72, + "learning_rate": 9.335234218128946e-07, + "loss": 1.1103, + "step": 24036 + }, + { + "epoch": 0.72, + "learning_rate": 9.333333305304377e-07, + "loss": 1.158, + "step": 24037 + }, + { + "epoch": 0.72, + "learning_rate": 9.331432541618929e-07, + "loss": 1.0443, + "step": 24038 + }, + { + "epoch": 0.72, + "learning_rate": 9.329531927090696e-07, + "loss": 0.9999, + "step": 24039 + }, + { + "epoch": 0.72, + "learning_rate": 9.327631461737771e-07, + "loss": 1.022, + "step": 24040 + }, + { + "epoch": 0.72, + "learning_rate": 9.325731145578257e-07, + "loss": 1.0453, + "step": 24041 + }, + { + "epoch": 0.72, + "learning_rate": 9.323830978630221e-07, + "loss": 1.1378, + "step": 24042 + }, + { + "epoch": 0.72, + "learning_rate": 9.321930960911768e-07, + "loss": 1.0821, + "step": 24043 + }, + { + "epoch": 0.72, + "learning_rate": 9.320031092440981e-07, + "loss": 1.0894, + "step": 24044 + }, + { + "epoch": 0.72, + "learning_rate": 9.318131373235953e-07, + "loss": 1.1423, + "step": 24045 + }, + { + "epoch": 0.72, + "learning_rate": 9.316231803314755e-07, + "loss": 1.1129, + "step": 24046 + }, + { + "epoch": 0.72, + "learning_rate": 9.314332382695477e-07, + "loss": 1.0684, + "step": 24047 + }, + { + "epoch": 0.72, + "learning_rate": 9.312433111396199e-07, + "loss": 1.1064, + "step": 24048 + }, + { + "epoch": 0.72, + "learning_rate": 9.310533989435011e-07, + "loss": 1.1175, + "step": 24049 + }, + { + "epoch": 0.72, + "learning_rate": 9.308635016829975e-07, + "loss": 1.1097, + "step": 24050 + }, + { + "epoch": 0.72, + "learning_rate": 9.306736193599175e-07, + "loss": 1.0576, + "step": 24051 + }, + { + "epoch": 0.72, + "learning_rate": 9.304837519760689e-07, + "loss": 1.001, + "step": 24052 + }, + { + "epoch": 0.72, + "learning_rate": 9.302938995332591e-07, + "loss": 1.1277, + "step": 24053 + }, + { + "epoch": 0.72, + "learning_rate": 9.301040620332962e-07, + "loss": 1.0656, + "step": 24054 + }, + { + "epoch": 0.72, + "learning_rate": 9.299142394779858e-07, + "loss": 1.1548, + "step": 24055 + }, + { + "epoch": 0.72, + "learning_rate": 9.297244318691356e-07, + "loss": 1.1344, + "step": 24056 + }, + { + "epoch": 0.72, + "learning_rate": 9.295346392085528e-07, + "loss": 1.1819, + "step": 24057 + }, + { + "epoch": 0.72, + "learning_rate": 9.293448614980444e-07, + "loss": 1.108, + "step": 24058 + }, + { + "epoch": 0.72, + "learning_rate": 9.291550987394157e-07, + "loss": 1.1296, + "step": 24059 + }, + { + "epoch": 0.72, + "learning_rate": 9.289653509344738e-07, + "loss": 1.0663, + "step": 24060 + }, + { + "epoch": 0.72, + "learning_rate": 9.287756180850252e-07, + "loss": 1.0352, + "step": 24061 + }, + { + "epoch": 0.72, + "learning_rate": 9.28585900192876e-07, + "loss": 1.0631, + "step": 24062 + }, + { + "epoch": 0.72, + "learning_rate": 9.283961972598321e-07, + "loss": 1.1508, + "step": 24063 + }, + { + "epoch": 0.72, + "learning_rate": 9.282065092876996e-07, + "loss": 1.201, + "step": 24064 + }, + { + "epoch": 0.72, + "learning_rate": 9.280168362782852e-07, + "loss": 1.088, + "step": 24065 + }, + { + "epoch": 0.72, + "learning_rate": 9.278271782333923e-07, + "loss": 1.0608, + "step": 24066 + }, + { + "epoch": 0.73, + "learning_rate": 9.276375351548275e-07, + "loss": 1.0642, + "step": 24067 + }, + { + "epoch": 0.73, + "learning_rate": 9.274479070443962e-07, + "loss": 0.9308, + "step": 24068 + }, + { + "epoch": 0.73, + "learning_rate": 9.272582939039035e-07, + "loss": 1.1486, + "step": 24069 + }, + { + "epoch": 0.73, + "learning_rate": 9.270686957351541e-07, + "loss": 1.095, + "step": 24070 + }, + { + "epoch": 0.73, + "learning_rate": 9.268791125399543e-07, + "loss": 1.2545, + "step": 24071 + }, + { + "epoch": 0.73, + "learning_rate": 9.266895443201066e-07, + "loss": 1.0978, + "step": 24072 + }, + { + "epoch": 0.73, + "learning_rate": 9.264999910774169e-07, + "loss": 1.1293, + "step": 24073 + }, + { + "epoch": 0.73, + "learning_rate": 9.263104528136893e-07, + "loss": 1.1786, + "step": 24074 + }, + { + "epoch": 0.73, + "learning_rate": 9.261209295307294e-07, + "loss": 1.0774, + "step": 24075 + }, + { + "epoch": 0.73, + "learning_rate": 9.259314212303391e-07, + "loss": 1.1318, + "step": 24076 + }, + { + "epoch": 0.73, + "learning_rate": 9.257419279143237e-07, + "loss": 1.053, + "step": 24077 + }, + { + "epoch": 0.73, + "learning_rate": 9.25552449584487e-07, + "loss": 1.0355, + "step": 24078 + }, + { + "epoch": 0.73, + "learning_rate": 9.253629862426327e-07, + "loss": 1.1369, + "step": 24079 + }, + { + "epoch": 0.73, + "learning_rate": 9.251735378905652e-07, + "loss": 1.1718, + "step": 24080 + }, + { + "epoch": 0.73, + "learning_rate": 9.249841045300864e-07, + "loss": 1.1504, + "step": 24081 + }, + { + "epoch": 0.73, + "learning_rate": 9.247946861630003e-07, + "loss": 1.1039, + "step": 24082 + }, + { + "epoch": 0.73, + "learning_rate": 9.2460528279111e-07, + "loss": 1.0939, + "step": 24083 + }, + { + "epoch": 0.73, + "learning_rate": 9.244158944162199e-07, + "loss": 1.1327, + "step": 24084 + }, + { + "epoch": 0.73, + "learning_rate": 9.242265210401305e-07, + "loss": 1.099, + "step": 24085 + }, + { + "epoch": 0.73, + "learning_rate": 9.240371626646458e-07, + "loss": 1.2062, + "step": 24086 + }, + { + "epoch": 0.73, + "learning_rate": 9.238478192915681e-07, + "loss": 1.0546, + "step": 24087 + }, + { + "epoch": 0.73, + "learning_rate": 9.236584909227012e-07, + "loss": 1.2056, + "step": 24088 + }, + { + "epoch": 0.73, + "learning_rate": 9.234691775598453e-07, + "loss": 1.0274, + "step": 24089 + }, + { + "epoch": 0.73, + "learning_rate": 9.232798792048034e-07, + "loss": 1.1859, + "step": 24090 + }, + { + "epoch": 0.73, + "learning_rate": 9.23090595859378e-07, + "loss": 1.1199, + "step": 24091 + }, + { + "epoch": 0.73, + "learning_rate": 9.229013275253704e-07, + "loss": 1.1724, + "step": 24092 + }, + { + "epoch": 0.73, + "learning_rate": 9.227120742045828e-07, + "loss": 1.0851, + "step": 24093 + }, + { + "epoch": 0.73, + "learning_rate": 9.225228358988164e-07, + "loss": 1.1035, + "step": 24094 + }, + { + "epoch": 0.73, + "learning_rate": 9.223336126098728e-07, + "loss": 0.967, + "step": 24095 + }, + { + "epoch": 0.73, + "learning_rate": 9.221444043395536e-07, + "loss": 1.0883, + "step": 24096 + }, + { + "epoch": 0.73, + "learning_rate": 9.219552110896606e-07, + "loss": 1.2108, + "step": 24097 + }, + { + "epoch": 0.73, + "learning_rate": 9.217660328619932e-07, + "loss": 1.1948, + "step": 24098 + }, + { + "epoch": 0.73, + "learning_rate": 9.215768696583527e-07, + "loss": 1.0504, + "step": 24099 + }, + { + "epoch": 0.73, + "learning_rate": 9.213877214805405e-07, + "loss": 1.1074, + "step": 24100 + }, + { + "epoch": 0.73, + "learning_rate": 9.211985883303578e-07, + "loss": 1.0661, + "step": 24101 + }, + { + "epoch": 0.73, + "learning_rate": 9.210094702096032e-07, + "loss": 1.0607, + "step": 24102 + }, + { + "epoch": 0.73, + "learning_rate": 9.20820367120078e-07, + "loss": 1.0638, + "step": 24103 + }, + { + "epoch": 0.73, + "learning_rate": 9.206312790635821e-07, + "loss": 1.0786, + "step": 24104 + }, + { + "epoch": 0.73, + "learning_rate": 9.204422060419168e-07, + "loss": 1.1373, + "step": 24105 + }, + { + "epoch": 0.73, + "learning_rate": 9.202531480568803e-07, + "loss": 1.2493, + "step": 24106 + }, + { + "epoch": 0.73, + "learning_rate": 9.200641051102729e-07, + "loss": 1.01, + "step": 24107 + }, + { + "epoch": 0.73, + "learning_rate": 9.198750772038942e-07, + "loss": 1.0703, + "step": 24108 + }, + { + "epoch": 0.73, + "learning_rate": 9.196860643395439e-07, + "loss": 0.9136, + "step": 24109 + }, + { + "epoch": 0.73, + "learning_rate": 9.19497066519022e-07, + "loss": 1.1085, + "step": 24110 + }, + { + "epoch": 0.73, + "learning_rate": 9.193080837441257e-07, + "loss": 1.1405, + "step": 24111 + }, + { + "epoch": 0.73, + "learning_rate": 9.191191160166554e-07, + "loss": 1.1989, + "step": 24112 + }, + { + "epoch": 0.73, + "learning_rate": 9.189301633384096e-07, + "loss": 1.1187, + "step": 24113 + }, + { + "epoch": 0.73, + "learning_rate": 9.187412257111883e-07, + "loss": 1.0716, + "step": 24114 + }, + { + "epoch": 0.73, + "learning_rate": 9.18552303136788e-07, + "loss": 1.1333, + "step": 24115 + }, + { + "epoch": 0.73, + "learning_rate": 9.18363395617008e-07, + "loss": 1.0342, + "step": 24116 + }, + { + "epoch": 0.73, + "learning_rate": 9.181745031536466e-07, + "loss": 1.0963, + "step": 24117 + }, + { + "epoch": 0.73, + "learning_rate": 9.179856257485024e-07, + "loss": 1.1434, + "step": 24118 + }, + { + "epoch": 0.73, + "learning_rate": 9.17796763403373e-07, + "loss": 1.0125, + "step": 24119 + }, + { + "epoch": 0.73, + "learning_rate": 9.176079161200563e-07, + "loss": 1.2035, + "step": 24120 + }, + { + "epoch": 0.73, + "learning_rate": 9.174190839003503e-07, + "loss": 1.161, + "step": 24121 + }, + { + "epoch": 0.73, + "learning_rate": 9.172302667460523e-07, + "loss": 1.1268, + "step": 24122 + }, + { + "epoch": 0.73, + "learning_rate": 9.170414646589606e-07, + "loss": 1.1428, + "step": 24123 + }, + { + "epoch": 0.73, + "learning_rate": 9.168526776408712e-07, + "loss": 1.1061, + "step": 24124 + }, + { + "epoch": 0.73, + "learning_rate": 9.166639056935819e-07, + "loss": 1.0115, + "step": 24125 + }, + { + "epoch": 0.73, + "learning_rate": 9.164751488188894e-07, + "loss": 1.0906, + "step": 24126 + }, + { + "epoch": 0.73, + "learning_rate": 9.162864070185917e-07, + "loss": 1.0989, + "step": 24127 + }, + { + "epoch": 0.73, + "learning_rate": 9.160976802944841e-07, + "loss": 1.0367, + "step": 24128 + }, + { + "epoch": 0.73, + "learning_rate": 9.159089686483635e-07, + "loss": 1.0957, + "step": 24129 + }, + { + "epoch": 0.73, + "learning_rate": 9.157202720820266e-07, + "loss": 1.1472, + "step": 24130 + }, + { + "epoch": 0.73, + "learning_rate": 9.155315905972706e-07, + "loss": 1.0864, + "step": 24131 + }, + { + "epoch": 0.73, + "learning_rate": 9.1534292419589e-07, + "loss": 1.1685, + "step": 24132 + }, + { + "epoch": 0.73, + "learning_rate": 9.151542728796814e-07, + "loss": 1.1127, + "step": 24133 + }, + { + "epoch": 0.73, + "learning_rate": 9.149656366504408e-07, + "loss": 0.9428, + "step": 24134 + }, + { + "epoch": 0.73, + "learning_rate": 9.147770155099639e-07, + "loss": 1.082, + "step": 24135 + }, + { + "epoch": 0.73, + "learning_rate": 9.145884094600474e-07, + "loss": 1.1337, + "step": 24136 + }, + { + "epoch": 0.73, + "learning_rate": 9.143998185024849e-07, + "loss": 1.0848, + "step": 24137 + }, + { + "epoch": 0.73, + "learning_rate": 9.142112426390723e-07, + "loss": 1.1032, + "step": 24138 + }, + { + "epoch": 0.73, + "learning_rate": 9.14022681871605e-07, + "loss": 1.1108, + "step": 24139 + }, + { + "epoch": 0.73, + "learning_rate": 9.138341362018788e-07, + "loss": 1.1367, + "step": 24140 + }, + { + "epoch": 0.73, + "learning_rate": 9.136456056316866e-07, + "loss": 1.1199, + "step": 24141 + }, + { + "epoch": 0.73, + "learning_rate": 9.134570901628245e-07, + "loss": 1.0234, + "step": 24142 + }, + { + "epoch": 0.73, + "learning_rate": 9.132685897970867e-07, + "loss": 1.1313, + "step": 24143 + }, + { + "epoch": 0.73, + "learning_rate": 9.130801045362678e-07, + "loss": 1.0309, + "step": 24144 + }, + { + "epoch": 0.73, + "learning_rate": 9.12891634382162e-07, + "loss": 1.1317, + "step": 24145 + }, + { + "epoch": 0.73, + "learning_rate": 9.127031793365634e-07, + "loss": 1.1693, + "step": 24146 + }, + { + "epoch": 0.73, + "learning_rate": 9.125147394012671e-07, + "loss": 1.0927, + "step": 24147 + }, + { + "epoch": 0.73, + "learning_rate": 9.123263145780647e-07, + "loss": 1.0436, + "step": 24148 + }, + { + "epoch": 0.73, + "learning_rate": 9.121379048687515e-07, + "loss": 1.2793, + "step": 24149 + }, + { + "epoch": 0.73, + "learning_rate": 9.119495102751206e-07, + "loss": 1.2409, + "step": 24150 + }, + { + "epoch": 0.73, + "learning_rate": 9.117611307989654e-07, + "loss": 1.0852, + "step": 24151 + }, + { + "epoch": 0.73, + "learning_rate": 9.115727664420793e-07, + "loss": 1.1877, + "step": 24152 + }, + { + "epoch": 0.73, + "learning_rate": 9.113844172062566e-07, + "loss": 1.0869, + "step": 24153 + }, + { + "epoch": 0.73, + "learning_rate": 9.111960830932881e-07, + "loss": 1.053, + "step": 24154 + }, + { + "epoch": 0.73, + "learning_rate": 9.110077641049675e-07, + "loss": 1.0769, + "step": 24155 + }, + { + "epoch": 0.73, + "learning_rate": 9.108194602430881e-07, + "loss": 1.1242, + "step": 24156 + }, + { + "epoch": 0.73, + "learning_rate": 9.106311715094427e-07, + "loss": 1.1646, + "step": 24157 + }, + { + "epoch": 0.73, + "learning_rate": 9.104428979058222e-07, + "loss": 1.0717, + "step": 24158 + }, + { + "epoch": 0.73, + "learning_rate": 9.102546394340198e-07, + "loss": 1.1141, + "step": 24159 + }, + { + "epoch": 0.73, + "learning_rate": 9.100663960958275e-07, + "loss": 1.0134, + "step": 24160 + }, + { + "epoch": 0.73, + "learning_rate": 9.098781678930374e-07, + "loss": 1.1727, + "step": 24161 + }, + { + "epoch": 0.73, + "learning_rate": 9.096899548274424e-07, + "loss": 1.1561, + "step": 24162 + }, + { + "epoch": 0.73, + "learning_rate": 9.095017569008319e-07, + "loss": 1.0278, + "step": 24163 + }, + { + "epoch": 0.73, + "learning_rate": 9.093135741149988e-07, + "loss": 1.0965, + "step": 24164 + }, + { + "epoch": 0.73, + "learning_rate": 9.091254064717345e-07, + "loss": 1.1305, + "step": 24165 + }, + { + "epoch": 0.73, + "learning_rate": 9.089372539728308e-07, + "loss": 1.1649, + "step": 24166 + }, + { + "epoch": 0.73, + "learning_rate": 9.087491166200774e-07, + "loss": 1.0907, + "step": 24167 + }, + { + "epoch": 0.73, + "learning_rate": 9.085609944152662e-07, + "loss": 1.2262, + "step": 24168 + }, + { + "epoch": 0.73, + "learning_rate": 9.083728873601877e-07, + "loss": 1.096, + "step": 24169 + }, + { + "epoch": 0.73, + "learning_rate": 9.081847954566336e-07, + "loss": 1.0225, + "step": 24170 + }, + { + "epoch": 0.73, + "learning_rate": 9.079967187063929e-07, + "loss": 1.1055, + "step": 24171 + }, + { + "epoch": 0.73, + "learning_rate": 9.078086571112566e-07, + "loss": 0.9995, + "step": 24172 + }, + { + "epoch": 0.73, + "learning_rate": 9.076206106730148e-07, + "loss": 1.0865, + "step": 24173 + }, + { + "epoch": 0.73, + "learning_rate": 9.074325793934582e-07, + "loss": 1.0618, + "step": 24174 + }, + { + "epoch": 0.73, + "learning_rate": 9.072445632743763e-07, + "loss": 1.0905, + "step": 24175 + }, + { + "epoch": 0.73, + "learning_rate": 9.070565623175593e-07, + "loss": 1.0667, + "step": 24176 + }, + { + "epoch": 0.73, + "learning_rate": 9.068685765247962e-07, + "loss": 1.1091, + "step": 24177 + }, + { + "epoch": 0.73, + "learning_rate": 9.066806058978773e-07, + "loss": 1.0767, + "step": 24178 + }, + { + "epoch": 0.73, + "learning_rate": 9.064926504385923e-07, + "loss": 1.1825, + "step": 24179 + }, + { + "epoch": 0.73, + "learning_rate": 9.063047101487293e-07, + "loss": 1.1497, + "step": 24180 + }, + { + "epoch": 0.73, + "learning_rate": 9.061167850300775e-07, + "loss": 1.1179, + "step": 24181 + }, + { + "epoch": 0.73, + "learning_rate": 9.059288750844266e-07, + "loss": 1.1013, + "step": 24182 + }, + { + "epoch": 0.73, + "learning_rate": 9.057409803135658e-07, + "loss": 1.0962, + "step": 24183 + }, + { + "epoch": 0.73, + "learning_rate": 9.055531007192822e-07, + "loss": 1.1105, + "step": 24184 + }, + { + "epoch": 0.73, + "learning_rate": 9.053652363033652e-07, + "loss": 1.0858, + "step": 24185 + }, + { + "epoch": 0.73, + "learning_rate": 9.051773870676031e-07, + "loss": 1.0844, + "step": 24186 + }, + { + "epoch": 0.73, + "learning_rate": 9.049895530137842e-07, + "loss": 1.0546, + "step": 24187 + }, + { + "epoch": 0.73, + "learning_rate": 9.048017341436974e-07, + "loss": 1.2038, + "step": 24188 + }, + { + "epoch": 0.73, + "learning_rate": 9.046139304591289e-07, + "loss": 1.2371, + "step": 24189 + }, + { + "epoch": 0.73, + "learning_rate": 9.044261419618675e-07, + "loss": 1.062, + "step": 24190 + }, + { + "epoch": 0.73, + "learning_rate": 9.042383686537007e-07, + "loss": 1.1705, + "step": 24191 + }, + { + "epoch": 0.73, + "learning_rate": 9.040506105364172e-07, + "loss": 1.0554, + "step": 24192 + }, + { + "epoch": 0.73, + "learning_rate": 9.038628676118022e-07, + "loss": 1.0785, + "step": 24193 + }, + { + "epoch": 0.73, + "learning_rate": 9.036751398816437e-07, + "loss": 1.2123, + "step": 24194 + }, + { + "epoch": 0.73, + "learning_rate": 9.034874273477295e-07, + "loss": 1.0743, + "step": 24195 + }, + { + "epoch": 0.73, + "learning_rate": 9.032997300118468e-07, + "loss": 1.0964, + "step": 24196 + }, + { + "epoch": 0.73, + "learning_rate": 9.031120478757807e-07, + "loss": 1.0764, + "step": 24197 + }, + { + "epoch": 0.73, + "learning_rate": 9.02924380941319e-07, + "loss": 1.0477, + "step": 24198 + }, + { + "epoch": 0.73, + "learning_rate": 9.027367292102479e-07, + "loss": 1.0622, + "step": 24199 + }, + { + "epoch": 0.73, + "learning_rate": 9.025490926843538e-07, + "loss": 0.9748, + "step": 24200 + }, + { + "epoch": 0.73, + "learning_rate": 9.023614713654233e-07, + "loss": 1.2002, + "step": 24201 + }, + { + "epoch": 0.73, + "learning_rate": 9.021738652552417e-07, + "loss": 1.099, + "step": 24202 + }, + { + "epoch": 0.73, + "learning_rate": 9.019862743555957e-07, + "loss": 1.1049, + "step": 24203 + }, + { + "epoch": 0.73, + "learning_rate": 9.017986986682706e-07, + "loss": 1.0891, + "step": 24204 + }, + { + "epoch": 0.73, + "learning_rate": 9.016111381950529e-07, + "loss": 1.1582, + "step": 24205 + }, + { + "epoch": 0.73, + "learning_rate": 9.014235929377269e-07, + "loss": 1.1025, + "step": 24206 + }, + { + "epoch": 0.73, + "learning_rate": 9.012360628980779e-07, + "loss": 1.0557, + "step": 24207 + }, + { + "epoch": 0.73, + "learning_rate": 9.010485480778918e-07, + "loss": 1.0858, + "step": 24208 + }, + { + "epoch": 0.73, + "learning_rate": 9.008610484789543e-07, + "loss": 1.065, + "step": 24209 + }, + { + "epoch": 0.73, + "learning_rate": 9.006735641030487e-07, + "loss": 1.1786, + "step": 24210 + }, + { + "epoch": 0.73, + "learning_rate": 9.004860949519603e-07, + "loss": 1.1051, + "step": 24211 + }, + { + "epoch": 0.73, + "learning_rate": 9.002986410274742e-07, + "loss": 1.1718, + "step": 24212 + }, + { + "epoch": 0.73, + "learning_rate": 9.001112023313744e-07, + "loss": 1.0873, + "step": 24213 + }, + { + "epoch": 0.73, + "learning_rate": 8.999237788654463e-07, + "loss": 1.1251, + "step": 24214 + }, + { + "epoch": 0.73, + "learning_rate": 8.997363706314724e-07, + "loss": 1.0484, + "step": 24215 + }, + { + "epoch": 0.73, + "learning_rate": 8.995489776312375e-07, + "loss": 1.1236, + "step": 24216 + }, + { + "epoch": 0.73, + "learning_rate": 8.993615998665256e-07, + "loss": 1.1005, + "step": 24217 + }, + { + "epoch": 0.73, + "learning_rate": 8.99174237339121e-07, + "loss": 1.1886, + "step": 24218 + }, + { + "epoch": 0.73, + "learning_rate": 8.989868900508062e-07, + "loss": 1.201, + "step": 24219 + }, + { + "epoch": 0.73, + "learning_rate": 8.987995580033648e-07, + "loss": 1.0217, + "step": 24220 + }, + { + "epoch": 0.73, + "learning_rate": 8.986122411985804e-07, + "loss": 1.0572, + "step": 24221 + }, + { + "epoch": 0.73, + "learning_rate": 8.984249396382372e-07, + "loss": 1.0716, + "step": 24222 + }, + { + "epoch": 0.73, + "learning_rate": 8.982376533241166e-07, + "loss": 1.0702, + "step": 24223 + }, + { + "epoch": 0.73, + "learning_rate": 8.980503822580017e-07, + "loss": 1.108, + "step": 24224 + }, + { + "epoch": 0.73, + "learning_rate": 8.97863126441676e-07, + "loss": 1.114, + "step": 24225 + }, + { + "epoch": 0.73, + "learning_rate": 8.976758858769216e-07, + "loss": 1.1284, + "step": 24226 + }, + { + "epoch": 0.73, + "learning_rate": 8.974886605655208e-07, + "loss": 1.1818, + "step": 24227 + }, + { + "epoch": 0.73, + "learning_rate": 8.973014505092565e-07, + "loss": 1.1068, + "step": 24228 + }, + { + "epoch": 0.73, + "learning_rate": 8.971142557099113e-07, + "loss": 1.0449, + "step": 24229 + }, + { + "epoch": 0.73, + "learning_rate": 8.969270761692652e-07, + "loss": 1.0851, + "step": 24230 + }, + { + "epoch": 0.73, + "learning_rate": 8.967399118891019e-07, + "loss": 1.11, + "step": 24231 + }, + { + "epoch": 0.73, + "learning_rate": 8.965527628712021e-07, + "loss": 1.1637, + "step": 24232 + }, + { + "epoch": 0.73, + "learning_rate": 8.963656291173476e-07, + "loss": 1.0936, + "step": 24233 + }, + { + "epoch": 0.73, + "learning_rate": 8.961785106293202e-07, + "loss": 0.9727, + "step": 24234 + }, + { + "epoch": 0.73, + "learning_rate": 8.959914074089018e-07, + "loss": 1.0091, + "step": 24235 + }, + { + "epoch": 0.73, + "learning_rate": 8.958043194578717e-07, + "loss": 1.2193, + "step": 24236 + }, + { + "epoch": 0.73, + "learning_rate": 8.95617246778012e-07, + "loss": 1.1716, + "step": 24237 + }, + { + "epoch": 0.73, + "learning_rate": 8.954301893711034e-07, + "loss": 1.0492, + "step": 24238 + }, + { + "epoch": 0.73, + "learning_rate": 8.952431472389267e-07, + "loss": 1.1596, + "step": 24239 + }, + { + "epoch": 0.73, + "learning_rate": 8.95056120383263e-07, + "loss": 1.0631, + "step": 24240 + }, + { + "epoch": 0.73, + "learning_rate": 8.948691088058914e-07, + "loss": 1.0579, + "step": 24241 + }, + { + "epoch": 0.73, + "learning_rate": 8.946821125085928e-07, + "loss": 1.1064, + "step": 24242 + }, + { + "epoch": 0.73, + "learning_rate": 8.944951314931471e-07, + "loss": 1.1792, + "step": 24243 + }, + { + "epoch": 0.73, + "learning_rate": 8.943081657613356e-07, + "loss": 1.1606, + "step": 24244 + }, + { + "epoch": 0.73, + "learning_rate": 8.941212153149362e-07, + "loss": 1.1124, + "step": 24245 + }, + { + "epoch": 0.73, + "learning_rate": 8.939342801557293e-07, + "loss": 1.0919, + "step": 24246 + }, + { + "epoch": 0.73, + "learning_rate": 8.937473602854945e-07, + "loss": 1.0607, + "step": 24247 + }, + { + "epoch": 0.73, + "learning_rate": 8.935604557060124e-07, + "loss": 1.0491, + "step": 24248 + }, + { + "epoch": 0.73, + "learning_rate": 8.933735664190598e-07, + "loss": 1.147, + "step": 24249 + }, + { + "epoch": 0.73, + "learning_rate": 8.931866924264173e-07, + "loss": 1.065, + "step": 24250 + }, + { + "epoch": 0.73, + "learning_rate": 8.929998337298637e-07, + "loss": 1.0923, + "step": 24251 + }, + { + "epoch": 0.73, + "learning_rate": 8.928129903311774e-07, + "loss": 1.1547, + "step": 24252 + }, + { + "epoch": 0.73, + "learning_rate": 8.926261622321386e-07, + "loss": 1.101, + "step": 24253 + }, + { + "epoch": 0.73, + "learning_rate": 8.924393494345235e-07, + "loss": 1.1398, + "step": 24254 + }, + { + "epoch": 0.73, + "learning_rate": 8.922525519401118e-07, + "loss": 1.0781, + "step": 24255 + }, + { + "epoch": 0.73, + "learning_rate": 8.920657697506813e-07, + "loss": 1.1476, + "step": 24256 + }, + { + "epoch": 0.73, + "learning_rate": 8.918790028680102e-07, + "loss": 1.1379, + "step": 24257 + }, + { + "epoch": 0.73, + "learning_rate": 8.916922512938766e-07, + "loss": 1.0685, + "step": 24258 + }, + { + "epoch": 0.73, + "learning_rate": 8.915055150300583e-07, + "loss": 0.9938, + "step": 24259 + }, + { + "epoch": 0.73, + "learning_rate": 8.913187940783327e-07, + "loss": 1.0715, + "step": 24260 + }, + { + "epoch": 0.73, + "learning_rate": 8.911320884404781e-07, + "loss": 1.2554, + "step": 24261 + }, + { + "epoch": 0.73, + "learning_rate": 8.909453981182705e-07, + "loss": 1.2302, + "step": 24262 + }, + { + "epoch": 0.73, + "learning_rate": 8.907587231134879e-07, + "loss": 1.1116, + "step": 24263 + }, + { + "epoch": 0.73, + "learning_rate": 8.905720634279069e-07, + "loss": 1.2148, + "step": 24264 + }, + { + "epoch": 0.73, + "learning_rate": 8.903854190633049e-07, + "loss": 1.0059, + "step": 24265 + }, + { + "epoch": 0.73, + "learning_rate": 8.901987900214595e-07, + "loss": 1.1149, + "step": 24266 + }, + { + "epoch": 0.73, + "learning_rate": 8.900121763041453e-07, + "loss": 1.0782, + "step": 24267 + }, + { + "epoch": 0.73, + "learning_rate": 8.898255779131398e-07, + "loss": 1.1371, + "step": 24268 + }, + { + "epoch": 0.73, + "learning_rate": 8.896389948502193e-07, + "loss": 1.0112, + "step": 24269 + }, + { + "epoch": 0.73, + "learning_rate": 8.894524271171607e-07, + "loss": 1.0659, + "step": 24270 + }, + { + "epoch": 0.73, + "learning_rate": 8.892658747157387e-07, + "loss": 1.0526, + "step": 24271 + }, + { + "epoch": 0.73, + "learning_rate": 8.890793376477297e-07, + "loss": 1.0671, + "step": 24272 + }, + { + "epoch": 0.73, + "learning_rate": 8.888928159149096e-07, + "loss": 1.1208, + "step": 24273 + }, + { + "epoch": 0.73, + "learning_rate": 8.887063095190549e-07, + "loss": 1.1466, + "step": 24274 + }, + { + "epoch": 0.73, + "learning_rate": 8.88519818461939e-07, + "loss": 1.2357, + "step": 24275 + }, + { + "epoch": 0.73, + "learning_rate": 8.883333427453387e-07, + "loss": 1.1279, + "step": 24276 + }, + { + "epoch": 0.73, + "learning_rate": 8.881468823710282e-07, + "loss": 1.1008, + "step": 24277 + }, + { + "epoch": 0.73, + "learning_rate": 8.879604373407844e-07, + "loss": 1.0886, + "step": 24278 + }, + { + "epoch": 0.73, + "learning_rate": 8.877740076563799e-07, + "loss": 1.0764, + "step": 24279 + }, + { + "epoch": 0.73, + "learning_rate": 8.875875933195905e-07, + "loss": 1.1132, + "step": 24280 + }, + { + "epoch": 0.73, + "learning_rate": 8.874011943321903e-07, + "loss": 1.2052, + "step": 24281 + }, + { + "epoch": 0.73, + "learning_rate": 8.872148106959543e-07, + "loss": 1.1575, + "step": 24282 + }, + { + "epoch": 0.73, + "learning_rate": 8.870284424126565e-07, + "loss": 1.2061, + "step": 24283 + }, + { + "epoch": 0.73, + "learning_rate": 8.868420894840712e-07, + "loss": 0.9135, + "step": 24284 + }, + { + "epoch": 0.73, + "learning_rate": 8.86655751911972e-07, + "loss": 1.2341, + "step": 24285 + }, + { + "epoch": 0.73, + "learning_rate": 8.864694296981333e-07, + "loss": 1.1547, + "step": 24286 + }, + { + "epoch": 0.73, + "learning_rate": 8.862831228443294e-07, + "loss": 1.1824, + "step": 24287 + }, + { + "epoch": 0.73, + "learning_rate": 8.860968313523318e-07, + "loss": 1.0437, + "step": 24288 + }, + { + "epoch": 0.73, + "learning_rate": 8.859105552239155e-07, + "loss": 1.1811, + "step": 24289 + }, + { + "epoch": 0.73, + "learning_rate": 8.857242944608532e-07, + "loss": 1.0682, + "step": 24290 + }, + { + "epoch": 0.73, + "learning_rate": 8.85538049064919e-07, + "loss": 1.0651, + "step": 24291 + }, + { + "epoch": 0.73, + "learning_rate": 8.85351819037884e-07, + "loss": 1.1109, + "step": 24292 + }, + { + "epoch": 0.73, + "learning_rate": 8.851656043815223e-07, + "loss": 1.1341, + "step": 24293 + }, + { + "epoch": 0.73, + "learning_rate": 8.849794050976063e-07, + "loss": 1.0027, + "step": 24294 + }, + { + "epoch": 0.73, + "learning_rate": 8.847932211879082e-07, + "loss": 1.0763, + "step": 24295 + }, + { + "epoch": 0.73, + "learning_rate": 8.846070526542019e-07, + "loss": 1.2005, + "step": 24296 + }, + { + "epoch": 0.73, + "learning_rate": 8.844208994982576e-07, + "loss": 1.0746, + "step": 24297 + }, + { + "epoch": 0.73, + "learning_rate": 8.84234761721848e-07, + "loss": 1.1322, + "step": 24298 + }, + { + "epoch": 0.73, + "learning_rate": 8.840486393267456e-07, + "loss": 1.162, + "step": 24299 + }, + { + "epoch": 0.73, + "learning_rate": 8.838625323147227e-07, + "loss": 1.0858, + "step": 24300 + }, + { + "epoch": 0.73, + "learning_rate": 8.836764406875489e-07, + "loss": 1.0543, + "step": 24301 + }, + { + "epoch": 0.73, + "learning_rate": 8.834903644469975e-07, + "loss": 1.157, + "step": 24302 + }, + { + "epoch": 0.73, + "learning_rate": 8.833043035948389e-07, + "loss": 1.0749, + "step": 24303 + }, + { + "epoch": 0.73, + "learning_rate": 8.831182581328457e-07, + "loss": 1.0531, + "step": 24304 + }, + { + "epoch": 0.73, + "learning_rate": 8.829322280627869e-07, + "loss": 1.1376, + "step": 24305 + }, + { + "epoch": 0.73, + "learning_rate": 8.827462133864348e-07, + "loss": 1.1149, + "step": 24306 + }, + { + "epoch": 0.73, + "learning_rate": 8.825602141055598e-07, + "loss": 1.0386, + "step": 24307 + }, + { + "epoch": 0.73, + "learning_rate": 8.823742302219324e-07, + "loss": 1.1756, + "step": 24308 + }, + { + "epoch": 0.73, + "learning_rate": 8.821882617373234e-07, + "loss": 1.0903, + "step": 24309 + }, + { + "epoch": 0.73, + "learning_rate": 8.820023086535029e-07, + "loss": 1.1122, + "step": 24310 + }, + { + "epoch": 0.73, + "learning_rate": 8.81816370972241e-07, + "loss": 1.0981, + "step": 24311 + }, + { + "epoch": 0.73, + "learning_rate": 8.81630448695309e-07, + "loss": 1.2214, + "step": 24312 + }, + { + "epoch": 0.73, + "learning_rate": 8.814445418244749e-07, + "loss": 1.1441, + "step": 24313 + }, + { + "epoch": 0.73, + "learning_rate": 8.81258650361509e-07, + "loss": 1.153, + "step": 24314 + }, + { + "epoch": 0.73, + "learning_rate": 8.810727743081812e-07, + "loss": 1.1992, + "step": 24315 + }, + { + "epoch": 0.73, + "learning_rate": 8.808869136662609e-07, + "loss": 1.0023, + "step": 24316 + }, + { + "epoch": 0.73, + "learning_rate": 8.807010684375183e-07, + "loss": 1.1584, + "step": 24317 + }, + { + "epoch": 0.73, + "learning_rate": 8.80515238623721e-07, + "loss": 1.1841, + "step": 24318 + }, + { + "epoch": 0.73, + "learning_rate": 8.803294242266384e-07, + "loss": 1.1458, + "step": 24319 + }, + { + "epoch": 0.73, + "learning_rate": 8.801436252480397e-07, + "loss": 1.0901, + "step": 24320 + }, + { + "epoch": 0.73, + "learning_rate": 8.799578416896934e-07, + "loss": 1.133, + "step": 24321 + }, + { + "epoch": 0.73, + "learning_rate": 8.797720735533691e-07, + "loss": 1.0174, + "step": 24322 + }, + { + "epoch": 0.73, + "learning_rate": 8.795863208408337e-07, + "loss": 1.182, + "step": 24323 + }, + { + "epoch": 0.73, + "learning_rate": 8.794005835538558e-07, + "loss": 1.2932, + "step": 24324 + }, + { + "epoch": 0.73, + "learning_rate": 8.792148616942043e-07, + "loss": 1.0171, + "step": 24325 + }, + { + "epoch": 0.73, + "learning_rate": 8.790291552636471e-07, + "loss": 1.0931, + "step": 24326 + }, + { + "epoch": 0.73, + "learning_rate": 8.78843464263951e-07, + "loss": 1.0846, + "step": 24327 + }, + { + "epoch": 0.73, + "learning_rate": 8.786577886968842e-07, + "loss": 0.9265, + "step": 24328 + }, + { + "epoch": 0.73, + "learning_rate": 8.784721285642145e-07, + "loss": 1.0624, + "step": 24329 + }, + { + "epoch": 0.73, + "learning_rate": 8.782864838677099e-07, + "loss": 1.0966, + "step": 24330 + }, + { + "epoch": 0.73, + "learning_rate": 8.781008546091363e-07, + "loss": 1.0193, + "step": 24331 + }, + { + "epoch": 0.73, + "learning_rate": 8.779152407902613e-07, + "loss": 0.9966, + "step": 24332 + }, + { + "epoch": 0.73, + "learning_rate": 8.77729642412852e-07, + "loss": 1.0969, + "step": 24333 + }, + { + "epoch": 0.73, + "learning_rate": 8.775440594786752e-07, + "loss": 1.0883, + "step": 24334 + }, + { + "epoch": 0.73, + "learning_rate": 8.773584919894984e-07, + "loss": 1.1412, + "step": 24335 + }, + { + "epoch": 0.73, + "learning_rate": 8.771729399470866e-07, + "loss": 1.1696, + "step": 24336 + }, + { + "epoch": 0.73, + "learning_rate": 8.769874033532067e-07, + "loss": 1.1617, + "step": 24337 + }, + { + "epoch": 0.73, + "learning_rate": 8.768018822096249e-07, + "loss": 1.1781, + "step": 24338 + }, + { + "epoch": 0.73, + "learning_rate": 8.766163765181076e-07, + "loss": 1.1476, + "step": 24339 + }, + { + "epoch": 0.73, + "learning_rate": 8.764308862804205e-07, + "loss": 0.9913, + "step": 24340 + }, + { + "epoch": 0.73, + "learning_rate": 8.762454114983293e-07, + "loss": 1.1365, + "step": 24341 + }, + { + "epoch": 0.73, + "learning_rate": 8.760599521735999e-07, + "loss": 1.0755, + "step": 24342 + }, + { + "epoch": 0.73, + "learning_rate": 8.758745083079983e-07, + "loss": 1.2251, + "step": 24343 + }, + { + "epoch": 0.73, + "learning_rate": 8.756890799032886e-07, + "loss": 1.0222, + "step": 24344 + }, + { + "epoch": 0.73, + "learning_rate": 8.755036669612366e-07, + "loss": 1.0692, + "step": 24345 + }, + { + "epoch": 0.73, + "learning_rate": 8.753182694836071e-07, + "loss": 1.0557, + "step": 24346 + }, + { + "epoch": 0.73, + "learning_rate": 8.751328874721651e-07, + "loss": 1.0607, + "step": 24347 + }, + { + "epoch": 0.73, + "learning_rate": 8.749475209286764e-07, + "loss": 1.135, + "step": 24348 + }, + { + "epoch": 0.73, + "learning_rate": 8.747621698549039e-07, + "loss": 1.2321, + "step": 24349 + }, + { + "epoch": 0.73, + "learning_rate": 8.745768342526128e-07, + "loss": 1.0753, + "step": 24350 + }, + { + "epoch": 0.73, + "learning_rate": 8.743915141235674e-07, + "loss": 1.1709, + "step": 24351 + }, + { + "epoch": 0.73, + "learning_rate": 8.742062094695325e-07, + "loss": 1.0991, + "step": 24352 + }, + { + "epoch": 0.73, + "learning_rate": 8.740209202922708e-07, + "loss": 1.1564, + "step": 24353 + }, + { + "epoch": 0.73, + "learning_rate": 8.738356465935468e-07, + "loss": 1.1193, + "step": 24354 + }, + { + "epoch": 0.73, + "learning_rate": 8.736503883751243e-07, + "loss": 1.2103, + "step": 24355 + }, + { + "epoch": 0.73, + "learning_rate": 8.734651456387677e-07, + "loss": 1.1924, + "step": 24356 + }, + { + "epoch": 0.73, + "learning_rate": 8.732799183862386e-07, + "loss": 1.0718, + "step": 24357 + }, + { + "epoch": 0.73, + "learning_rate": 8.730947066193016e-07, + "loss": 1.0328, + "step": 24358 + }, + { + "epoch": 0.73, + "learning_rate": 8.729095103397189e-07, + "loss": 1.0341, + "step": 24359 + }, + { + "epoch": 0.73, + "learning_rate": 8.727243295492544e-07, + "loss": 0.9731, + "step": 24360 + }, + { + "epoch": 0.73, + "learning_rate": 8.725391642496711e-07, + "loss": 1.1266, + "step": 24361 + }, + { + "epoch": 0.73, + "learning_rate": 8.723540144427306e-07, + "loss": 1.0634, + "step": 24362 + }, + { + "epoch": 0.73, + "learning_rate": 8.721688801301958e-07, + "loss": 1.1324, + "step": 24363 + }, + { + "epoch": 0.73, + "learning_rate": 8.719837613138293e-07, + "loss": 1.1564, + "step": 24364 + }, + { + "epoch": 0.73, + "learning_rate": 8.717986579953936e-07, + "loss": 1.1588, + "step": 24365 + }, + { + "epoch": 0.73, + "learning_rate": 8.716135701766501e-07, + "loss": 0.9973, + "step": 24366 + }, + { + "epoch": 0.73, + "learning_rate": 8.714284978593613e-07, + "loss": 1.0998, + "step": 24367 + }, + { + "epoch": 0.73, + "learning_rate": 8.712434410452889e-07, + "loss": 1.1325, + "step": 24368 + }, + { + "epoch": 0.73, + "learning_rate": 8.710583997361952e-07, + "loss": 1.0598, + "step": 24369 + }, + { + "epoch": 0.73, + "learning_rate": 8.708733739338401e-07, + "loss": 1.0885, + "step": 24370 + }, + { + "epoch": 0.73, + "learning_rate": 8.706883636399862e-07, + "loss": 1.0623, + "step": 24371 + }, + { + "epoch": 0.73, + "learning_rate": 8.70503368856394e-07, + "loss": 1.0737, + "step": 24372 + }, + { + "epoch": 0.73, + "learning_rate": 8.703183895848253e-07, + "loss": 1.1202, + "step": 24373 + }, + { + "epoch": 0.73, + "learning_rate": 8.701334258270413e-07, + "loss": 1.2922, + "step": 24374 + }, + { + "epoch": 0.73, + "learning_rate": 8.699484775848013e-07, + "loss": 1.0792, + "step": 24375 + }, + { + "epoch": 0.73, + "learning_rate": 8.697635448598668e-07, + "loss": 1.0095, + "step": 24376 + }, + { + "epoch": 0.73, + "learning_rate": 8.69578627653998e-07, + "loss": 1.0151, + "step": 24377 + }, + { + "epoch": 0.73, + "learning_rate": 8.693937259689567e-07, + "loss": 1.0399, + "step": 24378 + }, + { + "epoch": 0.73, + "learning_rate": 8.692088398065005e-07, + "loss": 1.1141, + "step": 24379 + }, + { + "epoch": 0.73, + "learning_rate": 8.690239691683911e-07, + "loss": 1.1841, + "step": 24380 + }, + { + "epoch": 0.73, + "learning_rate": 8.688391140563876e-07, + "loss": 1.3054, + "step": 24381 + }, + { + "epoch": 0.73, + "learning_rate": 8.686542744722512e-07, + "loss": 1.2437, + "step": 24382 + }, + { + "epoch": 0.73, + "learning_rate": 8.684694504177396e-07, + "loss": 1.1193, + "step": 24383 + }, + { + "epoch": 0.73, + "learning_rate": 8.682846418946131e-07, + "loss": 1.0865, + "step": 24384 + }, + { + "epoch": 0.73, + "learning_rate": 8.680998489046307e-07, + "loss": 1.0424, + "step": 24385 + }, + { + "epoch": 0.73, + "learning_rate": 8.679150714495522e-07, + "loss": 1.1407, + "step": 24386 + }, + { + "epoch": 0.73, + "learning_rate": 8.677303095311368e-07, + "loss": 1.1151, + "step": 24387 + }, + { + "epoch": 0.73, + "learning_rate": 8.675455631511418e-07, + "loss": 1.1799, + "step": 24388 + }, + { + "epoch": 0.73, + "learning_rate": 8.673608323113269e-07, + "loss": 1.0214, + "step": 24389 + }, + { + "epoch": 0.73, + "learning_rate": 8.671761170134505e-07, + "loss": 1.0259, + "step": 24390 + }, + { + "epoch": 0.73, + "learning_rate": 8.669914172592711e-07, + "loss": 0.9979, + "step": 24391 + }, + { + "epoch": 0.73, + "learning_rate": 8.66806733050547e-07, + "loss": 1.153, + "step": 24392 + }, + { + "epoch": 0.73, + "learning_rate": 8.666220643890364e-07, + "loss": 1.1663, + "step": 24393 + }, + { + "epoch": 0.73, + "learning_rate": 8.664374112764975e-07, + "loss": 0.974, + "step": 24394 + }, + { + "epoch": 0.73, + "learning_rate": 8.662527737146873e-07, + "loss": 1.0746, + "step": 24395 + }, + { + "epoch": 0.73, + "learning_rate": 8.660681517053634e-07, + "loss": 1.0209, + "step": 24396 + }, + { + "epoch": 0.73, + "learning_rate": 8.658835452502839e-07, + "loss": 1.0837, + "step": 24397 + }, + { + "epoch": 0.73, + "learning_rate": 8.656989543512062e-07, + "loss": 1.1033, + "step": 24398 + }, + { + "epoch": 0.74, + "learning_rate": 8.655143790098874e-07, + "loss": 1.0912, + "step": 24399 + }, + { + "epoch": 0.74, + "learning_rate": 8.653298192280851e-07, + "loss": 1.1575, + "step": 24400 + }, + { + "epoch": 0.74, + "learning_rate": 8.651452750075551e-07, + "loss": 1.0545, + "step": 24401 + }, + { + "epoch": 0.74, + "learning_rate": 8.649607463500545e-07, + "loss": 1.0294, + "step": 24402 + }, + { + "epoch": 0.74, + "learning_rate": 8.647762332573401e-07, + "loss": 1.0322, + "step": 24403 + }, + { + "epoch": 0.74, + "learning_rate": 8.645917357311693e-07, + "loss": 1.0141, + "step": 24404 + }, + { + "epoch": 0.74, + "learning_rate": 8.644072537732967e-07, + "loss": 1.0012, + "step": 24405 + }, + { + "epoch": 0.74, + "learning_rate": 8.642227873854794e-07, + "loss": 1.1896, + "step": 24406 + }, + { + "epoch": 0.74, + "learning_rate": 8.640383365694732e-07, + "loss": 1.048, + "step": 24407 + }, + { + "epoch": 0.74, + "learning_rate": 8.63853901327035e-07, + "loss": 1.1642, + "step": 24408 + }, + { + "epoch": 0.74, + "learning_rate": 8.63669481659919e-07, + "loss": 1.0863, + "step": 24409 + }, + { + "epoch": 0.74, + "learning_rate": 8.634850775698814e-07, + "loss": 1.1316, + "step": 24410 + }, + { + "epoch": 0.74, + "learning_rate": 8.633006890586776e-07, + "loss": 1.0914, + "step": 24411 + }, + { + "epoch": 0.74, + "learning_rate": 8.631163161280629e-07, + "loss": 1.2688, + "step": 24412 + }, + { + "epoch": 0.74, + "learning_rate": 8.629319587797935e-07, + "loss": 1.1049, + "step": 24413 + }, + { + "epoch": 0.74, + "learning_rate": 8.627476170156224e-07, + "loss": 1.1539, + "step": 24414 + }, + { + "epoch": 0.74, + "learning_rate": 8.625632908373054e-07, + "loss": 1.0576, + "step": 24415 + }, + { + "epoch": 0.74, + "learning_rate": 8.623789802465976e-07, + "loss": 1.0611, + "step": 24416 + }, + { + "epoch": 0.74, + "learning_rate": 8.621946852452539e-07, + "loss": 1.12, + "step": 24417 + }, + { + "epoch": 0.74, + "learning_rate": 8.62010405835027e-07, + "loss": 1.106, + "step": 24418 + }, + { + "epoch": 0.74, + "learning_rate": 8.618261420176724e-07, + "loss": 1.2224, + "step": 24419 + }, + { + "epoch": 0.74, + "learning_rate": 8.616418937949439e-07, + "loss": 1.2617, + "step": 24420 + }, + { + "epoch": 0.74, + "learning_rate": 8.614576611685954e-07, + "loss": 1.0782, + "step": 24421 + }, + { + "epoch": 0.74, + "learning_rate": 8.612734441403808e-07, + "loss": 1.1162, + "step": 24422 + }, + { + "epoch": 0.74, + "learning_rate": 8.610892427120541e-07, + "loss": 1.2156, + "step": 24423 + }, + { + "epoch": 0.74, + "learning_rate": 8.60905056885368e-07, + "loss": 1.0593, + "step": 24424 + }, + { + "epoch": 0.74, + "learning_rate": 8.607208866620767e-07, + "loss": 1.126, + "step": 24425 + }, + { + "epoch": 0.74, + "learning_rate": 8.605367320439337e-07, + "loss": 1.1011, + "step": 24426 + }, + { + "epoch": 0.74, + "learning_rate": 8.603525930326906e-07, + "loss": 1.0679, + "step": 24427 + }, + { + "epoch": 0.74, + "learning_rate": 8.601684696301014e-07, + "loss": 1.1722, + "step": 24428 + }, + { + "epoch": 0.74, + "learning_rate": 8.599843618379183e-07, + "loss": 1.1466, + "step": 24429 + }, + { + "epoch": 0.74, + "learning_rate": 8.59800269657895e-07, + "loss": 1.05, + "step": 24430 + }, + { + "epoch": 0.74, + "learning_rate": 8.596161930917827e-07, + "loss": 1.1367, + "step": 24431 + }, + { + "epoch": 0.74, + "learning_rate": 8.594321321413338e-07, + "loss": 1.0908, + "step": 24432 + }, + { + "epoch": 0.74, + "learning_rate": 8.592480868083011e-07, + "loss": 1.0514, + "step": 24433 + }, + { + "epoch": 0.74, + "learning_rate": 8.590640570944372e-07, + "loss": 0.9578, + "step": 24434 + }, + { + "epoch": 0.74, + "learning_rate": 8.588800430014923e-07, + "loss": 1.1508, + "step": 24435 + }, + { + "epoch": 0.74, + "learning_rate": 8.586960445312192e-07, + "loss": 1.0342, + "step": 24436 + }, + { + "epoch": 0.74, + "learning_rate": 8.58512061685369e-07, + "loss": 1.21, + "step": 24437 + }, + { + "epoch": 0.74, + "learning_rate": 8.583280944656936e-07, + "loss": 1.1109, + "step": 24438 + }, + { + "epoch": 0.74, + "learning_rate": 8.581441428739448e-07, + "loss": 1.0453, + "step": 24439 + }, + { + "epoch": 0.74, + "learning_rate": 8.579602069118723e-07, + "loss": 1.0578, + "step": 24440 + }, + { + "epoch": 0.74, + "learning_rate": 8.577762865812278e-07, + "loss": 1.1439, + "step": 24441 + }, + { + "epoch": 0.74, + "learning_rate": 8.575923818837619e-07, + "loss": 1.1499, + "step": 24442 + }, + { + "epoch": 0.74, + "learning_rate": 8.574084928212264e-07, + "loss": 1.2003, + "step": 24443 + }, + { + "epoch": 0.74, + "learning_rate": 8.572246193953704e-07, + "loss": 0.9476, + "step": 24444 + }, + { + "epoch": 0.74, + "learning_rate": 8.570407616079446e-07, + "loss": 1.1616, + "step": 24445 + }, + { + "epoch": 0.74, + "learning_rate": 8.568569194606996e-07, + "loss": 1.1163, + "step": 24446 + }, + { + "epoch": 0.74, + "learning_rate": 8.566730929553852e-07, + "loss": 1.12, + "step": 24447 + }, + { + "epoch": 0.74, + "learning_rate": 8.564892820937515e-07, + "loss": 1.0397, + "step": 24448 + }, + { + "epoch": 0.74, + "learning_rate": 8.563054868775483e-07, + "loss": 1.0833, + "step": 24449 + }, + { + "epoch": 0.74, + "learning_rate": 8.561217073085254e-07, + "loss": 1.0683, + "step": 24450 + }, + { + "epoch": 0.74, + "learning_rate": 8.559379433884321e-07, + "loss": 1.1353, + "step": 24451 + }, + { + "epoch": 0.74, + "learning_rate": 8.557541951190185e-07, + "loss": 1.156, + "step": 24452 + }, + { + "epoch": 0.74, + "learning_rate": 8.555704625020322e-07, + "loss": 1.1622, + "step": 24453 + }, + { + "epoch": 0.74, + "learning_rate": 8.553867455392234e-07, + "loss": 1.073, + "step": 24454 + }, + { + "epoch": 0.74, + "learning_rate": 8.552030442323403e-07, + "loss": 1.205, + "step": 24455 + }, + { + "epoch": 0.74, + "learning_rate": 8.550193585831332e-07, + "loss": 1.1964, + "step": 24456 + }, + { + "epoch": 0.74, + "learning_rate": 8.548356885933487e-07, + "loss": 1.1366, + "step": 24457 + }, + { + "epoch": 0.74, + "learning_rate": 8.54652034264736e-07, + "loss": 1.069, + "step": 24458 + }, + { + "epoch": 0.74, + "learning_rate": 8.544683955990435e-07, + "loss": 1.1227, + "step": 24459 + }, + { + "epoch": 0.74, + "learning_rate": 8.542847725980202e-07, + "loss": 1.1166, + "step": 24460 + }, + { + "epoch": 0.74, + "learning_rate": 8.541011652634123e-07, + "loss": 1.064, + "step": 24461 + }, + { + "epoch": 0.74, + "learning_rate": 8.53917573596969e-07, + "loss": 1.1753, + "step": 24462 + }, + { + "epoch": 0.74, + "learning_rate": 8.537339976004371e-07, + "loss": 1.0731, + "step": 24463 + }, + { + "epoch": 0.74, + "learning_rate": 8.535504372755659e-07, + "loss": 1.1513, + "step": 24464 + }, + { + "epoch": 0.74, + "learning_rate": 8.533668926241007e-07, + "loss": 1.1372, + "step": 24465 + }, + { + "epoch": 0.74, + "learning_rate": 8.531833636477896e-07, + "loss": 1.0289, + "step": 24466 + }, + { + "epoch": 0.74, + "learning_rate": 8.529998503483797e-07, + "loss": 1.1176, + "step": 24467 + }, + { + "epoch": 0.74, + "learning_rate": 8.528163527276182e-07, + "loss": 1.0685, + "step": 24468 + }, + { + "epoch": 0.74, + "learning_rate": 8.526328707872522e-07, + "loss": 1.1188, + "step": 24469 + }, + { + "epoch": 0.74, + "learning_rate": 8.524494045290272e-07, + "loss": 1.1873, + "step": 24470 + }, + { + "epoch": 0.74, + "learning_rate": 8.522659539546904e-07, + "loss": 1.0604, + "step": 24471 + }, + { + "epoch": 0.74, + "learning_rate": 8.520825190659882e-07, + "loss": 1.097, + "step": 24472 + }, + { + "epoch": 0.74, + "learning_rate": 8.518990998646664e-07, + "loss": 1.05, + "step": 24473 + }, + { + "epoch": 0.74, + "learning_rate": 8.51715696352472e-07, + "loss": 1.0392, + "step": 24474 + }, + { + "epoch": 0.74, + "learning_rate": 8.5153230853115e-07, + "loss": 1.187, + "step": 24475 + }, + { + "epoch": 0.74, + "learning_rate": 8.513489364024471e-07, + "loss": 1.071, + "step": 24476 + }, + { + "epoch": 0.74, + "learning_rate": 8.511655799681079e-07, + "loss": 0.9125, + "step": 24477 + }, + { + "epoch": 0.74, + "learning_rate": 8.50982239229878e-07, + "loss": 1.1425, + "step": 24478 + }, + { + "epoch": 0.74, + "learning_rate": 8.507989141895031e-07, + "loss": 1.062, + "step": 24479 + }, + { + "epoch": 0.74, + "learning_rate": 8.506156048487282e-07, + "loss": 1.05, + "step": 24480 + }, + { + "epoch": 0.74, + "learning_rate": 8.504323112092985e-07, + "loss": 1.0884, + "step": 24481 + }, + { + "epoch": 0.74, + "learning_rate": 8.502490332729596e-07, + "loss": 1.0538, + "step": 24482 + }, + { + "epoch": 0.74, + "learning_rate": 8.500657710414542e-07, + "loss": 1.085, + "step": 24483 + }, + { + "epoch": 0.74, + "learning_rate": 8.498825245165285e-07, + "loss": 1.0869, + "step": 24484 + }, + { + "epoch": 0.74, + "learning_rate": 8.49699293699926e-07, + "loss": 1.1177, + "step": 24485 + }, + { + "epoch": 0.74, + "learning_rate": 8.495160785933923e-07, + "loss": 1.1487, + "step": 24486 + }, + { + "epoch": 0.74, + "learning_rate": 8.493328791986699e-07, + "loss": 1.0037, + "step": 24487 + }, + { + "epoch": 0.74, + "learning_rate": 8.491496955175036e-07, + "loss": 1.0776, + "step": 24488 + }, + { + "epoch": 0.74, + "learning_rate": 8.48966527551637e-07, + "loss": 1.1245, + "step": 24489 + }, + { + "epoch": 0.74, + "learning_rate": 8.487833753028149e-07, + "loss": 1.0972, + "step": 24490 + }, + { + "epoch": 0.74, + "learning_rate": 8.486002387727788e-07, + "loss": 1.1923, + "step": 24491 + }, + { + "epoch": 0.74, + "learning_rate": 8.48417117963273e-07, + "loss": 1.0596, + "step": 24492 + }, + { + "epoch": 0.74, + "learning_rate": 8.482340128760411e-07, + "loss": 1.1407, + "step": 24493 + }, + { + "epoch": 0.74, + "learning_rate": 8.480509235128257e-07, + "loss": 1.0828, + "step": 24494 + }, + { + "epoch": 0.74, + "learning_rate": 8.478678498753707e-07, + "loss": 1.1464, + "step": 24495 + }, + { + "epoch": 0.74, + "learning_rate": 8.476847919654174e-07, + "loss": 1.1047, + "step": 24496 + }, + { + "epoch": 0.74, + "learning_rate": 8.47501749784709e-07, + "loss": 1.0839, + "step": 24497 + }, + { + "epoch": 0.74, + "learning_rate": 8.47318723334988e-07, + "loss": 1.1356, + "step": 24498 + }, + { + "epoch": 0.74, + "learning_rate": 8.471357126179977e-07, + "loss": 1.0555, + "step": 24499 + }, + { + "epoch": 0.74, + "learning_rate": 8.469527176354786e-07, + "loss": 1.0804, + "step": 24500 + }, + { + "epoch": 0.74, + "learning_rate": 8.467697383891735e-07, + "loss": 1.1783, + "step": 24501 + }, + { + "epoch": 0.74, + "learning_rate": 8.46586774880824e-07, + "loss": 1.1053, + "step": 24502 + }, + { + "epoch": 0.74, + "learning_rate": 8.464038271121724e-07, + "loss": 1.0364, + "step": 24503 + }, + { + "epoch": 0.74, + "learning_rate": 8.462208950849599e-07, + "loss": 1.0842, + "step": 24504 + }, + { + "epoch": 0.74, + "learning_rate": 8.460379788009279e-07, + "loss": 1.1114, + "step": 24505 + }, + { + "epoch": 0.74, + "learning_rate": 8.458550782618177e-07, + "loss": 0.92, + "step": 24506 + }, + { + "epoch": 0.74, + "learning_rate": 8.456721934693706e-07, + "loss": 1.0173, + "step": 24507 + }, + { + "epoch": 0.74, + "learning_rate": 8.454893244253284e-07, + "loss": 0.9927, + "step": 24508 + }, + { + "epoch": 0.74, + "learning_rate": 8.453064711314299e-07, + "loss": 1.0514, + "step": 24509 + }, + { + "epoch": 0.74, + "learning_rate": 8.451236335894172e-07, + "loss": 1.1713, + "step": 24510 + }, + { + "epoch": 0.74, + "learning_rate": 8.449408118010302e-07, + "loss": 1.1207, + "step": 24511 + }, + { + "epoch": 0.74, + "learning_rate": 8.447580057680105e-07, + "loss": 1.1198, + "step": 24512 + }, + { + "epoch": 0.74, + "learning_rate": 8.445752154920966e-07, + "loss": 1.0844, + "step": 24513 + }, + { + "epoch": 0.74, + "learning_rate": 8.443924409750293e-07, + "loss": 1.1227, + "step": 24514 + }, + { + "epoch": 0.74, + "learning_rate": 8.442096822185486e-07, + "loss": 1.1868, + "step": 24515 + }, + { + "epoch": 0.74, + "learning_rate": 8.440269392243952e-07, + "loss": 1.2178, + "step": 24516 + }, + { + "epoch": 0.74, + "learning_rate": 8.438442119943069e-07, + "loss": 1.0847, + "step": 24517 + }, + { + "epoch": 0.74, + "learning_rate": 8.436615005300242e-07, + "loss": 1.1379, + "step": 24518 + }, + { + "epoch": 0.74, + "learning_rate": 8.434788048332862e-07, + "loss": 1.1143, + "step": 24519 + }, + { + "epoch": 0.74, + "learning_rate": 8.432961249058321e-07, + "loss": 1.1418, + "step": 24520 + }, + { + "epoch": 0.74, + "learning_rate": 8.431134607494019e-07, + "loss": 1.0953, + "step": 24521 + }, + { + "epoch": 0.74, + "learning_rate": 8.429308123657326e-07, + "loss": 1.1379, + "step": 24522 + }, + { + "epoch": 0.74, + "learning_rate": 8.42748179756564e-07, + "loss": 1.0389, + "step": 24523 + }, + { + "epoch": 0.74, + "learning_rate": 8.425655629236346e-07, + "loss": 1.1331, + "step": 24524 + }, + { + "epoch": 0.74, + "learning_rate": 8.423829618686835e-07, + "loss": 1.1325, + "step": 24525 + }, + { + "epoch": 0.74, + "learning_rate": 8.422003765934475e-07, + "loss": 1.0735, + "step": 24526 + }, + { + "epoch": 0.74, + "learning_rate": 8.420178070996657e-07, + "loss": 1.0702, + "step": 24527 + }, + { + "epoch": 0.74, + "learning_rate": 8.418352533890756e-07, + "loss": 1.2233, + "step": 24528 + }, + { + "epoch": 0.74, + "learning_rate": 8.416527154634155e-07, + "loss": 1.1292, + "step": 24529 + }, + { + "epoch": 0.74, + "learning_rate": 8.414701933244226e-07, + "loss": 1.1304, + "step": 24530 + }, + { + "epoch": 0.74, + "learning_rate": 8.412876869738348e-07, + "loss": 1.152, + "step": 24531 + }, + { + "epoch": 0.74, + "learning_rate": 8.411051964133895e-07, + "loss": 1.208, + "step": 24532 + }, + { + "epoch": 0.74, + "learning_rate": 8.409227216448234e-07, + "loss": 1.0924, + "step": 24533 + }, + { + "epoch": 0.74, + "learning_rate": 8.407402626698752e-07, + "loss": 1.2433, + "step": 24534 + }, + { + "epoch": 0.74, + "learning_rate": 8.405578194902797e-07, + "loss": 1.184, + "step": 24535 + }, + { + "epoch": 0.74, + "learning_rate": 8.403753921077743e-07, + "loss": 1.0286, + "step": 24536 + }, + { + "epoch": 0.74, + "learning_rate": 8.40192980524096e-07, + "loss": 1.1091, + "step": 24537 + }, + { + "epoch": 0.74, + "learning_rate": 8.400105847409821e-07, + "loss": 1.1066, + "step": 24538 + }, + { + "epoch": 0.74, + "learning_rate": 8.398282047601669e-07, + "loss": 1.1624, + "step": 24539 + }, + { + "epoch": 0.74, + "learning_rate": 8.396458405833876e-07, + "loss": 1.0468, + "step": 24540 + }, + { + "epoch": 0.74, + "learning_rate": 8.394634922123804e-07, + "loss": 1.042, + "step": 24541 + }, + { + "epoch": 0.74, + "learning_rate": 8.392811596488818e-07, + "loss": 1.0807, + "step": 24542 + }, + { + "epoch": 0.74, + "learning_rate": 8.390988428946259e-07, + "loss": 1.2085, + "step": 24543 + }, + { + "epoch": 0.74, + "learning_rate": 8.38916541951349e-07, + "loss": 1.1112, + "step": 24544 + }, + { + "epoch": 0.74, + "learning_rate": 8.387342568207868e-07, + "loss": 1.0842, + "step": 24545 + }, + { + "epoch": 0.74, + "learning_rate": 8.385519875046741e-07, + "loss": 1.0848, + "step": 24546 + }, + { + "epoch": 0.74, + "learning_rate": 8.383697340047475e-07, + "loss": 1.1502, + "step": 24547 + }, + { + "epoch": 0.74, + "learning_rate": 8.381874963227396e-07, + "loss": 1.1472, + "step": 24548 + }, + { + "epoch": 0.74, + "learning_rate": 8.380052744603867e-07, + "loss": 1.046, + "step": 24549 + }, + { + "epoch": 0.74, + "learning_rate": 8.378230684194227e-07, + "loss": 1.0726, + "step": 24550 + }, + { + "epoch": 0.74, + "learning_rate": 8.376408782015838e-07, + "loss": 1.035, + "step": 24551 + }, + { + "epoch": 0.74, + "learning_rate": 8.374587038086022e-07, + "loss": 1.0292, + "step": 24552 + }, + { + "epoch": 0.74, + "learning_rate": 8.372765452422129e-07, + "loss": 1.115, + "step": 24553 + }, + { + "epoch": 0.74, + "learning_rate": 8.370944025041502e-07, + "loss": 1.0109, + "step": 24554 + }, + { + "epoch": 0.74, + "learning_rate": 8.369122755961479e-07, + "loss": 1.2051, + "step": 24555 + }, + { + "epoch": 0.74, + "learning_rate": 8.367301645199396e-07, + "loss": 1.2083, + "step": 24556 + }, + { + "epoch": 0.74, + "learning_rate": 8.365480692772593e-07, + "loss": 1.0701, + "step": 24557 + }, + { + "epoch": 0.74, + "learning_rate": 8.363659898698401e-07, + "loss": 1.0588, + "step": 24558 + }, + { + "epoch": 0.74, + "learning_rate": 8.361839262994165e-07, + "loss": 1.076, + "step": 24559 + }, + { + "epoch": 0.74, + "learning_rate": 8.360018785677195e-07, + "loss": 1.1391, + "step": 24560 + }, + { + "epoch": 0.74, + "learning_rate": 8.358198466764833e-07, + "loss": 1.2283, + "step": 24561 + }, + { + "epoch": 0.74, + "learning_rate": 8.356378306274407e-07, + "loss": 1.0784, + "step": 24562 + }, + { + "epoch": 0.74, + "learning_rate": 8.354558304223242e-07, + "loss": 1.0969, + "step": 24563 + }, + { + "epoch": 0.74, + "learning_rate": 8.352738460628676e-07, + "loss": 1.1245, + "step": 24564 + }, + { + "epoch": 0.74, + "learning_rate": 8.350918775508013e-07, + "loss": 1.2016, + "step": 24565 + }, + { + "epoch": 0.74, + "learning_rate": 8.349099248878584e-07, + "loss": 1.0722, + "step": 24566 + }, + { + "epoch": 0.74, + "learning_rate": 8.347279880757711e-07, + "loss": 1.1699, + "step": 24567 + }, + { + "epoch": 0.74, + "learning_rate": 8.345460671162723e-07, + "loss": 1.1823, + "step": 24568 + }, + { + "epoch": 0.74, + "learning_rate": 8.343641620110918e-07, + "loss": 1.138, + "step": 24569 + }, + { + "epoch": 0.74, + "learning_rate": 8.341822727619625e-07, + "loss": 1.1031, + "step": 24570 + }, + { + "epoch": 0.74, + "learning_rate": 8.340003993706155e-07, + "loss": 1.1052, + "step": 24571 + }, + { + "epoch": 0.74, + "learning_rate": 8.338185418387823e-07, + "loss": 1.0768, + "step": 24572 + }, + { + "epoch": 0.74, + "learning_rate": 8.33636700168195e-07, + "loss": 1.1513, + "step": 24573 + }, + { + "epoch": 0.74, + "learning_rate": 8.33454874360583e-07, + "loss": 1.0609, + "step": 24574 + }, + { + "epoch": 0.74, + "learning_rate": 8.332730644176781e-07, + "loss": 1.1351, + "step": 24575 + }, + { + "epoch": 0.74, + "learning_rate": 8.330912703412106e-07, + "loss": 0.9837, + "step": 24576 + }, + { + "epoch": 0.74, + "learning_rate": 8.329094921329123e-07, + "loss": 1.0413, + "step": 24577 + }, + { + "epoch": 0.74, + "learning_rate": 8.327277297945121e-07, + "loss": 1.14, + "step": 24578 + }, + { + "epoch": 0.74, + "learning_rate": 8.325459833277408e-07, + "loss": 1.0823, + "step": 24579 + }, + { + "epoch": 0.74, + "learning_rate": 8.323642527343287e-07, + "loss": 1.1734, + "step": 24580 + }, + { + "epoch": 0.74, + "learning_rate": 8.321825380160064e-07, + "loss": 1.1536, + "step": 24581 + }, + { + "epoch": 0.74, + "learning_rate": 8.320008391745025e-07, + "loss": 1.1799, + "step": 24582 + }, + { + "epoch": 0.74, + "learning_rate": 8.318191562115472e-07, + "loss": 1.1423, + "step": 24583 + }, + { + "epoch": 0.74, + "learning_rate": 8.316374891288701e-07, + "loss": 1.2207, + "step": 24584 + }, + { + "epoch": 0.74, + "learning_rate": 8.314558379282006e-07, + "loss": 1.2458, + "step": 24585 + }, + { + "epoch": 0.74, + "learning_rate": 8.312742026112678e-07, + "loss": 1.067, + "step": 24586 + }, + { + "epoch": 0.74, + "learning_rate": 8.310925831798011e-07, + "loss": 1.0605, + "step": 24587 + }, + { + "epoch": 0.74, + "learning_rate": 8.309109796355291e-07, + "loss": 1.2183, + "step": 24588 + }, + { + "epoch": 0.74, + "learning_rate": 8.307293919801806e-07, + "loss": 1.1536, + "step": 24589 + }, + { + "epoch": 0.74, + "learning_rate": 8.305478202154855e-07, + "loss": 1.0141, + "step": 24590 + }, + { + "epoch": 0.74, + "learning_rate": 8.3036626434317e-07, + "loss": 1.2156, + "step": 24591 + }, + { + "epoch": 0.74, + "learning_rate": 8.301847243649638e-07, + "loss": 1.1773, + "step": 24592 + }, + { + "epoch": 0.74, + "learning_rate": 8.300032002825945e-07, + "loss": 1.0278, + "step": 24593 + }, + { + "epoch": 0.74, + "learning_rate": 8.298216920977914e-07, + "loss": 1.096, + "step": 24594 + }, + { + "epoch": 0.74, + "learning_rate": 8.296401998122808e-07, + "loss": 1.0823, + "step": 24595 + }, + { + "epoch": 0.74, + "learning_rate": 8.294587234277906e-07, + "loss": 1.095, + "step": 24596 + }, + { + "epoch": 0.74, + "learning_rate": 8.292772629460491e-07, + "loss": 1.0659, + "step": 24597 + }, + { + "epoch": 0.74, + "learning_rate": 8.290958183687833e-07, + "loss": 1.1143, + "step": 24598 + }, + { + "epoch": 0.74, + "learning_rate": 8.289143896977214e-07, + "loss": 1.1305, + "step": 24599 + }, + { + "epoch": 0.74, + "learning_rate": 8.287329769345889e-07, + "loss": 1.1992, + "step": 24600 + }, + { + "epoch": 0.74, + "learning_rate": 8.285515800811137e-07, + "loss": 1.0962, + "step": 24601 + }, + { + "epoch": 0.74, + "learning_rate": 8.283701991390222e-07, + "loss": 1.0247, + "step": 24602 + }, + { + "epoch": 0.74, + "learning_rate": 8.281888341100422e-07, + "loss": 1.0595, + "step": 24603 + }, + { + "epoch": 0.74, + "learning_rate": 8.280074849958986e-07, + "loss": 1.1261, + "step": 24604 + }, + { + "epoch": 0.74, + "learning_rate": 8.278261517983185e-07, + "loss": 1.0035, + "step": 24605 + }, + { + "epoch": 0.74, + "learning_rate": 8.27644834519028e-07, + "loss": 1.1981, + "step": 24606 + }, + { + "epoch": 0.74, + "learning_rate": 8.274635331597541e-07, + "loss": 1.16, + "step": 24607 + }, + { + "epoch": 0.74, + "learning_rate": 8.272822477222211e-07, + "loss": 1.1304, + "step": 24608 + }, + { + "epoch": 0.74, + "learning_rate": 8.271009782081554e-07, + "loss": 1.078, + "step": 24609 + }, + { + "epoch": 0.74, + "learning_rate": 8.269197246192826e-07, + "loss": 1.197, + "step": 24610 + }, + { + "epoch": 0.74, + "learning_rate": 8.267384869573283e-07, + "loss": 1.176, + "step": 24611 + }, + { + "epoch": 0.74, + "learning_rate": 8.265572652240178e-07, + "loss": 1.0749, + "step": 24612 + }, + { + "epoch": 0.74, + "learning_rate": 8.263760594210762e-07, + "loss": 1.1382, + "step": 24613 + }, + { + "epoch": 0.74, + "learning_rate": 8.261948695502284e-07, + "loss": 1.0977, + "step": 24614 + }, + { + "epoch": 0.74, + "learning_rate": 8.260136956131993e-07, + "loss": 1.0374, + "step": 24615 + }, + { + "epoch": 0.74, + "learning_rate": 8.258325376117144e-07, + "loss": 1.1804, + "step": 24616 + }, + { + "epoch": 0.74, + "learning_rate": 8.256513955474968e-07, + "loss": 1.1771, + "step": 24617 + }, + { + "epoch": 0.74, + "learning_rate": 8.254702694222714e-07, + "loss": 1.1373, + "step": 24618 + }, + { + "epoch": 0.74, + "learning_rate": 8.252891592377624e-07, + "loss": 1.1304, + "step": 24619 + }, + { + "epoch": 0.74, + "learning_rate": 8.251080649956949e-07, + "loss": 1.0309, + "step": 24620 + }, + { + "epoch": 0.74, + "learning_rate": 8.249269866977913e-07, + "loss": 1.0724, + "step": 24621 + }, + { + "epoch": 0.74, + "learning_rate": 8.247459243457759e-07, + "loss": 1.0978, + "step": 24622 + }, + { + "epoch": 0.74, + "learning_rate": 8.245648779413726e-07, + "loss": 1.2299, + "step": 24623 + }, + { + "epoch": 0.74, + "learning_rate": 8.243838474863048e-07, + "loss": 1.1565, + "step": 24624 + }, + { + "epoch": 0.74, + "learning_rate": 8.242028329822966e-07, + "loss": 1.1628, + "step": 24625 + }, + { + "epoch": 0.74, + "learning_rate": 8.240218344310693e-07, + "loss": 1.1, + "step": 24626 + }, + { + "epoch": 0.74, + "learning_rate": 8.238408518343468e-07, + "loss": 1.0388, + "step": 24627 + }, + { + "epoch": 0.74, + "learning_rate": 8.236598851938526e-07, + "loss": 1.1549, + "step": 24628 + }, + { + "epoch": 0.74, + "learning_rate": 8.234789345113095e-07, + "loss": 1.0367, + "step": 24629 + }, + { + "epoch": 0.74, + "learning_rate": 8.232979997884389e-07, + "loss": 1.1798, + "step": 24630 + }, + { + "epoch": 0.74, + "learning_rate": 8.231170810269634e-07, + "loss": 1.0331, + "step": 24631 + }, + { + "epoch": 0.74, + "learning_rate": 8.229361782286061e-07, + "loss": 1.0019, + "step": 24632 + }, + { + "epoch": 0.74, + "learning_rate": 8.227552913950892e-07, + "loss": 1.071, + "step": 24633 + }, + { + "epoch": 0.74, + "learning_rate": 8.225744205281333e-07, + "loss": 1.2103, + "step": 24634 + }, + { + "epoch": 0.74, + "learning_rate": 8.223935656294612e-07, + "loss": 1.0537, + "step": 24635 + }, + { + "epoch": 0.74, + "learning_rate": 8.222127267007946e-07, + "loss": 1.0988, + "step": 24636 + }, + { + "epoch": 0.74, + "learning_rate": 8.220319037438543e-07, + "loss": 1.1214, + "step": 24637 + }, + { + "epoch": 0.74, + "learning_rate": 8.218510967603624e-07, + "loss": 1.1797, + "step": 24638 + }, + { + "epoch": 0.74, + "learning_rate": 8.216703057520401e-07, + "loss": 1.1467, + "step": 24639 + }, + { + "epoch": 0.74, + "learning_rate": 8.214895307206078e-07, + "loss": 1.1141, + "step": 24640 + }, + { + "epoch": 0.74, + "learning_rate": 8.213087716677876e-07, + "loss": 0.9458, + "step": 24641 + }, + { + "epoch": 0.74, + "learning_rate": 8.211280285952989e-07, + "loss": 1.0098, + "step": 24642 + }, + { + "epoch": 0.74, + "learning_rate": 8.209473015048625e-07, + "loss": 1.0865, + "step": 24643 + }, + { + "epoch": 0.74, + "learning_rate": 8.20766590398199e-07, + "loss": 1.0913, + "step": 24644 + }, + { + "epoch": 0.74, + "learning_rate": 8.20585895277029e-07, + "loss": 1.1538, + "step": 24645 + }, + { + "epoch": 0.74, + "learning_rate": 8.204052161430734e-07, + "loss": 1.2142, + "step": 24646 + }, + { + "epoch": 0.74, + "learning_rate": 8.202245529980505e-07, + "loss": 1.16, + "step": 24647 + }, + { + "epoch": 0.74, + "learning_rate": 8.200439058436804e-07, + "loss": 1.2032, + "step": 24648 + }, + { + "epoch": 0.74, + "learning_rate": 8.198632746816834e-07, + "loss": 1.058, + "step": 24649 + }, + { + "epoch": 0.74, + "learning_rate": 8.1968265951378e-07, + "loss": 1.1767, + "step": 24650 + }, + { + "epoch": 0.74, + "learning_rate": 8.19502060341687e-07, + "loss": 1.0941, + "step": 24651 + }, + { + "epoch": 0.74, + "learning_rate": 8.193214771671254e-07, + "loss": 1.075, + "step": 24652 + }, + { + "epoch": 0.74, + "learning_rate": 8.191409099918138e-07, + "loss": 1.1549, + "step": 24653 + }, + { + "epoch": 0.74, + "learning_rate": 8.189603588174713e-07, + "loss": 1.1409, + "step": 24654 + }, + { + "epoch": 0.74, + "learning_rate": 8.187798236458175e-07, + "loss": 1.054, + "step": 24655 + }, + { + "epoch": 0.74, + "learning_rate": 8.18599304478569e-07, + "loss": 0.9495, + "step": 24656 + }, + { + "epoch": 0.74, + "learning_rate": 8.184188013174455e-07, + "loss": 1.1254, + "step": 24657 + }, + { + "epoch": 0.74, + "learning_rate": 8.182383141641651e-07, + "loss": 1.1172, + "step": 24658 + }, + { + "epoch": 0.74, + "learning_rate": 8.180578430204467e-07, + "loss": 1.1291, + "step": 24659 + }, + { + "epoch": 0.74, + "learning_rate": 8.178773878880066e-07, + "loss": 1.2214, + "step": 24660 + }, + { + "epoch": 0.74, + "learning_rate": 8.17696948768564e-07, + "loss": 1.1189, + "step": 24661 + }, + { + "epoch": 0.74, + "learning_rate": 8.175165256638359e-07, + "loss": 1.1634, + "step": 24662 + }, + { + "epoch": 0.74, + "learning_rate": 8.173361185755412e-07, + "loss": 1.0888, + "step": 24663 + }, + { + "epoch": 0.74, + "learning_rate": 8.171557275053954e-07, + "loss": 1.0172, + "step": 24664 + }, + { + "epoch": 0.74, + "learning_rate": 8.169753524551167e-07, + "loss": 1.1289, + "step": 24665 + }, + { + "epoch": 0.74, + "learning_rate": 8.167949934264219e-07, + "loss": 1.0341, + "step": 24666 + }, + { + "epoch": 0.74, + "learning_rate": 8.166146504210281e-07, + "loss": 1.1273, + "step": 24667 + }, + { + "epoch": 0.74, + "learning_rate": 8.164343234406522e-07, + "loss": 1.0041, + "step": 24668 + }, + { + "epoch": 0.74, + "learning_rate": 8.162540124870108e-07, + "loss": 1.1046, + "step": 24669 + }, + { + "epoch": 0.74, + "learning_rate": 8.1607371756182e-07, + "loss": 1.1652, + "step": 24670 + }, + { + "epoch": 0.74, + "learning_rate": 8.158934386667966e-07, + "loss": 1.0433, + "step": 24671 + }, + { + "epoch": 0.74, + "learning_rate": 8.157131758036572e-07, + "loss": 1.1329, + "step": 24672 + }, + { + "epoch": 0.74, + "learning_rate": 8.155329289741166e-07, + "loss": 1.1068, + "step": 24673 + }, + { + "epoch": 0.74, + "learning_rate": 8.15352698179891e-07, + "loss": 1.0967, + "step": 24674 + }, + { + "epoch": 0.74, + "learning_rate": 8.151724834226965e-07, + "loss": 1.1478, + "step": 24675 + }, + { + "epoch": 0.74, + "learning_rate": 8.149922847042493e-07, + "loss": 1.0644, + "step": 24676 + }, + { + "epoch": 0.74, + "learning_rate": 8.148121020262634e-07, + "loss": 1.0728, + "step": 24677 + }, + { + "epoch": 0.74, + "learning_rate": 8.146319353904545e-07, + "loss": 1.0644, + "step": 24678 + }, + { + "epoch": 0.74, + "learning_rate": 8.144517847985378e-07, + "loss": 1.1104, + "step": 24679 + }, + { + "epoch": 0.74, + "learning_rate": 8.142716502522283e-07, + "loss": 1.2894, + "step": 24680 + }, + { + "epoch": 0.74, + "learning_rate": 8.140915317532419e-07, + "loss": 1.162, + "step": 24681 + }, + { + "epoch": 0.74, + "learning_rate": 8.13911429303291e-07, + "loss": 1.1441, + "step": 24682 + }, + { + "epoch": 0.74, + "learning_rate": 8.137313429040916e-07, + "loss": 1.2173, + "step": 24683 + }, + { + "epoch": 0.74, + "learning_rate": 8.135512725573574e-07, + "loss": 1.1066, + "step": 24684 + }, + { + "epoch": 0.74, + "learning_rate": 8.133712182648038e-07, + "loss": 1.174, + "step": 24685 + }, + { + "epoch": 0.74, + "learning_rate": 8.131911800281431e-07, + "loss": 1.201, + "step": 24686 + }, + { + "epoch": 0.74, + "learning_rate": 8.130111578490899e-07, + "loss": 1.0496, + "step": 24687 + }, + { + "epoch": 0.74, + "learning_rate": 8.12831151729358e-07, + "loss": 1.2411, + "step": 24688 + }, + { + "epoch": 0.74, + "learning_rate": 8.126511616706617e-07, + "loss": 1.1139, + "step": 24689 + }, + { + "epoch": 0.74, + "learning_rate": 8.124711876747129e-07, + "loss": 1.0851, + "step": 24690 + }, + { + "epoch": 0.74, + "learning_rate": 8.122912297432259e-07, + "loss": 1.1113, + "step": 24691 + }, + { + "epoch": 0.74, + "learning_rate": 8.121112878779133e-07, + "loss": 1.147, + "step": 24692 + }, + { + "epoch": 0.74, + "learning_rate": 8.119313620804886e-07, + "loss": 1.229, + "step": 24693 + }, + { + "epoch": 0.74, + "learning_rate": 8.11751452352664e-07, + "loss": 1.1057, + "step": 24694 + }, + { + "epoch": 0.74, + "learning_rate": 8.115715586961526e-07, + "loss": 1.068, + "step": 24695 + }, + { + "epoch": 0.74, + "learning_rate": 8.113916811126668e-07, + "loss": 1.0366, + "step": 24696 + }, + { + "epoch": 0.74, + "learning_rate": 8.11211819603919e-07, + "loss": 1.0895, + "step": 24697 + }, + { + "epoch": 0.74, + "learning_rate": 8.110319741716222e-07, + "loss": 1.0544, + "step": 24698 + }, + { + "epoch": 0.74, + "learning_rate": 8.108521448174866e-07, + "loss": 1.2122, + "step": 24699 + }, + { + "epoch": 0.74, + "learning_rate": 8.106723315432252e-07, + "loss": 1.105, + "step": 24700 + }, + { + "epoch": 0.74, + "learning_rate": 8.104925343505493e-07, + "loss": 1.0658, + "step": 24701 + }, + { + "epoch": 0.74, + "learning_rate": 8.10312753241172e-07, + "loss": 1.1724, + "step": 24702 + }, + { + "epoch": 0.74, + "learning_rate": 8.101329882168024e-07, + "loss": 1.0802, + "step": 24703 + }, + { + "epoch": 0.74, + "learning_rate": 8.099532392791529e-07, + "loss": 1.0234, + "step": 24704 + }, + { + "epoch": 0.74, + "learning_rate": 8.097735064299348e-07, + "loss": 1.1655, + "step": 24705 + }, + { + "epoch": 0.74, + "learning_rate": 8.095937896708588e-07, + "loss": 1.2166, + "step": 24706 + }, + { + "epoch": 0.74, + "learning_rate": 8.094140890036364e-07, + "loss": 1.0361, + "step": 24707 + }, + { + "epoch": 0.74, + "learning_rate": 8.092344044299771e-07, + "loss": 1.0545, + "step": 24708 + }, + { + "epoch": 0.74, + "learning_rate": 8.090547359515919e-07, + "loss": 1.0544, + "step": 24709 + }, + { + "epoch": 0.74, + "learning_rate": 8.088750835701912e-07, + "loss": 1.1125, + "step": 24710 + }, + { + "epoch": 0.74, + "learning_rate": 8.086954472874861e-07, + "loss": 1.0974, + "step": 24711 + }, + { + "epoch": 0.74, + "learning_rate": 8.085158271051849e-07, + "loss": 1.0858, + "step": 24712 + }, + { + "epoch": 0.74, + "learning_rate": 8.083362230249983e-07, + "loss": 1.1219, + "step": 24713 + }, + { + "epoch": 0.74, + "learning_rate": 8.081566350486364e-07, + "loss": 1.095, + "step": 24714 + }, + { + "epoch": 0.74, + "learning_rate": 8.079770631778092e-07, + "loss": 1.0604, + "step": 24715 + }, + { + "epoch": 0.74, + "learning_rate": 8.077975074142244e-07, + "loss": 1.1328, + "step": 24716 + }, + { + "epoch": 0.74, + "learning_rate": 8.076179677595927e-07, + "loss": 1.1045, + "step": 24717 + }, + { + "epoch": 0.74, + "learning_rate": 8.074384442156227e-07, + "loss": 1.2075, + "step": 24718 + }, + { + "epoch": 0.74, + "learning_rate": 8.072589367840236e-07, + "loss": 1.1296, + "step": 24719 + }, + { + "epoch": 0.74, + "learning_rate": 8.07079445466504e-07, + "loss": 1.1022, + "step": 24720 + }, + { + "epoch": 0.74, + "learning_rate": 8.068999702647728e-07, + "loss": 1.0016, + "step": 24721 + }, + { + "epoch": 0.74, + "learning_rate": 8.067205111805384e-07, + "loss": 1.2323, + "step": 24722 + }, + { + "epoch": 0.74, + "learning_rate": 8.065410682155103e-07, + "loss": 1.1415, + "step": 24723 + }, + { + "epoch": 0.74, + "learning_rate": 8.063616413713945e-07, + "loss": 1.0684, + "step": 24724 + }, + { + "epoch": 0.74, + "learning_rate": 8.061822306499007e-07, + "loss": 1.2753, + "step": 24725 + }, + { + "epoch": 0.74, + "learning_rate": 8.060028360527359e-07, + "loss": 1.1539, + "step": 24726 + }, + { + "epoch": 0.74, + "learning_rate": 8.058234575816082e-07, + "loss": 1.1266, + "step": 24727 + }, + { + "epoch": 0.74, + "learning_rate": 8.05644095238226e-07, + "loss": 1.0786, + "step": 24728 + }, + { + "epoch": 0.74, + "learning_rate": 8.054647490242953e-07, + "loss": 1.048, + "step": 24729 + }, + { + "epoch": 0.74, + "learning_rate": 8.052854189415243e-07, + "loss": 1.0671, + "step": 24730 + }, + { + "epoch": 0.75, + "learning_rate": 8.051061049916198e-07, + "loss": 1.1596, + "step": 24731 + }, + { + "epoch": 0.75, + "learning_rate": 8.049268071762886e-07, + "loss": 1.1091, + "step": 24732 + }, + { + "epoch": 0.75, + "learning_rate": 8.04747525497239e-07, + "loss": 1.136, + "step": 24733 + }, + { + "epoch": 0.75, + "learning_rate": 8.045682599561755e-07, + "loss": 1.0074, + "step": 24734 + }, + { + "epoch": 0.75, + "learning_rate": 8.043890105548055e-07, + "loss": 1.136, + "step": 24735 + }, + { + "epoch": 0.75, + "learning_rate": 8.042097772948357e-07, + "loss": 1.0746, + "step": 24736 + }, + { + "epoch": 0.75, + "learning_rate": 8.040305601779727e-07, + "loss": 1.1553, + "step": 24737 + }, + { + "epoch": 0.75, + "learning_rate": 8.038513592059213e-07, + "loss": 1.1393, + "step": 24738 + }, + { + "epoch": 0.75, + "learning_rate": 8.03672174380388e-07, + "loss": 1.0756, + "step": 24739 + }, + { + "epoch": 0.75, + "learning_rate": 8.034930057030788e-07, + "loss": 1.1235, + "step": 24740 + }, + { + "epoch": 0.75, + "learning_rate": 8.033138531756998e-07, + "loss": 0.9929, + "step": 24741 + }, + { + "epoch": 0.75, + "learning_rate": 8.031347167999548e-07, + "loss": 1.2403, + "step": 24742 + }, + { + "epoch": 0.75, + "learning_rate": 8.029555965775504e-07, + "loss": 1.0282, + "step": 24743 + }, + { + "epoch": 0.75, + "learning_rate": 8.02776492510191e-07, + "loss": 1.1538, + "step": 24744 + }, + { + "epoch": 0.75, + "learning_rate": 8.025974045995822e-07, + "loss": 1.0918, + "step": 24745 + }, + { + "epoch": 0.75, + "learning_rate": 8.024183328474294e-07, + "loss": 1.0217, + "step": 24746 + }, + { + "epoch": 0.75, + "learning_rate": 8.022392772554358e-07, + "loss": 1.1326, + "step": 24747 + }, + { + "epoch": 0.75, + "learning_rate": 8.020602378253064e-07, + "loss": 1.1895, + "step": 24748 + }, + { + "epoch": 0.75, + "learning_rate": 8.01881214558746e-07, + "loss": 1.0988, + "step": 24749 + }, + { + "epoch": 0.75, + "learning_rate": 8.017022074574585e-07, + "loss": 0.9666, + "step": 24750 + }, + { + "epoch": 0.75, + "learning_rate": 8.015232165231479e-07, + "loss": 1.1589, + "step": 24751 + }, + { + "epoch": 0.75, + "learning_rate": 8.013442417575184e-07, + "loss": 1.0751, + "step": 24752 + }, + { + "epoch": 0.75, + "learning_rate": 8.011652831622735e-07, + "loss": 1.0298, + "step": 24753 + }, + { + "epoch": 0.75, + "learning_rate": 8.00986340739118e-07, + "loss": 1.1941, + "step": 24754 + }, + { + "epoch": 0.75, + "learning_rate": 8.008074144897532e-07, + "loss": 1.2192, + "step": 24755 + }, + { + "epoch": 0.75, + "learning_rate": 8.006285044158835e-07, + "loss": 1.2432, + "step": 24756 + }, + { + "epoch": 0.75, + "learning_rate": 8.00449610519212e-07, + "loss": 1.1302, + "step": 24757 + }, + { + "epoch": 0.75, + "learning_rate": 8.002707328014417e-07, + "loss": 1.0853, + "step": 24758 + }, + { + "epoch": 0.75, + "learning_rate": 8.000918712642763e-07, + "loss": 1.1115, + "step": 24759 + }, + { + "epoch": 0.75, + "learning_rate": 7.999130259094168e-07, + "loss": 1.1368, + "step": 24760 + }, + { + "epoch": 0.75, + "learning_rate": 7.997341967385664e-07, + "loss": 1.2343, + "step": 24761 + }, + { + "epoch": 0.75, + "learning_rate": 7.995553837534275e-07, + "loss": 1.2468, + "step": 24762 + }, + { + "epoch": 0.75, + "learning_rate": 7.993765869557033e-07, + "loss": 1.0437, + "step": 24763 + }, + { + "epoch": 0.75, + "learning_rate": 7.99197806347094e-07, + "loss": 1.1016, + "step": 24764 + }, + { + "epoch": 0.75, + "learning_rate": 7.990190419293025e-07, + "loss": 1.0708, + "step": 24765 + }, + { + "epoch": 0.75, + "learning_rate": 7.988402937040307e-07, + "loss": 1.1339, + "step": 24766 + }, + { + "epoch": 0.75, + "learning_rate": 7.986615616729807e-07, + "loss": 1.1161, + "step": 24767 + }, + { + "epoch": 0.75, + "learning_rate": 7.984828458378522e-07, + "loss": 1.083, + "step": 24768 + }, + { + "epoch": 0.75, + "learning_rate": 7.983041462003477e-07, + "loss": 1.1143, + "step": 24769 + }, + { + "epoch": 0.75, + "learning_rate": 7.981254627621682e-07, + "loss": 1.0918, + "step": 24770 + }, + { + "epoch": 0.75, + "learning_rate": 7.979467955250148e-07, + "loss": 1.1533, + "step": 24771 + }, + { + "epoch": 0.75, + "learning_rate": 7.977681444905885e-07, + "loss": 1.1568, + "step": 24772 + }, + { + "epoch": 0.75, + "learning_rate": 7.975895096605893e-07, + "loss": 1.075, + "step": 24773 + }, + { + "epoch": 0.75, + "learning_rate": 7.974108910367179e-07, + "loss": 1.0854, + "step": 24774 + }, + { + "epoch": 0.75, + "learning_rate": 7.972322886206748e-07, + "loss": 1.0411, + "step": 24775 + }, + { + "epoch": 0.75, + "learning_rate": 7.970537024141603e-07, + "loss": 1.0669, + "step": 24776 + }, + { + "epoch": 0.75, + "learning_rate": 7.968751324188743e-07, + "loss": 1.0648, + "step": 24777 + }, + { + "epoch": 0.75, + "learning_rate": 7.966965786365169e-07, + "loss": 1.0878, + "step": 24778 + }, + { + "epoch": 0.75, + "learning_rate": 7.965180410687876e-07, + "loss": 1.0808, + "step": 24779 + }, + { + "epoch": 0.75, + "learning_rate": 7.96339519717387e-07, + "loss": 1.0986, + "step": 24780 + }, + { + "epoch": 0.75, + "learning_rate": 7.961610145840126e-07, + "loss": 1.1115, + "step": 24781 + }, + { + "epoch": 0.75, + "learning_rate": 7.959825256703652e-07, + "loss": 1.0697, + "step": 24782 + }, + { + "epoch": 0.75, + "learning_rate": 7.958040529781433e-07, + "loss": 1.0372, + "step": 24783 + }, + { + "epoch": 0.75, + "learning_rate": 7.956255965090459e-07, + "loss": 1.0574, + "step": 24784 + }, + { + "epoch": 0.75, + "learning_rate": 7.954471562647729e-07, + "loss": 1.1423, + "step": 24785 + }, + { + "epoch": 0.75, + "learning_rate": 7.952687322470212e-07, + "loss": 1.1792, + "step": 24786 + }, + { + "epoch": 0.75, + "learning_rate": 7.950903244574901e-07, + "loss": 1.0634, + "step": 24787 + }, + { + "epoch": 0.75, + "learning_rate": 7.94911932897878e-07, + "loss": 1.2295, + "step": 24788 + }, + { + "epoch": 0.75, + "learning_rate": 7.947335575698839e-07, + "loss": 1.0454, + "step": 24789 + }, + { + "epoch": 0.75, + "learning_rate": 7.945551984752042e-07, + "loss": 1.1255, + "step": 24790 + }, + { + "epoch": 0.75, + "learning_rate": 7.943768556155379e-07, + "loss": 1.0123, + "step": 24791 + }, + { + "epoch": 0.75, + "learning_rate": 7.941985289925821e-07, + "loss": 1.1466, + "step": 24792 + }, + { + "epoch": 0.75, + "learning_rate": 7.940202186080359e-07, + "loss": 1.152, + "step": 24793 + }, + { + "epoch": 0.75, + "learning_rate": 7.938419244635947e-07, + "loss": 1.0667, + "step": 24794 + }, + { + "epoch": 0.75, + "learning_rate": 7.936636465609565e-07, + "loss": 1.1233, + "step": 24795 + }, + { + "epoch": 0.75, + "learning_rate": 7.934853849018188e-07, + "loss": 1.1295, + "step": 24796 + }, + { + "epoch": 0.75, + "learning_rate": 7.933071394878783e-07, + "loss": 0.9851, + "step": 24797 + }, + { + "epoch": 0.75, + "learning_rate": 7.931289103208326e-07, + "loss": 1.1967, + "step": 24798 + }, + { + "epoch": 0.75, + "learning_rate": 7.929506974023768e-07, + "loss": 1.1644, + "step": 24799 + }, + { + "epoch": 0.75, + "learning_rate": 7.927725007342082e-07, + "loss": 1.1538, + "step": 24800 + }, + { + "epoch": 0.75, + "learning_rate": 7.925943203180234e-07, + "loss": 1.2374, + "step": 24801 + }, + { + "epoch": 0.75, + "learning_rate": 7.92416156155518e-07, + "loss": 1.0988, + "step": 24802 + }, + { + "epoch": 0.75, + "learning_rate": 7.922380082483885e-07, + "loss": 1.0359, + "step": 24803 + }, + { + "epoch": 0.75, + "learning_rate": 7.920598765983309e-07, + "loss": 1.026, + "step": 24804 + }, + { + "epoch": 0.75, + "learning_rate": 7.918817612070406e-07, + "loss": 1.0751, + "step": 24805 + }, + { + "epoch": 0.75, + "learning_rate": 7.917036620762139e-07, + "loss": 1.0949, + "step": 24806 + }, + { + "epoch": 0.75, + "learning_rate": 7.915255792075449e-07, + "loss": 1.0595, + "step": 24807 + }, + { + "epoch": 0.75, + "learning_rate": 7.913475126027295e-07, + "loss": 1.0552, + "step": 24808 + }, + { + "epoch": 0.75, + "learning_rate": 7.91169462263463e-07, + "loss": 1.0448, + "step": 24809 + }, + { + "epoch": 0.75, + "learning_rate": 7.909914281914402e-07, + "loss": 1.1355, + "step": 24810 + }, + { + "epoch": 0.75, + "learning_rate": 7.908134103883566e-07, + "loss": 1.2018, + "step": 24811 + }, + { + "epoch": 0.75, + "learning_rate": 7.906354088559054e-07, + "loss": 1.1048, + "step": 24812 + }, + { + "epoch": 0.75, + "learning_rate": 7.904574235957821e-07, + "loss": 1.0656, + "step": 24813 + }, + { + "epoch": 0.75, + "learning_rate": 7.902794546096803e-07, + "loss": 1.0304, + "step": 24814 + }, + { + "epoch": 0.75, + "learning_rate": 7.901015018992958e-07, + "loss": 1.0623, + "step": 24815 + }, + { + "epoch": 0.75, + "learning_rate": 7.899235654663206e-07, + "loss": 1.1229, + "step": 24816 + }, + { + "epoch": 0.75, + "learning_rate": 7.897456453124497e-07, + "loss": 1.1682, + "step": 24817 + }, + { + "epoch": 0.75, + "learning_rate": 7.895677414393762e-07, + "loss": 1.1424, + "step": 24818 + }, + { + "epoch": 0.75, + "learning_rate": 7.893898538487948e-07, + "loss": 1.0054, + "step": 24819 + }, + { + "epoch": 0.75, + "learning_rate": 7.892119825423977e-07, + "loss": 1.0709, + "step": 24820 + }, + { + "epoch": 0.75, + "learning_rate": 7.890341275218783e-07, + "loss": 1.0952, + "step": 24821 + }, + { + "epoch": 0.75, + "learning_rate": 7.888562887889301e-07, + "loss": 1.0911, + "step": 24822 + }, + { + "epoch": 0.75, + "learning_rate": 7.88678466345246e-07, + "loss": 1.1238, + "step": 24823 + }, + { + "epoch": 0.75, + "learning_rate": 7.885006601925194e-07, + "loss": 1.0333, + "step": 24824 + }, + { + "epoch": 0.75, + "learning_rate": 7.883228703324414e-07, + "loss": 1.2443, + "step": 24825 + }, + { + "epoch": 0.75, + "learning_rate": 7.881450967667051e-07, + "loss": 1.0118, + "step": 24826 + }, + { + "epoch": 0.75, + "learning_rate": 7.879673394970034e-07, + "loss": 1.1, + "step": 24827 + }, + { + "epoch": 0.75, + "learning_rate": 7.877895985250286e-07, + "loss": 1.1361, + "step": 24828 + }, + { + "epoch": 0.75, + "learning_rate": 7.876118738524716e-07, + "loss": 1.1304, + "step": 24829 + }, + { + "epoch": 0.75, + "learning_rate": 7.874341654810247e-07, + "loss": 1.2027, + "step": 24830 + }, + { + "epoch": 0.75, + "learning_rate": 7.872564734123797e-07, + "loss": 1.0851, + "step": 24831 + }, + { + "epoch": 0.75, + "learning_rate": 7.870787976482283e-07, + "loss": 1.142, + "step": 24832 + }, + { + "epoch": 0.75, + "learning_rate": 7.869011381902616e-07, + "loss": 1.1089, + "step": 24833 + }, + { + "epoch": 0.75, + "learning_rate": 7.867234950401714e-07, + "loss": 1.0687, + "step": 24834 + }, + { + "epoch": 0.75, + "learning_rate": 7.86545868199648e-07, + "loss": 0.9752, + "step": 24835 + }, + { + "epoch": 0.75, + "learning_rate": 7.863682576703837e-07, + "loss": 1.2776, + "step": 24836 + }, + { + "epoch": 0.75, + "learning_rate": 7.861906634540676e-07, + "loss": 1.0105, + "step": 24837 + }, + { + "epoch": 0.75, + "learning_rate": 7.860130855523906e-07, + "loss": 1.2114, + "step": 24838 + }, + { + "epoch": 0.75, + "learning_rate": 7.858355239670437e-07, + "loss": 1.2103, + "step": 24839 + }, + { + "epoch": 0.75, + "learning_rate": 7.856579786997174e-07, + "loss": 1.1058, + "step": 24840 + }, + { + "epoch": 0.75, + "learning_rate": 7.854804497521018e-07, + "loss": 1.168, + "step": 24841 + }, + { + "epoch": 0.75, + "learning_rate": 7.85302937125886e-07, + "loss": 1.136, + "step": 24842 + }, + { + "epoch": 0.75, + "learning_rate": 7.851254408227604e-07, + "loss": 1.1005, + "step": 24843 + }, + { + "epoch": 0.75, + "learning_rate": 7.849479608444147e-07, + "loss": 1.1427, + "step": 24844 + }, + { + "epoch": 0.75, + "learning_rate": 7.847704971925391e-07, + "loss": 1.0336, + "step": 24845 + }, + { + "epoch": 0.75, + "learning_rate": 7.845930498688214e-07, + "loss": 1.1758, + "step": 24846 + }, + { + "epoch": 0.75, + "learning_rate": 7.844156188749519e-07, + "loss": 1.1436, + "step": 24847 + }, + { + "epoch": 0.75, + "learning_rate": 7.842382042126195e-07, + "loss": 1.1625, + "step": 24848 + }, + { + "epoch": 0.75, + "learning_rate": 7.840608058835139e-07, + "loss": 1.0709, + "step": 24849 + }, + { + "epoch": 0.75, + "learning_rate": 7.838834238893219e-07, + "loss": 1.0252, + "step": 24850 + }, + { + "epoch": 0.75, + "learning_rate": 7.837060582317336e-07, + "loss": 1.1369, + "step": 24851 + }, + { + "epoch": 0.75, + "learning_rate": 7.835287089124366e-07, + "loss": 1.0841, + "step": 24852 + }, + { + "epoch": 0.75, + "learning_rate": 7.833513759331199e-07, + "loss": 1.1033, + "step": 24853 + }, + { + "epoch": 0.75, + "learning_rate": 7.83174059295472e-07, + "loss": 1.2079, + "step": 24854 + }, + { + "epoch": 0.75, + "learning_rate": 7.829967590011794e-07, + "loss": 1.1799, + "step": 24855 + }, + { + "epoch": 0.75, + "learning_rate": 7.828194750519308e-07, + "loss": 1.1417, + "step": 24856 + }, + { + "epoch": 0.75, + "learning_rate": 7.826422074494139e-07, + "loss": 1.1572, + "step": 24857 + }, + { + "epoch": 0.75, + "learning_rate": 7.824649561953157e-07, + "loss": 1.2051, + "step": 24858 + }, + { + "epoch": 0.75, + "learning_rate": 7.822877212913243e-07, + "loss": 0.9704, + "step": 24859 + }, + { + "epoch": 0.75, + "learning_rate": 7.821105027391262e-07, + "loss": 1.0507, + "step": 24860 + }, + { + "epoch": 0.75, + "learning_rate": 7.819333005404089e-07, + "loss": 1.1336, + "step": 24861 + }, + { + "epoch": 0.75, + "learning_rate": 7.8175611469686e-07, + "loss": 1.0944, + "step": 24862 + }, + { + "epoch": 0.75, + "learning_rate": 7.815789452101647e-07, + "loss": 1.183, + "step": 24863 + }, + { + "epoch": 0.75, + "learning_rate": 7.814017920820099e-07, + "loss": 1.1011, + "step": 24864 + }, + { + "epoch": 0.75, + "learning_rate": 7.812246553140824e-07, + "loss": 1.0948, + "step": 24865 + }, + { + "epoch": 0.75, + "learning_rate": 7.810475349080684e-07, + "loss": 1.1147, + "step": 24866 + }, + { + "epoch": 0.75, + "learning_rate": 7.808704308656548e-07, + "loss": 1.1943, + "step": 24867 + }, + { + "epoch": 0.75, + "learning_rate": 7.806933431885261e-07, + "loss": 1.152, + "step": 24868 + }, + { + "epoch": 0.75, + "learning_rate": 7.805162718783684e-07, + "loss": 1.0581, + "step": 24869 + }, + { + "epoch": 0.75, + "learning_rate": 7.803392169368679e-07, + "loss": 1.183, + "step": 24870 + }, + { + "epoch": 0.75, + "learning_rate": 7.801621783657107e-07, + "loss": 1.1246, + "step": 24871 + }, + { + "epoch": 0.75, + "learning_rate": 7.799851561665802e-07, + "loss": 1.1357, + "step": 24872 + }, + { + "epoch": 0.75, + "learning_rate": 7.798081503411628e-07, + "loss": 1.0236, + "step": 24873 + }, + { + "epoch": 0.75, + "learning_rate": 7.796311608911433e-07, + "loss": 1.201, + "step": 24874 + }, + { + "epoch": 0.75, + "learning_rate": 7.794541878182074e-07, + "loss": 1.1196, + "step": 24875 + }, + { + "epoch": 0.75, + "learning_rate": 7.792772311240382e-07, + "loss": 1.052, + "step": 24876 + }, + { + "epoch": 0.75, + "learning_rate": 7.791002908103209e-07, + "loss": 1.1185, + "step": 24877 + }, + { + "epoch": 0.75, + "learning_rate": 7.789233668787402e-07, + "loss": 1.1141, + "step": 24878 + }, + { + "epoch": 0.75, + "learning_rate": 7.787464593309802e-07, + "loss": 1.0453, + "step": 24879 + }, + { + "epoch": 0.75, + "learning_rate": 7.785695681687256e-07, + "loss": 1.1324, + "step": 24880 + }, + { + "epoch": 0.75, + "learning_rate": 7.783926933936589e-07, + "loss": 1.1254, + "step": 24881 + }, + { + "epoch": 0.75, + "learning_rate": 7.782158350074646e-07, + "loss": 1.0955, + "step": 24882 + }, + { + "epoch": 0.75, + "learning_rate": 7.780389930118263e-07, + "loss": 1.0503, + "step": 24883 + }, + { + "epoch": 0.75, + "learning_rate": 7.778621674084275e-07, + "loss": 0.9386, + "step": 24884 + }, + { + "epoch": 0.75, + "learning_rate": 7.776853581989513e-07, + "loss": 1.1751, + "step": 24885 + }, + { + "epoch": 0.75, + "learning_rate": 7.775085653850811e-07, + "loss": 1.2206, + "step": 24886 + }, + { + "epoch": 0.75, + "learning_rate": 7.773317889684998e-07, + "loss": 1.1118, + "step": 24887 + }, + { + "epoch": 0.75, + "learning_rate": 7.771550289508908e-07, + "loss": 0.9788, + "step": 24888 + }, + { + "epoch": 0.75, + "learning_rate": 7.769782853339356e-07, + "loss": 1.0781, + "step": 24889 + }, + { + "epoch": 0.75, + "learning_rate": 7.768015581193173e-07, + "loss": 1.1593, + "step": 24890 + }, + { + "epoch": 0.75, + "learning_rate": 7.766248473087179e-07, + "loss": 1.0792, + "step": 24891 + }, + { + "epoch": 0.75, + "learning_rate": 7.764481529038203e-07, + "loss": 1.0192, + "step": 24892 + }, + { + "epoch": 0.75, + "learning_rate": 7.762714749063069e-07, + "loss": 1.1699, + "step": 24893 + }, + { + "epoch": 0.75, + "learning_rate": 7.760948133178581e-07, + "loss": 1.2204, + "step": 24894 + }, + { + "epoch": 0.75, + "learning_rate": 7.759181681401564e-07, + "loss": 1.1696, + "step": 24895 + }, + { + "epoch": 0.75, + "learning_rate": 7.757415393748835e-07, + "loss": 1.0314, + "step": 24896 + }, + { + "epoch": 0.75, + "learning_rate": 7.755649270237214e-07, + "loss": 1.0972, + "step": 24897 + }, + { + "epoch": 0.75, + "learning_rate": 7.753883310883498e-07, + "loss": 1.0564, + "step": 24898 + }, + { + "epoch": 0.75, + "learning_rate": 7.752117515704507e-07, + "loss": 1.062, + "step": 24899 + }, + { + "epoch": 0.75, + "learning_rate": 7.750351884717053e-07, + "loss": 1.2058, + "step": 24900 + }, + { + "epoch": 0.75, + "learning_rate": 7.748586417937948e-07, + "loss": 1.096, + "step": 24901 + }, + { + "epoch": 0.75, + "learning_rate": 7.746821115383982e-07, + "loss": 1.1099, + "step": 24902 + }, + { + "epoch": 0.75, + "learning_rate": 7.745055977071972e-07, + "loss": 1.0604, + "step": 24903 + }, + { + "epoch": 0.75, + "learning_rate": 7.743291003018716e-07, + "loss": 1.1945, + "step": 24904 + }, + { + "epoch": 0.75, + "learning_rate": 7.741526193241022e-07, + "loss": 1.0536, + "step": 24905 + }, + { + "epoch": 0.75, + "learning_rate": 7.739761547755692e-07, + "loss": 1.1153, + "step": 24906 + }, + { + "epoch": 0.75, + "learning_rate": 7.737997066579512e-07, + "loss": 1.2324, + "step": 24907 + }, + { + "epoch": 0.75, + "learning_rate": 7.736232749729287e-07, + "loss": 1.1049, + "step": 24908 + }, + { + "epoch": 0.75, + "learning_rate": 7.734468597221812e-07, + "loss": 0.9598, + "step": 24909 + }, + { + "epoch": 0.75, + "learning_rate": 7.732704609073885e-07, + "loss": 1.1047, + "step": 24910 + }, + { + "epoch": 0.75, + "learning_rate": 7.73094078530229e-07, + "loss": 1.1052, + "step": 24911 + }, + { + "epoch": 0.75, + "learning_rate": 7.72917712592382e-07, + "loss": 1.2242, + "step": 24912 + }, + { + "epoch": 0.75, + "learning_rate": 7.727413630955266e-07, + "loss": 1.046, + "step": 24913 + }, + { + "epoch": 0.75, + "learning_rate": 7.725650300413415e-07, + "loss": 1.053, + "step": 24914 + }, + { + "epoch": 0.75, + "learning_rate": 7.723887134315055e-07, + "loss": 1.0418, + "step": 24915 + }, + { + "epoch": 0.75, + "learning_rate": 7.722124132676967e-07, + "loss": 1.1447, + "step": 24916 + }, + { + "epoch": 0.75, + "learning_rate": 7.720361295515937e-07, + "loss": 1.1209, + "step": 24917 + }, + { + "epoch": 0.75, + "learning_rate": 7.718598622848747e-07, + "loss": 1.0554, + "step": 24918 + }, + { + "epoch": 0.75, + "learning_rate": 7.71683611469218e-07, + "loss": 1.2069, + "step": 24919 + }, + { + "epoch": 0.75, + "learning_rate": 7.715073771063003e-07, + "loss": 1.1453, + "step": 24920 + }, + { + "epoch": 0.75, + "learning_rate": 7.713311591977999e-07, + "loss": 1.0656, + "step": 24921 + }, + { + "epoch": 0.75, + "learning_rate": 7.711549577453945e-07, + "loss": 1.0496, + "step": 24922 + }, + { + "epoch": 0.75, + "learning_rate": 7.709787727507617e-07, + "loss": 1.1512, + "step": 24923 + }, + { + "epoch": 0.75, + "learning_rate": 7.708026042155775e-07, + "loss": 1.158, + "step": 24924 + }, + { + "epoch": 0.75, + "learning_rate": 7.706264521415199e-07, + "loss": 1.1022, + "step": 24925 + }, + { + "epoch": 0.75, + "learning_rate": 7.704503165302654e-07, + "loss": 1.1036, + "step": 24926 + }, + { + "epoch": 0.75, + "learning_rate": 7.702741973834918e-07, + "loss": 1.1066, + "step": 24927 + }, + { + "epoch": 0.75, + "learning_rate": 7.700980947028741e-07, + "loss": 1.1717, + "step": 24928 + }, + { + "epoch": 0.75, + "learning_rate": 7.699220084900891e-07, + "loss": 1.1087, + "step": 24929 + }, + { + "epoch": 0.75, + "learning_rate": 7.697459387468137e-07, + "loss": 1.1228, + "step": 24930 + }, + { + "epoch": 0.75, + "learning_rate": 7.695698854747232e-07, + "loss": 0.9747, + "step": 24931 + }, + { + "epoch": 0.75, + "learning_rate": 7.693938486754951e-07, + "loss": 1.0373, + "step": 24932 + }, + { + "epoch": 0.75, + "learning_rate": 7.692178283508034e-07, + "loss": 1.04, + "step": 24933 + }, + { + "epoch": 0.75, + "learning_rate": 7.690418245023241e-07, + "loss": 1.1186, + "step": 24934 + }, + { + "epoch": 0.75, + "learning_rate": 7.688658371317331e-07, + "loss": 1.0955, + "step": 24935 + }, + { + "epoch": 0.75, + "learning_rate": 7.686898662407064e-07, + "loss": 1.1151, + "step": 24936 + }, + { + "epoch": 0.75, + "learning_rate": 7.685139118309173e-07, + "loss": 1.2408, + "step": 24937 + }, + { + "epoch": 0.75, + "learning_rate": 7.683379739040422e-07, + "loss": 0.9514, + "step": 24938 + }, + { + "epoch": 0.75, + "learning_rate": 7.681620524617556e-07, + "loss": 1.1348, + "step": 24939 + }, + { + "epoch": 0.75, + "learning_rate": 7.679861475057319e-07, + "loss": 1.0197, + "step": 24940 + }, + { + "epoch": 0.75, + "learning_rate": 7.67810259037646e-07, + "loss": 1.0432, + "step": 24941 + }, + { + "epoch": 0.75, + "learning_rate": 7.676343870591723e-07, + "loss": 1.1106, + "step": 24942 + }, + { + "epoch": 0.75, + "learning_rate": 7.674585315719848e-07, + "loss": 1.181, + "step": 24943 + }, + { + "epoch": 0.75, + "learning_rate": 7.672826925777576e-07, + "loss": 1.1111, + "step": 24944 + }, + { + "epoch": 0.75, + "learning_rate": 7.671068700781655e-07, + "loss": 1.1812, + "step": 24945 + }, + { + "epoch": 0.75, + "learning_rate": 7.669310640748808e-07, + "loss": 1.152, + "step": 24946 + }, + { + "epoch": 0.75, + "learning_rate": 7.667552745695775e-07, + "loss": 1.0615, + "step": 24947 + }, + { + "epoch": 0.75, + "learning_rate": 7.665795015639293e-07, + "loss": 1.1146, + "step": 24948 + }, + { + "epoch": 0.75, + "learning_rate": 7.664037450596102e-07, + "loss": 1.1119, + "step": 24949 + }, + { + "epoch": 0.75, + "learning_rate": 7.662280050582916e-07, + "loss": 1.167, + "step": 24950 + }, + { + "epoch": 0.75, + "learning_rate": 7.660522815616475e-07, + "loss": 1.0126, + "step": 24951 + }, + { + "epoch": 0.75, + "learning_rate": 7.658765745713506e-07, + "loss": 1.0218, + "step": 24952 + }, + { + "epoch": 0.75, + "learning_rate": 7.657008840890743e-07, + "loss": 0.9902, + "step": 24953 + }, + { + "epoch": 0.75, + "learning_rate": 7.655252101164895e-07, + "loss": 1.2236, + "step": 24954 + }, + { + "epoch": 0.75, + "learning_rate": 7.653495526552693e-07, + "loss": 1.1389, + "step": 24955 + }, + { + "epoch": 0.75, + "learning_rate": 7.651739117070859e-07, + "loss": 1.1033, + "step": 24956 + }, + { + "epoch": 0.75, + "learning_rate": 7.649982872736115e-07, + "loss": 1.1358, + "step": 24957 + }, + { + "epoch": 0.75, + "learning_rate": 7.648226793565184e-07, + "loss": 1.0772, + "step": 24958 + }, + { + "epoch": 0.75, + "learning_rate": 7.646470879574771e-07, + "loss": 1.0408, + "step": 24959 + }, + { + "epoch": 0.75, + "learning_rate": 7.644715130781596e-07, + "loss": 1.0389, + "step": 24960 + }, + { + "epoch": 0.75, + "learning_rate": 7.642959547202375e-07, + "loss": 1.1245, + "step": 24961 + }, + { + "epoch": 0.75, + "learning_rate": 7.641204128853827e-07, + "loss": 1.2321, + "step": 24962 + }, + { + "epoch": 0.75, + "learning_rate": 7.639448875752647e-07, + "loss": 1.0616, + "step": 24963 + }, + { + "epoch": 0.75, + "learning_rate": 7.637693787915553e-07, + "loss": 1.0983, + "step": 24964 + }, + { + "epoch": 0.75, + "learning_rate": 7.635938865359255e-07, + "loss": 1.1172, + "step": 24965 + }, + { + "epoch": 0.75, + "learning_rate": 7.634184108100454e-07, + "loss": 1.0328, + "step": 24966 + }, + { + "epoch": 0.75, + "learning_rate": 7.632429516155856e-07, + "loss": 1.1804, + "step": 24967 + }, + { + "epoch": 0.75, + "learning_rate": 7.630675089542166e-07, + "loss": 1.1219, + "step": 24968 + }, + { + "epoch": 0.75, + "learning_rate": 7.628920828276082e-07, + "loss": 1.0021, + "step": 24969 + }, + { + "epoch": 0.75, + "learning_rate": 7.627166732374313e-07, + "loss": 1.0443, + "step": 24970 + }, + { + "epoch": 0.75, + "learning_rate": 7.625412801853543e-07, + "loss": 1.0828, + "step": 24971 + }, + { + "epoch": 0.75, + "learning_rate": 7.623659036730477e-07, + "loss": 1.0236, + "step": 24972 + }, + { + "epoch": 0.75, + "learning_rate": 7.621905437021807e-07, + "loss": 1.0523, + "step": 24973 + }, + { + "epoch": 0.75, + "learning_rate": 7.620152002744227e-07, + "loss": 1.1001, + "step": 24974 + }, + { + "epoch": 0.75, + "learning_rate": 7.618398733914436e-07, + "loss": 0.9911, + "step": 24975 + }, + { + "epoch": 0.75, + "learning_rate": 7.616645630549113e-07, + "loss": 1.1995, + "step": 24976 + }, + { + "epoch": 0.75, + "learning_rate": 7.61489269266495e-07, + "loss": 1.1721, + "step": 24977 + }, + { + "epoch": 0.75, + "learning_rate": 7.613139920278634e-07, + "loss": 0.9987, + "step": 24978 + }, + { + "epoch": 0.75, + "learning_rate": 7.611387313406862e-07, + "loss": 1.1116, + "step": 24979 + }, + { + "epoch": 0.75, + "learning_rate": 7.609634872066302e-07, + "loss": 1.2054, + "step": 24980 + }, + { + "epoch": 0.75, + "learning_rate": 7.607882596273639e-07, + "loss": 1.1457, + "step": 24981 + }, + { + "epoch": 0.75, + "learning_rate": 7.60613048604556e-07, + "loss": 1.1085, + "step": 24982 + }, + { + "epoch": 0.75, + "learning_rate": 7.604378541398738e-07, + "loss": 1.0492, + "step": 24983 + }, + { + "epoch": 0.75, + "learning_rate": 7.602626762349866e-07, + "loss": 0.9958, + "step": 24984 + }, + { + "epoch": 0.75, + "learning_rate": 7.600875148915598e-07, + "loss": 1.0657, + "step": 24985 + }, + { + "epoch": 0.75, + "learning_rate": 7.59912370111262e-07, + "loss": 1.2122, + "step": 24986 + }, + { + "epoch": 0.75, + "learning_rate": 7.597372418957605e-07, + "loss": 1.1119, + "step": 24987 + }, + { + "epoch": 0.75, + "learning_rate": 7.59562130246723e-07, + "loss": 1.1733, + "step": 24988 + }, + { + "epoch": 0.75, + "learning_rate": 7.593870351658147e-07, + "loss": 1.0695, + "step": 24989 + }, + { + "epoch": 0.75, + "learning_rate": 7.592119566547041e-07, + "loss": 1.0836, + "step": 24990 + }, + { + "epoch": 0.75, + "learning_rate": 7.59036894715057e-07, + "loss": 1.1548, + "step": 24991 + }, + { + "epoch": 0.75, + "learning_rate": 7.588618493485409e-07, + "loss": 1.2042, + "step": 24992 + }, + { + "epoch": 0.75, + "learning_rate": 7.586868205568207e-07, + "loss": 0.9882, + "step": 24993 + }, + { + "epoch": 0.75, + "learning_rate": 7.585118083415633e-07, + "loss": 1.02, + "step": 24994 + }, + { + "epoch": 0.75, + "learning_rate": 7.583368127044347e-07, + "loss": 1.0486, + "step": 24995 + }, + { + "epoch": 0.75, + "learning_rate": 7.581618336471008e-07, + "loss": 1.1329, + "step": 24996 + }, + { + "epoch": 0.75, + "learning_rate": 7.579868711712276e-07, + "loss": 1.1505, + "step": 24997 + }, + { + "epoch": 0.75, + "learning_rate": 7.578119252784802e-07, + "loss": 1.1121, + "step": 24998 + }, + { + "epoch": 0.75, + "learning_rate": 7.576369959705243e-07, + "loss": 1.0737, + "step": 24999 + }, + { + "epoch": 0.75, + "learning_rate": 7.574620832490251e-07, + "loss": 1.1586, + "step": 25000 + }, + { + "epoch": 0.75, + "learning_rate": 7.572871871156481e-07, + "loss": 1.1637, + "step": 25001 + }, + { + "epoch": 0.75, + "learning_rate": 7.571123075720573e-07, + "loss": 1.0022, + "step": 25002 + }, + { + "epoch": 0.75, + "learning_rate": 7.569374446199179e-07, + "loss": 1.0546, + "step": 25003 + }, + { + "epoch": 0.75, + "learning_rate": 7.567625982608945e-07, + "loss": 1.1211, + "step": 25004 + }, + { + "epoch": 0.75, + "learning_rate": 7.565877684966521e-07, + "loss": 1.2648, + "step": 25005 + }, + { + "epoch": 0.75, + "learning_rate": 7.56412955328854e-07, + "loss": 1.1445, + "step": 25006 + }, + { + "epoch": 0.75, + "learning_rate": 7.562381587591649e-07, + "loss": 1.1593, + "step": 25007 + }, + { + "epoch": 0.75, + "learning_rate": 7.560633787892486e-07, + "loss": 1.1064, + "step": 25008 + }, + { + "epoch": 0.75, + "learning_rate": 7.558886154207698e-07, + "loss": 1.0201, + "step": 25009 + }, + { + "epoch": 0.75, + "learning_rate": 7.557138686553905e-07, + "loss": 1.1274, + "step": 25010 + }, + { + "epoch": 0.75, + "learning_rate": 7.555391384947752e-07, + "loss": 1.163, + "step": 25011 + }, + { + "epoch": 0.75, + "learning_rate": 7.553644249405872e-07, + "loss": 1.0932, + "step": 25012 + }, + { + "epoch": 0.75, + "learning_rate": 7.551897279944895e-07, + "loss": 1.131, + "step": 25013 + }, + { + "epoch": 0.75, + "learning_rate": 7.550150476581461e-07, + "loss": 1.0451, + "step": 25014 + }, + { + "epoch": 0.75, + "learning_rate": 7.548403839332182e-07, + "loss": 1.1047, + "step": 25015 + }, + { + "epoch": 0.75, + "learning_rate": 7.546657368213695e-07, + "loss": 1.042, + "step": 25016 + }, + { + "epoch": 0.75, + "learning_rate": 7.544911063242622e-07, + "loss": 1.0703, + "step": 25017 + }, + { + "epoch": 0.75, + "learning_rate": 7.543164924435597e-07, + "loss": 1.1434, + "step": 25018 + }, + { + "epoch": 0.75, + "learning_rate": 7.541418951809229e-07, + "loss": 1.0213, + "step": 25019 + }, + { + "epoch": 0.75, + "learning_rate": 7.539673145380142e-07, + "loss": 1.0726, + "step": 25020 + }, + { + "epoch": 0.75, + "learning_rate": 7.537927505164958e-07, + "loss": 1.1401, + "step": 25021 + }, + { + "epoch": 0.75, + "learning_rate": 7.536182031180294e-07, + "loss": 1.0329, + "step": 25022 + }, + { + "epoch": 0.75, + "learning_rate": 7.534436723442767e-07, + "loss": 1.0901, + "step": 25023 + }, + { + "epoch": 0.75, + "learning_rate": 7.53269158196899e-07, + "loss": 1.0142, + "step": 25024 + }, + { + "epoch": 0.75, + "learning_rate": 7.530946606775577e-07, + "loss": 1.1311, + "step": 25025 + }, + { + "epoch": 0.75, + "learning_rate": 7.529201797879138e-07, + "loss": 1.1433, + "step": 25026 + }, + { + "epoch": 0.75, + "learning_rate": 7.527457155296292e-07, + "loss": 1.0941, + "step": 25027 + }, + { + "epoch": 0.75, + "learning_rate": 7.525712679043632e-07, + "loss": 1.0487, + "step": 25028 + }, + { + "epoch": 0.75, + "learning_rate": 7.523968369137771e-07, + "loss": 1.1367, + "step": 25029 + }, + { + "epoch": 0.75, + "learning_rate": 7.522224225595312e-07, + "loss": 1.1879, + "step": 25030 + }, + { + "epoch": 0.75, + "learning_rate": 7.52048024843287e-07, + "loss": 1.0931, + "step": 25031 + }, + { + "epoch": 0.75, + "learning_rate": 7.518736437667032e-07, + "loss": 1.1278, + "step": 25032 + }, + { + "epoch": 0.75, + "learning_rate": 7.516992793314401e-07, + "loss": 1.071, + "step": 25033 + }, + { + "epoch": 0.75, + "learning_rate": 7.515249315391582e-07, + "loss": 1.1661, + "step": 25034 + }, + { + "epoch": 0.75, + "learning_rate": 7.513506003915172e-07, + "loss": 1.0516, + "step": 25035 + }, + { + "epoch": 0.75, + "learning_rate": 7.511762858901758e-07, + "loss": 1.1275, + "step": 25036 + }, + { + "epoch": 0.75, + "learning_rate": 7.510019880367938e-07, + "loss": 1.1968, + "step": 25037 + }, + { + "epoch": 0.75, + "learning_rate": 7.508277068330305e-07, + "loss": 1.0926, + "step": 25038 + }, + { + "epoch": 0.75, + "learning_rate": 7.50653442280545e-07, + "loss": 1.027, + "step": 25039 + }, + { + "epoch": 0.75, + "learning_rate": 7.504791943809972e-07, + "loss": 0.9621, + "step": 25040 + }, + { + "epoch": 0.75, + "learning_rate": 7.50304963136044e-07, + "loss": 1.0947, + "step": 25041 + }, + { + "epoch": 0.75, + "learning_rate": 7.501307485473447e-07, + "loss": 1.1658, + "step": 25042 + }, + { + "epoch": 0.75, + "learning_rate": 7.499565506165579e-07, + "loss": 1.0768, + "step": 25043 + }, + { + "epoch": 0.75, + "learning_rate": 7.49782369345343e-07, + "loss": 0.8148, + "step": 25044 + }, + { + "epoch": 0.75, + "learning_rate": 7.496082047353559e-07, + "loss": 1.1536, + "step": 25045 + }, + { + "epoch": 0.75, + "learning_rate": 7.494340567882558e-07, + "loss": 0.9993, + "step": 25046 + }, + { + "epoch": 0.75, + "learning_rate": 7.492599255057003e-07, + "loss": 0.9699, + "step": 25047 + }, + { + "epoch": 0.75, + "learning_rate": 7.490858108893473e-07, + "loss": 1.0647, + "step": 25048 + }, + { + "epoch": 0.75, + "learning_rate": 7.489117129408541e-07, + "loss": 1.1519, + "step": 25049 + }, + { + "epoch": 0.75, + "learning_rate": 7.487376316618777e-07, + "loss": 1.0414, + "step": 25050 + }, + { + "epoch": 0.75, + "learning_rate": 7.485635670540759e-07, + "loss": 1.1286, + "step": 25051 + }, + { + "epoch": 0.75, + "learning_rate": 7.483895191191063e-07, + "loss": 1.1069, + "step": 25052 + }, + { + "epoch": 0.75, + "learning_rate": 7.48215487858624e-07, + "loss": 1.0842, + "step": 25053 + }, + { + "epoch": 0.75, + "learning_rate": 7.480414732742864e-07, + "loss": 1.0475, + "step": 25054 + }, + { + "epoch": 0.75, + "learning_rate": 7.478674753677503e-07, + "loss": 1.0565, + "step": 25055 + }, + { + "epoch": 0.75, + "learning_rate": 7.476934941406719e-07, + "loss": 1.1009, + "step": 25056 + }, + { + "epoch": 0.75, + "learning_rate": 7.475195295947086e-07, + "loss": 1.191, + "step": 25057 + }, + { + "epoch": 0.75, + "learning_rate": 7.473455817315143e-07, + "loss": 1.0286, + "step": 25058 + }, + { + "epoch": 0.75, + "learning_rate": 7.47171650552746e-07, + "loss": 1.1489, + "step": 25059 + }, + { + "epoch": 0.75, + "learning_rate": 7.469977360600595e-07, + "loss": 1.0952, + "step": 25060 + }, + { + "epoch": 0.75, + "learning_rate": 7.468238382551107e-07, + "loss": 1.12, + "step": 25061 + }, + { + "epoch": 0.75, + "learning_rate": 7.466499571395541e-07, + "loss": 1.0449, + "step": 25062 + }, + { + "epoch": 0.76, + "learning_rate": 7.464760927150455e-07, + "loss": 1.0712, + "step": 25063 + }, + { + "epoch": 0.76, + "learning_rate": 7.463022449832399e-07, + "loss": 1.082, + "step": 25064 + }, + { + "epoch": 0.76, + "learning_rate": 7.461284139457922e-07, + "loss": 0.9741, + "step": 25065 + }, + { + "epoch": 0.76, + "learning_rate": 7.459545996043582e-07, + "loss": 1.093, + "step": 25066 + }, + { + "epoch": 0.76, + "learning_rate": 7.457808019605911e-07, + "loss": 1.1259, + "step": 25067 + }, + { + "epoch": 0.76, + "learning_rate": 7.456070210161457e-07, + "loss": 1.0574, + "step": 25068 + }, + { + "epoch": 0.76, + "learning_rate": 7.454332567726763e-07, + "loss": 1.1185, + "step": 25069 + }, + { + "epoch": 0.76, + "learning_rate": 7.452595092318382e-07, + "loss": 1.0558, + "step": 25070 + }, + { + "epoch": 0.76, + "learning_rate": 7.450857783952839e-07, + "loss": 1.0732, + "step": 25071 + }, + { + "epoch": 0.76, + "learning_rate": 7.449120642646676e-07, + "loss": 1.1228, + "step": 25072 + }, + { + "epoch": 0.76, + "learning_rate": 7.44738366841643e-07, + "loss": 0.9308, + "step": 25073 + }, + { + "epoch": 0.76, + "learning_rate": 7.44564686127865e-07, + "loss": 1.0729, + "step": 25074 + }, + { + "epoch": 0.76, + "learning_rate": 7.443910221249844e-07, + "loss": 1.2286, + "step": 25075 + }, + { + "epoch": 0.76, + "learning_rate": 7.442173748346562e-07, + "loss": 1.0263, + "step": 25076 + }, + { + "epoch": 0.76, + "learning_rate": 7.440437442585327e-07, + "loss": 1.1606, + "step": 25077 + }, + { + "epoch": 0.76, + "learning_rate": 7.438701303982673e-07, + "loss": 1.0417, + "step": 25078 + }, + { + "epoch": 0.76, + "learning_rate": 7.436965332555124e-07, + "loss": 1.1358, + "step": 25079 + }, + { + "epoch": 0.76, + "learning_rate": 7.435229528319204e-07, + "loss": 1.1507, + "step": 25080 + }, + { + "epoch": 0.76, + "learning_rate": 7.433493891291443e-07, + "loss": 1.0723, + "step": 25081 + }, + { + "epoch": 0.76, + "learning_rate": 7.431758421488358e-07, + "loss": 1.1104, + "step": 25082 + }, + { + "epoch": 0.76, + "learning_rate": 7.430023118926479e-07, + "loss": 1.1275, + "step": 25083 + }, + { + "epoch": 0.76, + "learning_rate": 7.428287983622312e-07, + "loss": 1.1332, + "step": 25084 + }, + { + "epoch": 0.76, + "learning_rate": 7.426553015592378e-07, + "loss": 1.1539, + "step": 25085 + }, + { + "epoch": 0.76, + "learning_rate": 7.424818214853197e-07, + "loss": 1.1644, + "step": 25086 + }, + { + "epoch": 0.76, + "learning_rate": 7.42308358142129e-07, + "loss": 1.0713, + "step": 25087 + }, + { + "epoch": 0.76, + "learning_rate": 7.421349115313154e-07, + "loss": 1.0882, + "step": 25088 + }, + { + "epoch": 0.76, + "learning_rate": 7.419614816545309e-07, + "loss": 1.0635, + "step": 25089 + }, + { + "epoch": 0.76, + "learning_rate": 7.417880685134262e-07, + "loss": 1.1925, + "step": 25090 + }, + { + "epoch": 0.76, + "learning_rate": 7.416146721096526e-07, + "loss": 1.0105, + "step": 25091 + }, + { + "epoch": 0.76, + "learning_rate": 7.41441292444861e-07, + "loss": 1.2369, + "step": 25092 + }, + { + "epoch": 0.76, + "learning_rate": 7.412679295207006e-07, + "loss": 1.1505, + "step": 25093 + }, + { + "epoch": 0.76, + "learning_rate": 7.410945833388225e-07, + "loss": 1.1099, + "step": 25094 + }, + { + "epoch": 0.76, + "learning_rate": 7.40921253900877e-07, + "loss": 1.1065, + "step": 25095 + }, + { + "epoch": 0.76, + "learning_rate": 7.407479412085144e-07, + "loss": 1.1423, + "step": 25096 + }, + { + "epoch": 0.76, + "learning_rate": 7.405746452633836e-07, + "loss": 1.0788, + "step": 25097 + }, + { + "epoch": 0.76, + "learning_rate": 7.404013660671347e-07, + "loss": 1.0241, + "step": 25098 + }, + { + "epoch": 0.76, + "learning_rate": 7.402281036214174e-07, + "loss": 1.2057, + "step": 25099 + }, + { + "epoch": 0.76, + "learning_rate": 7.400548579278819e-07, + "loss": 1.1729, + "step": 25100 + }, + { + "epoch": 0.76, + "learning_rate": 7.398816289881755e-07, + "loss": 1.069, + "step": 25101 + }, + { + "epoch": 0.76, + "learning_rate": 7.397084168039484e-07, + "loss": 1.0577, + "step": 25102 + }, + { + "epoch": 0.76, + "learning_rate": 7.395352213768495e-07, + "loss": 0.9996, + "step": 25103 + }, + { + "epoch": 0.76, + "learning_rate": 7.393620427085271e-07, + "loss": 1.1286, + "step": 25104 + }, + { + "epoch": 0.76, + "learning_rate": 7.391888808006306e-07, + "loss": 1.1636, + "step": 25105 + }, + { + "epoch": 0.76, + "learning_rate": 7.390157356548074e-07, + "loss": 1.2307, + "step": 25106 + }, + { + "epoch": 0.76, + "learning_rate": 7.388426072727067e-07, + "loss": 1.1257, + "step": 25107 + }, + { + "epoch": 0.76, + "learning_rate": 7.386694956559759e-07, + "loss": 1.2163, + "step": 25108 + }, + { + "epoch": 0.76, + "learning_rate": 7.384964008062643e-07, + "loss": 1.0378, + "step": 25109 + }, + { + "epoch": 0.76, + "learning_rate": 7.383233227252176e-07, + "loss": 0.9921, + "step": 25110 + }, + { + "epoch": 0.76, + "learning_rate": 7.381502614144842e-07, + "loss": 1.1212, + "step": 25111 + }, + { + "epoch": 0.76, + "learning_rate": 7.379772168757121e-07, + "loss": 1.2079, + "step": 25112 + }, + { + "epoch": 0.76, + "learning_rate": 7.378041891105489e-07, + "loss": 1.0554, + "step": 25113 + }, + { + "epoch": 0.76, + "learning_rate": 7.376311781206405e-07, + "loss": 1.1669, + "step": 25114 + }, + { + "epoch": 0.76, + "learning_rate": 7.374581839076344e-07, + "loss": 1.1356, + "step": 25115 + }, + { + "epoch": 0.76, + "learning_rate": 7.372852064731775e-07, + "loss": 1.1002, + "step": 25116 + }, + { + "epoch": 0.76, + "learning_rate": 7.371122458189165e-07, + "loss": 1.1138, + "step": 25117 + }, + { + "epoch": 0.76, + "learning_rate": 7.369393019464988e-07, + "loss": 1.1681, + "step": 25118 + }, + { + "epoch": 0.76, + "learning_rate": 7.367663748575687e-07, + "loss": 1.0128, + "step": 25119 + }, + { + "epoch": 0.76, + "learning_rate": 7.365934645537737e-07, + "loss": 1.1248, + "step": 25120 + }, + { + "epoch": 0.76, + "learning_rate": 7.364205710367598e-07, + "loss": 1.127, + "step": 25121 + }, + { + "epoch": 0.76, + "learning_rate": 7.362476943081734e-07, + "loss": 0.9953, + "step": 25122 + }, + { + "epoch": 0.76, + "learning_rate": 7.360748343696586e-07, + "loss": 1.0829, + "step": 25123 + }, + { + "epoch": 0.76, + "learning_rate": 7.359019912228618e-07, + "loss": 1.1816, + "step": 25124 + }, + { + "epoch": 0.76, + "learning_rate": 7.357291648694284e-07, + "loss": 1.2406, + "step": 25125 + }, + { + "epoch": 0.76, + "learning_rate": 7.355563553110045e-07, + "loss": 1.0854, + "step": 25126 + }, + { + "epoch": 0.76, + "learning_rate": 7.353835625492337e-07, + "loss": 1.0975, + "step": 25127 + }, + { + "epoch": 0.76, + "learning_rate": 7.352107865857613e-07, + "loss": 1.0853, + "step": 25128 + }, + { + "epoch": 0.76, + "learning_rate": 7.350380274222324e-07, + "loss": 1.1816, + "step": 25129 + }, + { + "epoch": 0.76, + "learning_rate": 7.348652850602914e-07, + "loss": 1.1888, + "step": 25130 + }, + { + "epoch": 0.76, + "learning_rate": 7.346925595015828e-07, + "loss": 1.095, + "step": 25131 + }, + { + "epoch": 0.76, + "learning_rate": 7.345198507477508e-07, + "loss": 1.0153, + "step": 25132 + }, + { + "epoch": 0.76, + "learning_rate": 7.343471588004394e-07, + "loss": 1.084, + "step": 25133 + }, + { + "epoch": 0.76, + "learning_rate": 7.34174483661293e-07, + "loss": 0.98, + "step": 25134 + }, + { + "epoch": 0.76, + "learning_rate": 7.340018253319555e-07, + "loss": 1.1421, + "step": 25135 + }, + { + "epoch": 0.76, + "learning_rate": 7.338291838140695e-07, + "loss": 1.1507, + "step": 25136 + }, + { + "epoch": 0.76, + "learning_rate": 7.336565591092789e-07, + "loss": 1.0992, + "step": 25137 + }, + { + "epoch": 0.76, + "learning_rate": 7.334839512192273e-07, + "loss": 1.2504, + "step": 25138 + }, + { + "epoch": 0.76, + "learning_rate": 7.333113601455585e-07, + "loss": 1.0394, + "step": 25139 + }, + { + "epoch": 0.76, + "learning_rate": 7.331387858899139e-07, + "loss": 1.049, + "step": 25140 + }, + { + "epoch": 0.76, + "learning_rate": 7.329662284539371e-07, + "loss": 1.0626, + "step": 25141 + }, + { + "epoch": 0.76, + "learning_rate": 7.327936878392708e-07, + "loss": 1.1845, + "step": 25142 + }, + { + "epoch": 0.76, + "learning_rate": 7.326211640475572e-07, + "loss": 1.1639, + "step": 25143 + }, + { + "epoch": 0.76, + "learning_rate": 7.324486570804401e-07, + "loss": 1.0626, + "step": 25144 + }, + { + "epoch": 0.76, + "learning_rate": 7.322761669395594e-07, + "loss": 1.0649, + "step": 25145 + }, + { + "epoch": 0.76, + "learning_rate": 7.321036936265585e-07, + "loss": 1.1466, + "step": 25146 + }, + { + "epoch": 0.76, + "learning_rate": 7.31931237143079e-07, + "loss": 0.9446, + "step": 25147 + }, + { + "epoch": 0.76, + "learning_rate": 7.31758797490763e-07, + "loss": 1.0657, + "step": 25148 + }, + { + "epoch": 0.76, + "learning_rate": 7.315863746712512e-07, + "loss": 1.1407, + "step": 25149 + }, + { + "epoch": 0.76, + "learning_rate": 7.314139686861852e-07, + "loss": 0.8801, + "step": 25150 + }, + { + "epoch": 0.76, + "learning_rate": 7.312415795372065e-07, + "loss": 1.0413, + "step": 25151 + }, + { + "epoch": 0.76, + "learning_rate": 7.31069207225957e-07, + "loss": 1.0671, + "step": 25152 + }, + { + "epoch": 0.76, + "learning_rate": 7.308968517540757e-07, + "loss": 0.986, + "step": 25153 + }, + { + "epoch": 0.76, + "learning_rate": 7.307245131232047e-07, + "loss": 1.0814, + "step": 25154 + }, + { + "epoch": 0.76, + "learning_rate": 7.305521913349839e-07, + "loss": 1.2462, + "step": 25155 + }, + { + "epoch": 0.76, + "learning_rate": 7.303798863910542e-07, + "loss": 1.1226, + "step": 25156 + }, + { + "epoch": 0.76, + "learning_rate": 7.302075982930562e-07, + "loss": 1.1348, + "step": 25157 + }, + { + "epoch": 0.76, + "learning_rate": 7.300353270426292e-07, + "loss": 1.093, + "step": 25158 + }, + { + "epoch": 0.76, + "learning_rate": 7.29863072641413e-07, + "loss": 1.197, + "step": 25159 + }, + { + "epoch": 0.76, + "learning_rate": 7.296908350910481e-07, + "loss": 1.1575, + "step": 25160 + }, + { + "epoch": 0.76, + "learning_rate": 7.295186143931738e-07, + "loss": 1.0059, + "step": 25161 + }, + { + "epoch": 0.76, + "learning_rate": 7.293464105494294e-07, + "loss": 1.1032, + "step": 25162 + }, + { + "epoch": 0.76, + "learning_rate": 7.291742235614547e-07, + "loss": 1.0034, + "step": 25163 + }, + { + "epoch": 0.76, + "learning_rate": 7.290020534308884e-07, + "loss": 1.1169, + "step": 25164 + }, + { + "epoch": 0.76, + "learning_rate": 7.288299001593702e-07, + "loss": 1.1741, + "step": 25165 + }, + { + "epoch": 0.76, + "learning_rate": 7.286577637485378e-07, + "loss": 0.9876, + "step": 25166 + }, + { + "epoch": 0.76, + "learning_rate": 7.284856442000301e-07, + "loss": 1.0972, + "step": 25167 + }, + { + "epoch": 0.76, + "learning_rate": 7.283135415154863e-07, + "loss": 1.2152, + "step": 25168 + }, + { + "epoch": 0.76, + "learning_rate": 7.281414556965441e-07, + "loss": 1.1041, + "step": 25169 + }, + { + "epoch": 0.76, + "learning_rate": 7.279693867448426e-07, + "loss": 1.0753, + "step": 25170 + }, + { + "epoch": 0.76, + "learning_rate": 7.277973346620182e-07, + "loss": 1.0982, + "step": 25171 + }, + { + "epoch": 0.76, + "learning_rate": 7.276252994497099e-07, + "loss": 1.0354, + "step": 25172 + }, + { + "epoch": 0.76, + "learning_rate": 7.27453281109555e-07, + "loss": 1.0811, + "step": 25173 + }, + { + "epoch": 0.76, + "learning_rate": 7.272812796431922e-07, + "loss": 1.0165, + "step": 25174 + }, + { + "epoch": 0.76, + "learning_rate": 7.271092950522568e-07, + "loss": 1.0898, + "step": 25175 + }, + { + "epoch": 0.76, + "learning_rate": 7.26937327338387e-07, + "loss": 1.0942, + "step": 25176 + }, + { + "epoch": 0.76, + "learning_rate": 7.267653765032201e-07, + "loss": 1.1525, + "step": 25177 + }, + { + "epoch": 0.76, + "learning_rate": 7.265934425483937e-07, + "loss": 1.1163, + "step": 25178 + }, + { + "epoch": 0.76, + "learning_rate": 7.264215254755425e-07, + "loss": 1.0231, + "step": 25179 + }, + { + "epoch": 0.76, + "learning_rate": 7.262496252863044e-07, + "loss": 1.2583, + "step": 25180 + }, + { + "epoch": 0.76, + "learning_rate": 7.260777419823156e-07, + "loss": 1.3821, + "step": 25181 + }, + { + "epoch": 0.76, + "learning_rate": 7.259058755652123e-07, + "loss": 1.203, + "step": 25182 + }, + { + "epoch": 0.76, + "learning_rate": 7.257340260366314e-07, + "loss": 0.9813, + "step": 25183 + }, + { + "epoch": 0.76, + "learning_rate": 7.255621933982074e-07, + "loss": 1.0984, + "step": 25184 + }, + { + "epoch": 0.76, + "learning_rate": 7.253903776515764e-07, + "loss": 1.2005, + "step": 25185 + }, + { + "epoch": 0.76, + "learning_rate": 7.252185787983745e-07, + "loss": 1.2299, + "step": 25186 + }, + { + "epoch": 0.76, + "learning_rate": 7.250467968402372e-07, + "loss": 1.1332, + "step": 25187 + }, + { + "epoch": 0.76, + "learning_rate": 7.248750317787992e-07, + "loss": 1.1008, + "step": 25188 + }, + { + "epoch": 0.76, + "learning_rate": 7.247032836156961e-07, + "loss": 1.181, + "step": 25189 + }, + { + "epoch": 0.76, + "learning_rate": 7.245315523525629e-07, + "loss": 1.0833, + "step": 25190 + }, + { + "epoch": 0.76, + "learning_rate": 7.243598379910349e-07, + "loss": 1.0554, + "step": 25191 + }, + { + "epoch": 0.76, + "learning_rate": 7.241881405327452e-07, + "loss": 1.1406, + "step": 25192 + }, + { + "epoch": 0.76, + "learning_rate": 7.240164599793292e-07, + "loss": 1.2582, + "step": 25193 + }, + { + "epoch": 0.76, + "learning_rate": 7.238447963324211e-07, + "loss": 1.0358, + "step": 25194 + }, + { + "epoch": 0.76, + "learning_rate": 7.236731495936558e-07, + "loss": 1.1735, + "step": 25195 + }, + { + "epoch": 0.76, + "learning_rate": 7.235015197646661e-07, + "loss": 1.1197, + "step": 25196 + }, + { + "epoch": 0.76, + "learning_rate": 7.233299068470862e-07, + "loss": 1.0804, + "step": 25197 + }, + { + "epoch": 0.76, + "learning_rate": 7.231583108425499e-07, + "loss": 1.1007, + "step": 25198 + }, + { + "epoch": 0.76, + "learning_rate": 7.229867317526907e-07, + "loss": 1.2651, + "step": 25199 + }, + { + "epoch": 0.76, + "learning_rate": 7.228151695791427e-07, + "loss": 1.1578, + "step": 25200 + }, + { + "epoch": 0.76, + "learning_rate": 7.226436243235377e-07, + "loss": 1.0679, + "step": 25201 + }, + { + "epoch": 0.76, + "learning_rate": 7.224720959875095e-07, + "loss": 1.1376, + "step": 25202 + }, + { + "epoch": 0.76, + "learning_rate": 7.223005845726908e-07, + "loss": 1.0665, + "step": 25203 + }, + { + "epoch": 0.76, + "learning_rate": 7.221290900807148e-07, + "loss": 1.1171, + "step": 25204 + }, + { + "epoch": 0.76, + "learning_rate": 7.219576125132132e-07, + "loss": 1.2402, + "step": 25205 + }, + { + "epoch": 0.76, + "learning_rate": 7.217861518718189e-07, + "loss": 1.1218, + "step": 25206 + }, + { + "epoch": 0.76, + "learning_rate": 7.216147081581637e-07, + "loss": 1.0962, + "step": 25207 + }, + { + "epoch": 0.76, + "learning_rate": 7.214432813738808e-07, + "loss": 1.11, + "step": 25208 + }, + { + "epoch": 0.76, + "learning_rate": 7.212718715206008e-07, + "loss": 1.1891, + "step": 25209 + }, + { + "epoch": 0.76, + "learning_rate": 7.211004785999557e-07, + "loss": 1.0124, + "step": 25210 + }, + { + "epoch": 0.76, + "learning_rate": 7.20929102613577e-07, + "loss": 1.1023, + "step": 25211 + }, + { + "epoch": 0.76, + "learning_rate": 7.207577435630969e-07, + "loss": 1.1013, + "step": 25212 + }, + { + "epoch": 0.76, + "learning_rate": 7.20586401450146e-07, + "loss": 1.142, + "step": 25213 + }, + { + "epoch": 0.76, + "learning_rate": 7.204150762763554e-07, + "loss": 1.1627, + "step": 25214 + }, + { + "epoch": 0.76, + "learning_rate": 7.202437680433563e-07, + "loss": 1.0724, + "step": 25215 + }, + { + "epoch": 0.76, + "learning_rate": 7.200724767527795e-07, + "loss": 1.0235, + "step": 25216 + }, + { + "epoch": 0.76, + "learning_rate": 7.19901202406256e-07, + "loss": 1.0795, + "step": 25217 + }, + { + "epoch": 0.76, + "learning_rate": 7.197299450054151e-07, + "loss": 1.109, + "step": 25218 + }, + { + "epoch": 0.76, + "learning_rate": 7.195587045518879e-07, + "loss": 1.0911, + "step": 25219 + }, + { + "epoch": 0.76, + "learning_rate": 7.193874810473042e-07, + "loss": 1.1194, + "step": 25220 + }, + { + "epoch": 0.76, + "learning_rate": 7.192162744932948e-07, + "loss": 1.0822, + "step": 25221 + }, + { + "epoch": 0.76, + "learning_rate": 7.190450848914882e-07, + "loss": 1.1883, + "step": 25222 + }, + { + "epoch": 0.76, + "learning_rate": 7.188739122435143e-07, + "loss": 1.0734, + "step": 25223 + }, + { + "epoch": 0.76, + "learning_rate": 7.187027565510032e-07, + "loss": 0.9891, + "step": 25224 + }, + { + "epoch": 0.76, + "learning_rate": 7.185316178155841e-07, + "loss": 1.1508, + "step": 25225 + }, + { + "epoch": 0.76, + "learning_rate": 7.183604960388866e-07, + "loss": 1.1083, + "step": 25226 + }, + { + "epoch": 0.76, + "learning_rate": 7.181893912225382e-07, + "loss": 1.028, + "step": 25227 + }, + { + "epoch": 0.76, + "learning_rate": 7.18018303368169e-07, + "loss": 0.9927, + "step": 25228 + }, + { + "epoch": 0.76, + "learning_rate": 7.178472324774069e-07, + "loss": 1.0609, + "step": 25229 + }, + { + "epoch": 0.76, + "learning_rate": 7.176761785518818e-07, + "loss": 1.1595, + "step": 25230 + }, + { + "epoch": 0.76, + "learning_rate": 7.175051415932205e-07, + "loss": 1.1263, + "step": 25231 + }, + { + "epoch": 0.76, + "learning_rate": 7.173341216030516e-07, + "loss": 1.1317, + "step": 25232 + }, + { + "epoch": 0.76, + "learning_rate": 7.171631185830033e-07, + "loss": 1.024, + "step": 25233 + }, + { + "epoch": 0.76, + "learning_rate": 7.169921325347043e-07, + "loss": 1.0402, + "step": 25234 + }, + { + "epoch": 0.76, + "learning_rate": 7.168211634597805e-07, + "loss": 1.0671, + "step": 25235 + }, + { + "epoch": 0.76, + "learning_rate": 7.166502113598605e-07, + "loss": 1.2133, + "step": 25236 + }, + { + "epoch": 0.76, + "learning_rate": 7.164792762365719e-07, + "loss": 1.2356, + "step": 25237 + }, + { + "epoch": 0.76, + "learning_rate": 7.163083580915415e-07, + "loss": 1.1457, + "step": 25238 + }, + { + "epoch": 0.76, + "learning_rate": 7.161374569263968e-07, + "loss": 1.0732, + "step": 25239 + }, + { + "epoch": 0.76, + "learning_rate": 7.159665727427639e-07, + "loss": 1.0126, + "step": 25240 + }, + { + "epoch": 0.76, + "learning_rate": 7.157957055422702e-07, + "loss": 1.24, + "step": 25241 + }, + { + "epoch": 0.76, + "learning_rate": 7.156248553265418e-07, + "loss": 1.0686, + "step": 25242 + }, + { + "epoch": 0.76, + "learning_rate": 7.154540220972057e-07, + "loss": 1.0547, + "step": 25243 + }, + { + "epoch": 0.76, + "learning_rate": 7.152832058558875e-07, + "loss": 1.1888, + "step": 25244 + }, + { + "epoch": 0.76, + "learning_rate": 7.15112406604214e-07, + "loss": 1.1873, + "step": 25245 + }, + { + "epoch": 0.76, + "learning_rate": 7.149416243438104e-07, + "loss": 1.0382, + "step": 25246 + }, + { + "epoch": 0.76, + "learning_rate": 7.147708590763036e-07, + "loss": 1.0808, + "step": 25247 + }, + { + "epoch": 0.76, + "learning_rate": 7.146001108033179e-07, + "loss": 1.2218, + "step": 25248 + }, + { + "epoch": 0.76, + "learning_rate": 7.144293795264792e-07, + "loss": 1.1727, + "step": 25249 + }, + { + "epoch": 0.76, + "learning_rate": 7.142586652474129e-07, + "loss": 1.086, + "step": 25250 + }, + { + "epoch": 0.76, + "learning_rate": 7.14087967967744e-07, + "loss": 1.1365, + "step": 25251 + }, + { + "epoch": 0.76, + "learning_rate": 7.139172876890981e-07, + "loss": 1.1649, + "step": 25252 + }, + { + "epoch": 0.76, + "learning_rate": 7.137466244130989e-07, + "loss": 1.0543, + "step": 25253 + }, + { + "epoch": 0.76, + "learning_rate": 7.135759781413714e-07, + "loss": 1.0673, + "step": 25254 + }, + { + "epoch": 0.76, + "learning_rate": 7.134053488755402e-07, + "loss": 0.9185, + "step": 25255 + }, + { + "epoch": 0.76, + "learning_rate": 7.132347366172304e-07, + "loss": 1.1273, + "step": 25256 + }, + { + "epoch": 0.76, + "learning_rate": 7.130641413680648e-07, + "loss": 1.0179, + "step": 25257 + }, + { + "epoch": 0.76, + "learning_rate": 7.128935631296676e-07, + "loss": 0.9818, + "step": 25258 + }, + { + "epoch": 0.76, + "learning_rate": 7.127230019036635e-07, + "loss": 0.9666, + "step": 25259 + }, + { + "epoch": 0.76, + "learning_rate": 7.12552457691676e-07, + "loss": 0.9681, + "step": 25260 + }, + { + "epoch": 0.76, + "learning_rate": 7.123819304953275e-07, + "loss": 1.1575, + "step": 25261 + }, + { + "epoch": 0.76, + "learning_rate": 7.122114203162423e-07, + "loss": 1.118, + "step": 25262 + }, + { + "epoch": 0.76, + "learning_rate": 7.12040927156043e-07, + "loss": 1.0901, + "step": 25263 + }, + { + "epoch": 0.76, + "learning_rate": 7.118704510163532e-07, + "loss": 1.0608, + "step": 25264 + }, + { + "epoch": 0.76, + "learning_rate": 7.116999918987963e-07, + "loss": 1.0417, + "step": 25265 + }, + { + "epoch": 0.76, + "learning_rate": 7.115295498049935e-07, + "loss": 1.1707, + "step": 25266 + }, + { + "epoch": 0.76, + "learning_rate": 7.113591247365678e-07, + "loss": 1.1646, + "step": 25267 + }, + { + "epoch": 0.76, + "learning_rate": 7.11188716695142e-07, + "loss": 1.2566, + "step": 25268 + }, + { + "epoch": 0.76, + "learning_rate": 7.11018325682338e-07, + "loss": 1.1605, + "step": 25269 + }, + { + "epoch": 0.76, + "learning_rate": 7.10847951699778e-07, + "loss": 1.1688, + "step": 25270 + }, + { + "epoch": 0.76, + "learning_rate": 7.106775947490835e-07, + "loss": 1.1282, + "step": 25271 + }, + { + "epoch": 0.76, + "learning_rate": 7.10507254831877e-07, + "loss": 1.0486, + "step": 25272 + }, + { + "epoch": 0.76, + "learning_rate": 7.1033693194978e-07, + "loss": 1.1074, + "step": 25273 + }, + { + "epoch": 0.76, + "learning_rate": 7.10166626104413e-07, + "loss": 1.1213, + "step": 25274 + }, + { + "epoch": 0.76, + "learning_rate": 7.099963372973975e-07, + "loss": 1.0876, + "step": 25275 + }, + { + "epoch": 0.76, + "learning_rate": 7.098260655303549e-07, + "loss": 1.1597, + "step": 25276 + }, + { + "epoch": 0.76, + "learning_rate": 7.096558108049056e-07, + "loss": 1.0588, + "step": 25277 + }, + { + "epoch": 0.76, + "learning_rate": 7.094855731226719e-07, + "loss": 1.0157, + "step": 25278 + }, + { + "epoch": 0.76, + "learning_rate": 7.093153524852725e-07, + "loss": 1.1899, + "step": 25279 + }, + { + "epoch": 0.76, + "learning_rate": 7.091451488943282e-07, + "loss": 1.2072, + "step": 25280 + }, + { + "epoch": 0.76, + "learning_rate": 7.089749623514597e-07, + "loss": 1.2053, + "step": 25281 + }, + { + "epoch": 0.76, + "learning_rate": 7.088047928582878e-07, + "loss": 1.075, + "step": 25282 + }, + { + "epoch": 0.76, + "learning_rate": 7.086346404164307e-07, + "loss": 1.2008, + "step": 25283 + }, + { + "epoch": 0.76, + "learning_rate": 7.084645050275094e-07, + "loss": 1.0199, + "step": 25284 + }, + { + "epoch": 0.76, + "learning_rate": 7.082943866931428e-07, + "loss": 1.1638, + "step": 25285 + }, + { + "epoch": 0.76, + "learning_rate": 7.081242854149517e-07, + "loss": 1.1849, + "step": 25286 + }, + { + "epoch": 0.76, + "learning_rate": 7.079542011945536e-07, + "loss": 1.195, + "step": 25287 + }, + { + "epoch": 0.76, + "learning_rate": 7.077841340335684e-07, + "loss": 1.0922, + "step": 25288 + }, + { + "epoch": 0.76, + "learning_rate": 7.076140839336151e-07, + "loss": 1.1291, + "step": 25289 + }, + { + "epoch": 0.76, + "learning_rate": 7.074440508963124e-07, + "loss": 1.0145, + "step": 25290 + }, + { + "epoch": 0.76, + "learning_rate": 7.072740349232798e-07, + "loss": 1.0622, + "step": 25291 + }, + { + "epoch": 0.76, + "learning_rate": 7.071040360161344e-07, + "loss": 1.234, + "step": 25292 + }, + { + "epoch": 0.76, + "learning_rate": 7.069340541764949e-07, + "loss": 1.0767, + "step": 25293 + }, + { + "epoch": 0.76, + "learning_rate": 7.067640894059796e-07, + "loss": 1.1444, + "step": 25294 + }, + { + "epoch": 0.76, + "learning_rate": 7.065941417062067e-07, + "loss": 1.171, + "step": 25295 + }, + { + "epoch": 0.76, + "learning_rate": 7.064242110787936e-07, + "loss": 1.1671, + "step": 25296 + }, + { + "epoch": 0.76, + "learning_rate": 7.062542975253584e-07, + "loss": 1.0009, + "step": 25297 + }, + { + "epoch": 0.76, + "learning_rate": 7.060844010475182e-07, + "loss": 1.1837, + "step": 25298 + }, + { + "epoch": 0.76, + "learning_rate": 7.059145216468916e-07, + "loss": 1.182, + "step": 25299 + }, + { + "epoch": 0.76, + "learning_rate": 7.057446593250936e-07, + "loss": 1.252, + "step": 25300 + }, + { + "epoch": 0.76, + "learning_rate": 7.055748140837426e-07, + "loss": 1.0511, + "step": 25301 + }, + { + "epoch": 0.76, + "learning_rate": 7.05404985924455e-07, + "loss": 1.0659, + "step": 25302 + }, + { + "epoch": 0.76, + "learning_rate": 7.052351748488476e-07, + "loss": 1.0865, + "step": 25303 + }, + { + "epoch": 0.76, + "learning_rate": 7.050653808585376e-07, + "loss": 1.2487, + "step": 25304 + }, + { + "epoch": 0.76, + "learning_rate": 7.048956039551399e-07, + "loss": 1.1722, + "step": 25305 + }, + { + "epoch": 0.76, + "learning_rate": 7.047258441402719e-07, + "loss": 1.0139, + "step": 25306 + }, + { + "epoch": 0.76, + "learning_rate": 7.045561014155489e-07, + "loss": 1.0762, + "step": 25307 + }, + { + "epoch": 0.76, + "learning_rate": 7.04386375782588e-07, + "loss": 1.0172, + "step": 25308 + }, + { + "epoch": 0.76, + "learning_rate": 7.042166672430031e-07, + "loss": 1.0548, + "step": 25309 + }, + { + "epoch": 0.76, + "learning_rate": 7.040469757984108e-07, + "loss": 1.1067, + "step": 25310 + }, + { + "epoch": 0.76, + "learning_rate": 7.038773014504264e-07, + "loss": 1.2003, + "step": 25311 + }, + { + "epoch": 0.76, + "learning_rate": 7.037076442006654e-07, + "loss": 1.0496, + "step": 25312 + }, + { + "epoch": 0.76, + "learning_rate": 7.035380040507423e-07, + "loss": 1.1248, + "step": 25313 + }, + { + "epoch": 0.76, + "learning_rate": 7.033683810022718e-07, + "loss": 1.0938, + "step": 25314 + }, + { + "epoch": 0.76, + "learning_rate": 7.031987750568692e-07, + "loss": 1.0455, + "step": 25315 + }, + { + "epoch": 0.76, + "learning_rate": 7.030291862161487e-07, + "loss": 1.1952, + "step": 25316 + }, + { + "epoch": 0.76, + "learning_rate": 7.02859614481726e-07, + "loss": 1.0306, + "step": 25317 + }, + { + "epoch": 0.76, + "learning_rate": 7.026900598552131e-07, + "loss": 1.0162, + "step": 25318 + }, + { + "epoch": 0.76, + "learning_rate": 7.025205223382253e-07, + "loss": 1.1693, + "step": 25319 + }, + { + "epoch": 0.76, + "learning_rate": 7.023510019323768e-07, + "loss": 1.0538, + "step": 25320 + }, + { + "epoch": 0.76, + "learning_rate": 7.021814986392813e-07, + "loss": 1.059, + "step": 25321 + }, + { + "epoch": 0.76, + "learning_rate": 7.020120124605515e-07, + "loss": 1.0756, + "step": 25322 + }, + { + "epoch": 0.76, + "learning_rate": 7.018425433978012e-07, + "loss": 1.0768, + "step": 25323 + }, + { + "epoch": 0.76, + "learning_rate": 7.016730914526442e-07, + "loss": 1.2098, + "step": 25324 + }, + { + "epoch": 0.76, + "learning_rate": 7.015036566266931e-07, + "loss": 1.1241, + "step": 25325 + }, + { + "epoch": 0.76, + "learning_rate": 7.01334238921561e-07, + "loss": 1.0244, + "step": 25326 + }, + { + "epoch": 0.76, + "learning_rate": 7.011648383388608e-07, + "loss": 1.0109, + "step": 25327 + }, + { + "epoch": 0.76, + "learning_rate": 7.009954548802047e-07, + "loss": 1.0574, + "step": 25328 + }, + { + "epoch": 0.76, + "learning_rate": 7.008260885472057e-07, + "loss": 1.0942, + "step": 25329 + }, + { + "epoch": 0.76, + "learning_rate": 7.006567393414765e-07, + "loss": 1.0716, + "step": 25330 + }, + { + "epoch": 0.76, + "learning_rate": 7.004874072646279e-07, + "loss": 0.9884, + "step": 25331 + }, + { + "epoch": 0.76, + "learning_rate": 7.003180923182723e-07, + "loss": 1.08, + "step": 25332 + }, + { + "epoch": 0.76, + "learning_rate": 7.001487945040217e-07, + "loss": 1.0694, + "step": 25333 + }, + { + "epoch": 0.76, + "learning_rate": 6.999795138234888e-07, + "loss": 1.0494, + "step": 25334 + }, + { + "epoch": 0.76, + "learning_rate": 6.99810250278283e-07, + "loss": 1.108, + "step": 25335 + }, + { + "epoch": 0.76, + "learning_rate": 6.996410038700166e-07, + "loss": 1.1279, + "step": 25336 + }, + { + "epoch": 0.76, + "learning_rate": 6.994717746003008e-07, + "loss": 1.1783, + "step": 25337 + }, + { + "epoch": 0.76, + "learning_rate": 6.993025624707476e-07, + "loss": 1.1241, + "step": 25338 + }, + { + "epoch": 0.76, + "learning_rate": 6.991333674829656e-07, + "loss": 1.1068, + "step": 25339 + }, + { + "epoch": 0.76, + "learning_rate": 6.989641896385665e-07, + "loss": 1.1053, + "step": 25340 + }, + { + "epoch": 0.76, + "learning_rate": 6.987950289391613e-07, + "loss": 0.9799, + "step": 25341 + }, + { + "epoch": 0.76, + "learning_rate": 6.986258853863597e-07, + "loss": 1.1527, + "step": 25342 + }, + { + "epoch": 0.76, + "learning_rate": 6.984567589817731e-07, + "loss": 1.1844, + "step": 25343 + }, + { + "epoch": 0.76, + "learning_rate": 6.982876497270094e-07, + "loss": 1.0764, + "step": 25344 + }, + { + "epoch": 0.76, + "learning_rate": 6.981185576236799e-07, + "loss": 1.0372, + "step": 25345 + }, + { + "epoch": 0.76, + "learning_rate": 6.979494826733938e-07, + "loss": 1.1749, + "step": 25346 + }, + { + "epoch": 0.76, + "learning_rate": 6.977804248777614e-07, + "loss": 1.1956, + "step": 25347 + }, + { + "epoch": 0.76, + "learning_rate": 6.976113842383905e-07, + "loss": 1.0067, + "step": 25348 + }, + { + "epoch": 0.76, + "learning_rate": 6.974423607568914e-07, + "loss": 1.1759, + "step": 25349 + }, + { + "epoch": 0.76, + "learning_rate": 6.972733544348728e-07, + "loss": 1.0138, + "step": 25350 + }, + { + "epoch": 0.76, + "learning_rate": 6.971043652739437e-07, + "loss": 1.0626, + "step": 25351 + }, + { + "epoch": 0.76, + "learning_rate": 6.969353932757125e-07, + "loss": 0.9705, + "step": 25352 + }, + { + "epoch": 0.76, + "learning_rate": 6.967664384417883e-07, + "loss": 1.0406, + "step": 25353 + }, + { + "epoch": 0.76, + "learning_rate": 6.965975007737789e-07, + "loss": 1.0536, + "step": 25354 + }, + { + "epoch": 0.76, + "learning_rate": 6.964285802732929e-07, + "loss": 1.1182, + "step": 25355 + }, + { + "epoch": 0.76, + "learning_rate": 6.962596769419388e-07, + "loss": 1.0286, + "step": 25356 + }, + { + "epoch": 0.76, + "learning_rate": 6.96090790781323e-07, + "loss": 0.9911, + "step": 25357 + }, + { + "epoch": 0.76, + "learning_rate": 6.959219217930544e-07, + "loss": 1.1417, + "step": 25358 + }, + { + "epoch": 0.76, + "learning_rate": 6.957530699787402e-07, + "loss": 1.0613, + "step": 25359 + }, + { + "epoch": 0.76, + "learning_rate": 6.955842353399883e-07, + "loss": 1.062, + "step": 25360 + }, + { + "epoch": 0.76, + "learning_rate": 6.954154178784048e-07, + "loss": 1.0639, + "step": 25361 + }, + { + "epoch": 0.76, + "learning_rate": 6.952466175955974e-07, + "loss": 1.0712, + "step": 25362 + }, + { + "epoch": 0.76, + "learning_rate": 6.950778344931733e-07, + "loss": 1.0773, + "step": 25363 + }, + { + "epoch": 0.76, + "learning_rate": 6.949090685727394e-07, + "loss": 1.0847, + "step": 25364 + }, + { + "epoch": 0.76, + "learning_rate": 6.94740319835901e-07, + "loss": 1.043, + "step": 25365 + }, + { + "epoch": 0.76, + "learning_rate": 6.945715882842655e-07, + "loss": 1.0969, + "step": 25366 + }, + { + "epoch": 0.76, + "learning_rate": 6.944028739194389e-07, + "loss": 1.1765, + "step": 25367 + }, + { + "epoch": 0.76, + "learning_rate": 6.942341767430272e-07, + "loss": 1.2083, + "step": 25368 + }, + { + "epoch": 0.76, + "learning_rate": 6.940654967566374e-07, + "loss": 1.1863, + "step": 25369 + }, + { + "epoch": 0.76, + "learning_rate": 6.938968339618734e-07, + "loss": 0.9915, + "step": 25370 + }, + { + "epoch": 0.76, + "learning_rate": 6.937281883603417e-07, + "loss": 1.0785, + "step": 25371 + }, + { + "epoch": 0.76, + "learning_rate": 6.935595599536477e-07, + "loss": 1.1009, + "step": 25372 + }, + { + "epoch": 0.76, + "learning_rate": 6.933909487433976e-07, + "loss": 1.1835, + "step": 25373 + }, + { + "epoch": 0.76, + "learning_rate": 6.932223547311947e-07, + "loss": 1.058, + "step": 25374 + }, + { + "epoch": 0.76, + "learning_rate": 6.930537779186447e-07, + "loss": 1.1581, + "step": 25375 + }, + { + "epoch": 0.76, + "learning_rate": 6.928852183073526e-07, + "loss": 1.0968, + "step": 25376 + }, + { + "epoch": 0.76, + "learning_rate": 6.927166758989229e-07, + "loss": 1.1971, + "step": 25377 + }, + { + "epoch": 0.76, + "learning_rate": 6.925481506949599e-07, + "loss": 1.0972, + "step": 25378 + }, + { + "epoch": 0.76, + "learning_rate": 6.923796426970683e-07, + "loss": 1.1575, + "step": 25379 + }, + { + "epoch": 0.76, + "learning_rate": 6.922111519068517e-07, + "loss": 1.0153, + "step": 25380 + }, + { + "epoch": 0.76, + "learning_rate": 6.920426783259151e-07, + "loss": 1.2128, + "step": 25381 + }, + { + "epoch": 0.76, + "learning_rate": 6.918742219558608e-07, + "loss": 1.1849, + "step": 25382 + }, + { + "epoch": 0.76, + "learning_rate": 6.917057827982929e-07, + "loss": 1.1224, + "step": 25383 + }, + { + "epoch": 0.76, + "learning_rate": 6.915373608548151e-07, + "loss": 1.037, + "step": 25384 + }, + { + "epoch": 0.76, + "learning_rate": 6.913689561270306e-07, + "loss": 1.191, + "step": 25385 + }, + { + "epoch": 0.76, + "learning_rate": 6.912005686165432e-07, + "loss": 1.103, + "step": 25386 + }, + { + "epoch": 0.76, + "learning_rate": 6.910321983249549e-07, + "loss": 1.1403, + "step": 25387 + }, + { + "epoch": 0.76, + "learning_rate": 6.908638452538685e-07, + "loss": 1.1832, + "step": 25388 + }, + { + "epoch": 0.76, + "learning_rate": 6.90695509404887e-07, + "loss": 1.0871, + "step": 25389 + }, + { + "epoch": 0.76, + "learning_rate": 6.905271907796137e-07, + "loss": 1.0145, + "step": 25390 + }, + { + "epoch": 0.76, + "learning_rate": 6.903588893796492e-07, + "loss": 0.8979, + "step": 25391 + }, + { + "epoch": 0.76, + "learning_rate": 6.901906052065968e-07, + "loss": 1.1001, + "step": 25392 + }, + { + "epoch": 0.76, + "learning_rate": 6.90022338262058e-07, + "loss": 1.0353, + "step": 25393 + }, + { + "epoch": 0.76, + "learning_rate": 6.898540885476357e-07, + "loss": 1.0796, + "step": 25394 + }, + { + "epoch": 0.77, + "learning_rate": 6.896858560649297e-07, + "loss": 1.0858, + "step": 25395 + }, + { + "epoch": 0.77, + "learning_rate": 6.895176408155427e-07, + "loss": 1.0178, + "step": 25396 + }, + { + "epoch": 0.77, + "learning_rate": 6.893494428010758e-07, + "loss": 1.0109, + "step": 25397 + }, + { + "epoch": 0.77, + "learning_rate": 6.8918126202313e-07, + "loss": 1.1562, + "step": 25398 + }, + { + "epoch": 0.77, + "learning_rate": 6.890130984833074e-07, + "loss": 1.1889, + "step": 25399 + }, + { + "epoch": 0.77, + "learning_rate": 6.888449521832069e-07, + "loss": 1.0661, + "step": 25400 + }, + { + "epoch": 0.77, + "learning_rate": 6.886768231244304e-07, + "loss": 1.0867, + "step": 25401 + }, + { + "epoch": 0.77, + "learning_rate": 6.885087113085781e-07, + "loss": 1.1023, + "step": 25402 + }, + { + "epoch": 0.77, + "learning_rate": 6.883406167372503e-07, + "loss": 1.046, + "step": 25403 + }, + { + "epoch": 0.77, + "learning_rate": 6.881725394120483e-07, + "loss": 1.1617, + "step": 25404 + }, + { + "epoch": 0.77, + "learning_rate": 6.880044793345702e-07, + "loss": 1.217, + "step": 25405 + }, + { + "epoch": 0.77, + "learning_rate": 6.878364365064169e-07, + "loss": 1.1476, + "step": 25406 + }, + { + "epoch": 0.77, + "learning_rate": 6.876684109291878e-07, + "loss": 1.1569, + "step": 25407 + }, + { + "epoch": 0.77, + "learning_rate": 6.875004026044827e-07, + "loss": 1.1031, + "step": 25408 + }, + { + "epoch": 0.77, + "learning_rate": 6.873324115339005e-07, + "loss": 1.1227, + "step": 25409 + }, + { + "epoch": 0.77, + "learning_rate": 6.871644377190412e-07, + "loss": 1.1752, + "step": 25410 + }, + { + "epoch": 0.77, + "learning_rate": 6.869964811615032e-07, + "loss": 1.184, + "step": 25411 + }, + { + "epoch": 0.77, + "learning_rate": 6.868285418628861e-07, + "loss": 1.1004, + "step": 25412 + }, + { + "epoch": 0.77, + "learning_rate": 6.866606198247877e-07, + "loss": 1.0986, + "step": 25413 + }, + { + "epoch": 0.77, + "learning_rate": 6.864927150488065e-07, + "loss": 1.1584, + "step": 25414 + }, + { + "epoch": 0.77, + "learning_rate": 6.863248275365414e-07, + "loss": 1.0889, + "step": 25415 + }, + { + "epoch": 0.77, + "learning_rate": 6.86156957289591e-07, + "loss": 1.1178, + "step": 25416 + }, + { + "epoch": 0.77, + "learning_rate": 6.859891043095524e-07, + "loss": 1.1187, + "step": 25417 + }, + { + "epoch": 0.77, + "learning_rate": 6.858212685980234e-07, + "loss": 1.0737, + "step": 25418 + }, + { + "epoch": 0.77, + "learning_rate": 6.856534501566026e-07, + "loss": 1.1905, + "step": 25419 + }, + { + "epoch": 0.77, + "learning_rate": 6.854856489868877e-07, + "loss": 1.1471, + "step": 25420 + }, + { + "epoch": 0.77, + "learning_rate": 6.853178650904746e-07, + "loss": 1.0676, + "step": 25421 + }, + { + "epoch": 0.77, + "learning_rate": 6.851500984689619e-07, + "loss": 1.1607, + "step": 25422 + }, + { + "epoch": 0.77, + "learning_rate": 6.849823491239457e-07, + "loss": 1.0117, + "step": 25423 + }, + { + "epoch": 0.77, + "learning_rate": 6.848146170570236e-07, + "loss": 1.1354, + "step": 25424 + }, + { + "epoch": 0.77, + "learning_rate": 6.84646902269793e-07, + "loss": 1.2274, + "step": 25425 + }, + { + "epoch": 0.77, + "learning_rate": 6.844792047638487e-07, + "loss": 1.2302, + "step": 25426 + }, + { + "epoch": 0.77, + "learning_rate": 6.84311524540788e-07, + "loss": 1.1113, + "step": 25427 + }, + { + "epoch": 0.77, + "learning_rate": 6.841438616022073e-07, + "loss": 1.1368, + "step": 25428 + }, + { + "epoch": 0.77, + "learning_rate": 6.839762159497029e-07, + "loss": 1.1021, + "step": 25429 + }, + { + "epoch": 0.77, + "learning_rate": 6.838085875848699e-07, + "loss": 1.0821, + "step": 25430 + }, + { + "epoch": 0.77, + "learning_rate": 6.836409765093041e-07, + "loss": 1.1259, + "step": 25431 + }, + { + "epoch": 0.77, + "learning_rate": 6.834733827246018e-07, + "loss": 1.0944, + "step": 25432 + }, + { + "epoch": 0.77, + "learning_rate": 6.833058062323577e-07, + "loss": 1.0669, + "step": 25433 + }, + { + "epoch": 0.77, + "learning_rate": 6.831382470341674e-07, + "loss": 1.0943, + "step": 25434 + }, + { + "epoch": 0.77, + "learning_rate": 6.829707051316262e-07, + "loss": 1.1132, + "step": 25435 + }, + { + "epoch": 0.77, + "learning_rate": 6.828031805263285e-07, + "loss": 1.2478, + "step": 25436 + }, + { + "epoch": 0.77, + "learning_rate": 6.826356732198694e-07, + "loss": 1.1526, + "step": 25437 + }, + { + "epoch": 0.77, + "learning_rate": 6.824681832138444e-07, + "loss": 1.0745, + "step": 25438 + }, + { + "epoch": 0.77, + "learning_rate": 6.823007105098459e-07, + "loss": 1.1424, + "step": 25439 + }, + { + "epoch": 0.77, + "learning_rate": 6.821332551094692e-07, + "loss": 1.1475, + "step": 25440 + }, + { + "epoch": 0.77, + "learning_rate": 6.819658170143087e-07, + "loss": 1.0547, + "step": 25441 + }, + { + "epoch": 0.77, + "learning_rate": 6.817983962259583e-07, + "loss": 1.0908, + "step": 25442 + }, + { + "epoch": 0.77, + "learning_rate": 6.816309927460113e-07, + "loss": 1.1967, + "step": 25443 + }, + { + "epoch": 0.77, + "learning_rate": 6.81463606576061e-07, + "loss": 1.0764, + "step": 25444 + }, + { + "epoch": 0.77, + "learning_rate": 6.812962377177016e-07, + "loss": 1.0667, + "step": 25445 + }, + { + "epoch": 0.77, + "learning_rate": 6.811288861725268e-07, + "loss": 1.1293, + "step": 25446 + }, + { + "epoch": 0.77, + "learning_rate": 6.809615519421284e-07, + "loss": 1.0796, + "step": 25447 + }, + { + "epoch": 0.77, + "learning_rate": 6.807942350280996e-07, + "loss": 1.0679, + "step": 25448 + }, + { + "epoch": 0.77, + "learning_rate": 6.806269354320339e-07, + "loss": 1.0247, + "step": 25449 + }, + { + "epoch": 0.77, + "learning_rate": 6.804596531555232e-07, + "loss": 1.1585, + "step": 25450 + }, + { + "epoch": 0.77, + "learning_rate": 6.802923882001614e-07, + "loss": 1.1348, + "step": 25451 + }, + { + "epoch": 0.77, + "learning_rate": 6.801251405675385e-07, + "loss": 1.0356, + "step": 25452 + }, + { + "epoch": 0.77, + "learning_rate": 6.799579102592479e-07, + "loss": 1.1783, + "step": 25453 + }, + { + "epoch": 0.77, + "learning_rate": 6.797906972768817e-07, + "loss": 1.0657, + "step": 25454 + }, + { + "epoch": 0.77, + "learning_rate": 6.796235016220318e-07, + "loss": 1.204, + "step": 25455 + }, + { + "epoch": 0.77, + "learning_rate": 6.794563232962889e-07, + "loss": 0.999, + "step": 25456 + }, + { + "epoch": 0.77, + "learning_rate": 6.792891623012451e-07, + "loss": 1.0881, + "step": 25457 + }, + { + "epoch": 0.77, + "learning_rate": 6.791220186384914e-07, + "loss": 1.0162, + "step": 25458 + }, + { + "epoch": 0.77, + "learning_rate": 6.789548923096193e-07, + "loss": 1.0013, + "step": 25459 + }, + { + "epoch": 0.77, + "learning_rate": 6.787877833162193e-07, + "loss": 1.129, + "step": 25460 + }, + { + "epoch": 0.77, + "learning_rate": 6.786206916598825e-07, + "loss": 1.1045, + "step": 25461 + }, + { + "epoch": 0.77, + "learning_rate": 6.784536173421999e-07, + "loss": 1.1448, + "step": 25462 + }, + { + "epoch": 0.77, + "learning_rate": 6.782865603647612e-07, + "loss": 1.0367, + "step": 25463 + }, + { + "epoch": 0.77, + "learning_rate": 6.78119520729158e-07, + "loss": 1.078, + "step": 25464 + }, + { + "epoch": 0.77, + "learning_rate": 6.779524984369786e-07, + "loss": 1.0761, + "step": 25465 + }, + { + "epoch": 0.77, + "learning_rate": 6.777854934898139e-07, + "loss": 1.1669, + "step": 25466 + }, + { + "epoch": 0.77, + "learning_rate": 6.77618505889254e-07, + "loss": 1.0475, + "step": 25467 + }, + { + "epoch": 0.77, + "learning_rate": 6.774515356368888e-07, + "loss": 0.9987, + "step": 25468 + }, + { + "epoch": 0.77, + "learning_rate": 6.772845827343063e-07, + "loss": 1.1464, + "step": 25469 + }, + { + "epoch": 0.77, + "learning_rate": 6.77117647183097e-07, + "loss": 1.0466, + "step": 25470 + }, + { + "epoch": 0.77, + "learning_rate": 6.769507289848496e-07, + "loss": 1.1949, + "step": 25471 + }, + { + "epoch": 0.77, + "learning_rate": 6.76783828141154e-07, + "loss": 1.1215, + "step": 25472 + }, + { + "epoch": 0.77, + "learning_rate": 6.766169446535975e-07, + "loss": 1.1289, + "step": 25473 + }, + { + "epoch": 0.77, + "learning_rate": 6.764500785237696e-07, + "loss": 1.2128, + "step": 25474 + }, + { + "epoch": 0.77, + "learning_rate": 6.762832297532587e-07, + "loss": 1.0923, + "step": 25475 + }, + { + "epoch": 0.77, + "learning_rate": 6.761163983436531e-07, + "loss": 1.1119, + "step": 25476 + }, + { + "epoch": 0.77, + "learning_rate": 6.759495842965416e-07, + "loss": 1.1815, + "step": 25477 + }, + { + "epoch": 0.77, + "learning_rate": 6.757827876135109e-07, + "loss": 1.1462, + "step": 25478 + }, + { + "epoch": 0.77, + "learning_rate": 6.756160082961497e-07, + "loss": 1.0472, + "step": 25479 + }, + { + "epoch": 0.77, + "learning_rate": 6.754492463460452e-07, + "loss": 1.1124, + "step": 25480 + }, + { + "epoch": 0.77, + "learning_rate": 6.75282501764786e-07, + "loss": 0.9057, + "step": 25481 + }, + { + "epoch": 0.77, + "learning_rate": 6.751157745539577e-07, + "loss": 1.1444, + "step": 25482 + }, + { + "epoch": 0.77, + "learning_rate": 6.749490647151482e-07, + "loss": 1.1262, + "step": 25483 + }, + { + "epoch": 0.77, + "learning_rate": 6.74782372249945e-07, + "loss": 1.0135, + "step": 25484 + }, + { + "epoch": 0.77, + "learning_rate": 6.746156971599344e-07, + "loss": 1.0589, + "step": 25485 + }, + { + "epoch": 0.77, + "learning_rate": 6.744490394467041e-07, + "loss": 1.1326, + "step": 25486 + }, + { + "epoch": 0.77, + "learning_rate": 6.742823991118386e-07, + "loss": 1.1365, + "step": 25487 + }, + { + "epoch": 0.77, + "learning_rate": 6.741157761569255e-07, + "loss": 1.1312, + "step": 25488 + }, + { + "epoch": 0.77, + "learning_rate": 6.73949170583551e-07, + "loss": 1.0723, + "step": 25489 + }, + { + "epoch": 0.77, + "learning_rate": 6.737825823933008e-07, + "loss": 0.9454, + "step": 25490 + }, + { + "epoch": 0.77, + "learning_rate": 6.73616011587761e-07, + "loss": 1.0068, + "step": 25491 + }, + { + "epoch": 0.77, + "learning_rate": 6.734494581685172e-07, + "loss": 1.1343, + "step": 25492 + }, + { + "epoch": 0.77, + "learning_rate": 6.732829221371548e-07, + "loss": 1.1382, + "step": 25493 + }, + { + "epoch": 0.77, + "learning_rate": 6.7311640349526e-07, + "loss": 1.0158, + "step": 25494 + }, + { + "epoch": 0.77, + "learning_rate": 6.729499022444163e-07, + "loss": 1.1255, + "step": 25495 + }, + { + "epoch": 0.77, + "learning_rate": 6.727834183862098e-07, + "loss": 1.1943, + "step": 25496 + }, + { + "epoch": 0.77, + "learning_rate": 6.726169519222248e-07, + "loss": 1.0735, + "step": 25497 + }, + { + "epoch": 0.77, + "learning_rate": 6.724505028540474e-07, + "loss": 0.9561, + "step": 25498 + }, + { + "epoch": 0.77, + "learning_rate": 6.722840711832602e-07, + "loss": 1.1005, + "step": 25499 + }, + { + "epoch": 0.77, + "learning_rate": 6.721176569114482e-07, + "loss": 1.0173, + "step": 25500 + }, + { + "epoch": 0.77, + "learning_rate": 6.719512600401959e-07, + "loss": 1.0744, + "step": 25501 + }, + { + "epoch": 0.77, + "learning_rate": 6.717848805710872e-07, + "loss": 1.0439, + "step": 25502 + }, + { + "epoch": 0.77, + "learning_rate": 6.716185185057067e-07, + "loss": 1.1101, + "step": 25503 + }, + { + "epoch": 0.77, + "learning_rate": 6.714521738456364e-07, + "loss": 1.1641, + "step": 25504 + }, + { + "epoch": 0.77, + "learning_rate": 6.712858465924609e-07, + "loss": 1.0616, + "step": 25505 + }, + { + "epoch": 0.77, + "learning_rate": 6.711195367477635e-07, + "loss": 0.9598, + "step": 25506 + }, + { + "epoch": 0.77, + "learning_rate": 6.709532443131281e-07, + "loss": 1.1187, + "step": 25507 + }, + { + "epoch": 0.77, + "learning_rate": 6.707869692901358e-07, + "loss": 1.1121, + "step": 25508 + }, + { + "epoch": 0.77, + "learning_rate": 6.706207116803709e-07, + "loss": 1.0948, + "step": 25509 + }, + { + "epoch": 0.77, + "learning_rate": 6.704544714854155e-07, + "loss": 0.9792, + "step": 25510 + }, + { + "epoch": 0.77, + "learning_rate": 6.702882487068535e-07, + "loss": 0.9614, + "step": 25511 + }, + { + "epoch": 0.77, + "learning_rate": 6.701220433462651e-07, + "loss": 1.1381, + "step": 25512 + }, + { + "epoch": 0.77, + "learning_rate": 6.699558554052335e-07, + "loss": 1.1395, + "step": 25513 + }, + { + "epoch": 0.77, + "learning_rate": 6.697896848853411e-07, + "loss": 1.0392, + "step": 25514 + }, + { + "epoch": 0.77, + "learning_rate": 6.696235317881692e-07, + "loss": 1.0912, + "step": 25515 + }, + { + "epoch": 0.77, + "learning_rate": 6.694573961152998e-07, + "loss": 1.0407, + "step": 25516 + }, + { + "epoch": 0.77, + "learning_rate": 6.692912778683144e-07, + "loss": 1.1863, + "step": 25517 + }, + { + "epoch": 0.77, + "learning_rate": 6.691251770487941e-07, + "loss": 1.1934, + "step": 25518 + }, + { + "epoch": 0.77, + "learning_rate": 6.689590936583207e-07, + "loss": 1.0542, + "step": 25519 + }, + { + "epoch": 0.77, + "learning_rate": 6.687930276984755e-07, + "loss": 1.1521, + "step": 25520 + }, + { + "epoch": 0.77, + "learning_rate": 6.686269791708377e-07, + "loss": 1.0695, + "step": 25521 + }, + { + "epoch": 0.77, + "learning_rate": 6.684609480769894e-07, + "loss": 1.1529, + "step": 25522 + }, + { + "epoch": 0.77, + "learning_rate": 6.682949344185108e-07, + "loss": 1.1418, + "step": 25523 + }, + { + "epoch": 0.77, + "learning_rate": 6.681289381969828e-07, + "loss": 1.2383, + "step": 25524 + }, + { + "epoch": 0.77, + "learning_rate": 6.679629594139842e-07, + "loss": 1.1454, + "step": 25525 + }, + { + "epoch": 0.77, + "learning_rate": 6.67796998071096e-07, + "loss": 1.1147, + "step": 25526 + }, + { + "epoch": 0.77, + "learning_rate": 6.676310541698979e-07, + "loss": 1.1443, + "step": 25527 + }, + { + "epoch": 0.77, + "learning_rate": 6.6746512771197e-07, + "loss": 1.2234, + "step": 25528 + }, + { + "epoch": 0.77, + "learning_rate": 6.672992186988919e-07, + "loss": 1.0308, + "step": 25529 + }, + { + "epoch": 0.77, + "learning_rate": 6.67133327132242e-07, + "loss": 1.1492, + "step": 25530 + }, + { + "epoch": 0.77, + "learning_rate": 6.669674530136e-07, + "loss": 1.0048, + "step": 25531 + }, + { + "epoch": 0.77, + "learning_rate": 6.668015963445451e-07, + "loss": 1.0685, + "step": 25532 + }, + { + "epoch": 0.77, + "learning_rate": 6.666357571266568e-07, + "loss": 1.0853, + "step": 25533 + }, + { + "epoch": 0.77, + "learning_rate": 6.664699353615123e-07, + "loss": 1.1216, + "step": 25534 + }, + { + "epoch": 0.77, + "learning_rate": 6.663041310506909e-07, + "loss": 1.1525, + "step": 25535 + }, + { + "epoch": 0.77, + "learning_rate": 6.661383441957714e-07, + "loss": 1.2213, + "step": 25536 + }, + { + "epoch": 0.77, + "learning_rate": 6.65972574798332e-07, + "loss": 1.2118, + "step": 25537 + }, + { + "epoch": 0.77, + "learning_rate": 6.658068228599499e-07, + "loss": 1.0068, + "step": 25538 + }, + { + "epoch": 0.77, + "learning_rate": 6.656410883822034e-07, + "loss": 1.1109, + "step": 25539 + }, + { + "epoch": 0.77, + "learning_rate": 6.654753713666703e-07, + "loss": 1.0609, + "step": 25540 + }, + { + "epoch": 0.77, + "learning_rate": 6.653096718149279e-07, + "loss": 1.1569, + "step": 25541 + }, + { + "epoch": 0.77, + "learning_rate": 6.651439897285541e-07, + "loss": 1.1116, + "step": 25542 + }, + { + "epoch": 0.77, + "learning_rate": 6.649783251091257e-07, + "loss": 1.1755, + "step": 25543 + }, + { + "epoch": 0.77, + "learning_rate": 6.648126779582198e-07, + "loss": 1.1031, + "step": 25544 + }, + { + "epoch": 0.77, + "learning_rate": 6.646470482774134e-07, + "loss": 1.0847, + "step": 25545 + }, + { + "epoch": 0.77, + "learning_rate": 6.644814360682841e-07, + "loss": 1.1179, + "step": 25546 + }, + { + "epoch": 0.77, + "learning_rate": 6.643158413324067e-07, + "loss": 1.1202, + "step": 25547 + }, + { + "epoch": 0.77, + "learning_rate": 6.641502640713582e-07, + "loss": 1.1299, + "step": 25548 + }, + { + "epoch": 0.77, + "learning_rate": 6.63984704286715e-07, + "loss": 1.0867, + "step": 25549 + }, + { + "epoch": 0.77, + "learning_rate": 6.638191619800541e-07, + "loss": 1.0836, + "step": 25550 + }, + { + "epoch": 0.77, + "learning_rate": 6.636536371529495e-07, + "loss": 1.1939, + "step": 25551 + }, + { + "epoch": 0.77, + "learning_rate": 6.634881298069781e-07, + "loss": 1.0674, + "step": 25552 + }, + { + "epoch": 0.77, + "learning_rate": 6.633226399437151e-07, + "loss": 1.0513, + "step": 25553 + }, + { + "epoch": 0.77, + "learning_rate": 6.631571675647358e-07, + "loss": 1.0539, + "step": 25554 + }, + { + "epoch": 0.77, + "learning_rate": 6.629917126716165e-07, + "loss": 1.2223, + "step": 25555 + }, + { + "epoch": 0.77, + "learning_rate": 6.628262752659306e-07, + "loss": 1.2294, + "step": 25556 + }, + { + "epoch": 0.77, + "learning_rate": 6.626608553492539e-07, + "loss": 1.101, + "step": 25557 + }, + { + "epoch": 0.77, + "learning_rate": 6.624954529231609e-07, + "loss": 1.0984, + "step": 25558 + }, + { + "epoch": 0.77, + "learning_rate": 6.623300679892269e-07, + "loss": 1.1563, + "step": 25559 + }, + { + "epoch": 0.77, + "learning_rate": 6.621647005490248e-07, + "loss": 1.0409, + "step": 25560 + }, + { + "epoch": 0.77, + "learning_rate": 6.619993506041298e-07, + "loss": 1.2964, + "step": 25561 + }, + { + "epoch": 0.77, + "learning_rate": 6.618340181561156e-07, + "loss": 1.124, + "step": 25562 + }, + { + "epoch": 0.77, + "learning_rate": 6.616687032065572e-07, + "loss": 1.1249, + "step": 25563 + }, + { + "epoch": 0.77, + "learning_rate": 6.615034057570263e-07, + "loss": 1.1613, + "step": 25564 + }, + { + "epoch": 0.77, + "learning_rate": 6.613381258090979e-07, + "loss": 1.011, + "step": 25565 + }, + { + "epoch": 0.77, + "learning_rate": 6.611728633643447e-07, + "loss": 1.2272, + "step": 25566 + }, + { + "epoch": 0.77, + "learning_rate": 6.610076184243402e-07, + "loss": 1.0762, + "step": 25567 + }, + { + "epoch": 0.77, + "learning_rate": 6.608423909906586e-07, + "loss": 1.1149, + "step": 25568 + }, + { + "epoch": 0.77, + "learning_rate": 6.606771810648708e-07, + "loss": 1.1615, + "step": 25569 + }, + { + "epoch": 0.77, + "learning_rate": 6.605119886485501e-07, + "loss": 1.093, + "step": 25570 + }, + { + "epoch": 0.77, + "learning_rate": 6.603468137432694e-07, + "loss": 1.0849, + "step": 25571 + }, + { + "epoch": 0.77, + "learning_rate": 6.601816563506013e-07, + "loss": 1.0123, + "step": 25572 + }, + { + "epoch": 0.77, + "learning_rate": 6.600165164721175e-07, + "loss": 1.1345, + "step": 25573 + }, + { + "epoch": 0.77, + "learning_rate": 6.598513941093906e-07, + "loss": 1.1265, + "step": 25574 + }, + { + "epoch": 0.77, + "learning_rate": 6.596862892639918e-07, + "loss": 1.0416, + "step": 25575 + }, + { + "epoch": 0.77, + "learning_rate": 6.595212019374944e-07, + "loss": 1.1135, + "step": 25576 + }, + { + "epoch": 0.77, + "learning_rate": 6.593561321314676e-07, + "loss": 1.1276, + "step": 25577 + }, + { + "epoch": 0.77, + "learning_rate": 6.59191079847484e-07, + "loss": 1.124, + "step": 25578 + }, + { + "epoch": 0.77, + "learning_rate": 6.59026045087115e-07, + "loss": 0.8851, + "step": 25579 + }, + { + "epoch": 0.77, + "learning_rate": 6.58861027851932e-07, + "loss": 1.1356, + "step": 25580 + }, + { + "epoch": 0.77, + "learning_rate": 6.586960281435046e-07, + "loss": 1.2795, + "step": 25581 + }, + { + "epoch": 0.77, + "learning_rate": 6.585310459634039e-07, + "loss": 1.0338, + "step": 25582 + }, + { + "epoch": 0.77, + "learning_rate": 6.583660813132011e-07, + "loss": 1.0766, + "step": 25583 + }, + { + "epoch": 0.77, + "learning_rate": 6.58201134194466e-07, + "loss": 1.0544, + "step": 25584 + }, + { + "epoch": 0.77, + "learning_rate": 6.580362046087701e-07, + "loss": 1.0671, + "step": 25585 + }, + { + "epoch": 0.77, + "learning_rate": 6.578712925576817e-07, + "loss": 1.0654, + "step": 25586 + }, + { + "epoch": 0.77, + "learning_rate": 6.577063980427711e-07, + "loss": 1.0636, + "step": 25587 + }, + { + "epoch": 0.77, + "learning_rate": 6.575415210656083e-07, + "loss": 1.004, + "step": 25588 + }, + { + "epoch": 0.77, + "learning_rate": 6.573766616277638e-07, + "loss": 0.9724, + "step": 25589 + }, + { + "epoch": 0.77, + "learning_rate": 6.572118197308052e-07, + "loss": 1.0444, + "step": 25590 + }, + { + "epoch": 0.77, + "learning_rate": 6.570469953763029e-07, + "loss": 1.1517, + "step": 25591 + }, + { + "epoch": 0.77, + "learning_rate": 6.568821885658253e-07, + "loss": 1.1588, + "step": 25592 + }, + { + "epoch": 0.77, + "learning_rate": 6.567173993009421e-07, + "loss": 1.1407, + "step": 25593 + }, + { + "epoch": 0.77, + "learning_rate": 6.565526275832209e-07, + "loss": 1.1832, + "step": 25594 + }, + { + "epoch": 0.77, + "learning_rate": 6.563878734142312e-07, + "loss": 1.0947, + "step": 25595 + }, + { + "epoch": 0.77, + "learning_rate": 6.562231367955407e-07, + "loss": 1.2042, + "step": 25596 + }, + { + "epoch": 0.77, + "learning_rate": 6.56058417728718e-07, + "loss": 1.0484, + "step": 25597 + }, + { + "epoch": 0.77, + "learning_rate": 6.558937162153311e-07, + "loss": 1.2158, + "step": 25598 + }, + { + "epoch": 0.77, + "learning_rate": 6.557290322569479e-07, + "loss": 1.1454, + "step": 25599 + }, + { + "epoch": 0.77, + "learning_rate": 6.555643658551361e-07, + "loss": 1.1119, + "step": 25600 + }, + { + "epoch": 0.77, + "learning_rate": 6.553997170114631e-07, + "loss": 1.0952, + "step": 25601 + }, + { + "epoch": 0.77, + "learning_rate": 6.552350857274972e-07, + "loss": 1.1426, + "step": 25602 + }, + { + "epoch": 0.77, + "learning_rate": 6.550704720048043e-07, + "loss": 1.1721, + "step": 25603 + }, + { + "epoch": 0.77, + "learning_rate": 6.549058758449517e-07, + "loss": 1.2529, + "step": 25604 + }, + { + "epoch": 0.77, + "learning_rate": 6.547412972495065e-07, + "loss": 1.1802, + "step": 25605 + }, + { + "epoch": 0.77, + "learning_rate": 6.545767362200364e-07, + "loss": 1.1025, + "step": 25606 + }, + { + "epoch": 0.77, + "learning_rate": 6.544121927581059e-07, + "loss": 1.1519, + "step": 25607 + }, + { + "epoch": 0.77, + "learning_rate": 6.542476668652828e-07, + "loss": 1.1231, + "step": 25608 + }, + { + "epoch": 0.77, + "learning_rate": 6.540831585431329e-07, + "loss": 1.1038, + "step": 25609 + }, + { + "epoch": 0.77, + "learning_rate": 6.539186677932222e-07, + "loss": 1.0325, + "step": 25610 + }, + { + "epoch": 0.77, + "learning_rate": 6.537541946171175e-07, + "loss": 1.1178, + "step": 25611 + }, + { + "epoch": 0.77, + "learning_rate": 6.535897390163828e-07, + "loss": 1.2004, + "step": 25612 + }, + { + "epoch": 0.77, + "learning_rate": 6.534253009925848e-07, + "loss": 1.1888, + "step": 25613 + }, + { + "epoch": 0.77, + "learning_rate": 6.532608805472885e-07, + "loss": 1.0723, + "step": 25614 + }, + { + "epoch": 0.77, + "learning_rate": 6.530964776820597e-07, + "loss": 1.0851, + "step": 25615 + }, + { + "epoch": 0.77, + "learning_rate": 6.529320923984625e-07, + "loss": 1.0915, + "step": 25616 + }, + { + "epoch": 0.77, + "learning_rate": 6.527677246980621e-07, + "loss": 1.0522, + "step": 25617 + }, + { + "epoch": 0.77, + "learning_rate": 6.526033745824231e-07, + "loss": 1.1686, + "step": 25618 + }, + { + "epoch": 0.77, + "learning_rate": 6.524390420531112e-07, + "loss": 1.1359, + "step": 25619 + }, + { + "epoch": 0.77, + "learning_rate": 6.522747271116891e-07, + "loss": 1.101, + "step": 25620 + }, + { + "epoch": 0.77, + "learning_rate": 6.521104297597216e-07, + "loss": 1.1119, + "step": 25621 + }, + { + "epoch": 0.77, + "learning_rate": 6.519461499987728e-07, + "loss": 1.1544, + "step": 25622 + }, + { + "epoch": 0.77, + "learning_rate": 6.517818878304066e-07, + "loss": 1.0468, + "step": 25623 + }, + { + "epoch": 0.77, + "learning_rate": 6.516176432561869e-07, + "loss": 1.1111, + "step": 25624 + }, + { + "epoch": 0.77, + "learning_rate": 6.51453416277677e-07, + "loss": 1.199, + "step": 25625 + }, + { + "epoch": 0.77, + "learning_rate": 6.512892068964399e-07, + "loss": 1.0513, + "step": 25626 + }, + { + "epoch": 0.77, + "learning_rate": 6.511250151140396e-07, + "loss": 1.1151, + "step": 25627 + }, + { + "epoch": 0.77, + "learning_rate": 6.509608409320392e-07, + "loss": 1.0611, + "step": 25628 + }, + { + "epoch": 0.77, + "learning_rate": 6.507966843520005e-07, + "loss": 1.0931, + "step": 25629 + }, + { + "epoch": 0.77, + "learning_rate": 6.506325453754866e-07, + "loss": 1.1722, + "step": 25630 + }, + { + "epoch": 0.77, + "learning_rate": 6.504684240040604e-07, + "loss": 1.1625, + "step": 25631 + }, + { + "epoch": 0.77, + "learning_rate": 6.503043202392844e-07, + "loss": 1.0297, + "step": 25632 + }, + { + "epoch": 0.77, + "learning_rate": 6.5014023408272e-07, + "loss": 1.0748, + "step": 25633 + }, + { + "epoch": 0.77, + "learning_rate": 6.499761655359297e-07, + "loss": 1.0684, + "step": 25634 + }, + { + "epoch": 0.77, + "learning_rate": 6.498121146004751e-07, + "loss": 1.1367, + "step": 25635 + }, + { + "epoch": 0.77, + "learning_rate": 6.496480812779182e-07, + "loss": 1.1837, + "step": 25636 + }, + { + "epoch": 0.77, + "learning_rate": 6.494840655698212e-07, + "loss": 1.1636, + "step": 25637 + }, + { + "epoch": 0.77, + "learning_rate": 6.493200674777437e-07, + "loss": 1.1538, + "step": 25638 + }, + { + "epoch": 0.77, + "learning_rate": 6.491560870032479e-07, + "loss": 1.0843, + "step": 25639 + }, + { + "epoch": 0.77, + "learning_rate": 6.48992124147895e-07, + "loss": 1.0385, + "step": 25640 + }, + { + "epoch": 0.77, + "learning_rate": 6.488281789132461e-07, + "loss": 1.1432, + "step": 25641 + }, + { + "epoch": 0.77, + "learning_rate": 6.486642513008607e-07, + "loss": 1.1315, + "step": 25642 + }, + { + "epoch": 0.77, + "learning_rate": 6.485003413123001e-07, + "loss": 1.1052, + "step": 25643 + }, + { + "epoch": 0.77, + "learning_rate": 6.483364489491242e-07, + "loss": 1.0507, + "step": 25644 + }, + { + "epoch": 0.77, + "learning_rate": 6.481725742128947e-07, + "loss": 1.0889, + "step": 25645 + }, + { + "epoch": 0.77, + "learning_rate": 6.480087171051694e-07, + "loss": 1.1166, + "step": 25646 + }, + { + "epoch": 0.77, + "learning_rate": 6.478448776275092e-07, + "loss": 1.1154, + "step": 25647 + }, + { + "epoch": 0.77, + "learning_rate": 6.476810557814736e-07, + "loss": 1.1598, + "step": 25648 + }, + { + "epoch": 0.77, + "learning_rate": 6.475172515686226e-07, + "loss": 1.0765, + "step": 25649 + }, + { + "epoch": 0.77, + "learning_rate": 6.47353464990515e-07, + "loss": 1.1215, + "step": 25650 + }, + { + "epoch": 0.77, + "learning_rate": 6.471896960487109e-07, + "loss": 1.0873, + "step": 25651 + }, + { + "epoch": 0.77, + "learning_rate": 6.470259447447677e-07, + "loss": 1.0635, + "step": 25652 + }, + { + "epoch": 0.77, + "learning_rate": 6.468622110802453e-07, + "loss": 1.0634, + "step": 25653 + }, + { + "epoch": 0.77, + "learning_rate": 6.466984950567018e-07, + "loss": 1.1729, + "step": 25654 + }, + { + "epoch": 0.77, + "learning_rate": 6.465347966756963e-07, + "loss": 1.1404, + "step": 25655 + }, + { + "epoch": 0.77, + "learning_rate": 6.46371115938787e-07, + "loss": 1.152, + "step": 25656 + }, + { + "epoch": 0.77, + "learning_rate": 6.462074528475318e-07, + "loss": 1.0739, + "step": 25657 + }, + { + "epoch": 0.77, + "learning_rate": 6.460438074034895e-07, + "loss": 1.0476, + "step": 25658 + }, + { + "epoch": 0.77, + "learning_rate": 6.458801796082165e-07, + "loss": 1.0533, + "step": 25659 + }, + { + "epoch": 0.77, + "learning_rate": 6.457165694632714e-07, + "loss": 1.0353, + "step": 25660 + }, + { + "epoch": 0.77, + "learning_rate": 6.455529769702112e-07, + "loss": 1.2949, + "step": 25661 + }, + { + "epoch": 0.77, + "learning_rate": 6.453894021305937e-07, + "loss": 1.0638, + "step": 25662 + }, + { + "epoch": 0.77, + "learning_rate": 6.452258449459767e-07, + "loss": 1.0716, + "step": 25663 + }, + { + "epoch": 0.77, + "learning_rate": 6.450623054179156e-07, + "loss": 1.0917, + "step": 25664 + }, + { + "epoch": 0.77, + "learning_rate": 6.44898783547968e-07, + "loss": 1.0451, + "step": 25665 + }, + { + "epoch": 0.77, + "learning_rate": 6.447352793376905e-07, + "loss": 1.0757, + "step": 25666 + }, + { + "epoch": 0.77, + "learning_rate": 6.445717927886402e-07, + "loss": 1.1619, + "step": 25667 + }, + { + "epoch": 0.77, + "learning_rate": 6.444083239023724e-07, + "loss": 1.1961, + "step": 25668 + }, + { + "epoch": 0.77, + "learning_rate": 6.442448726804434e-07, + "loss": 1.1157, + "step": 25669 + }, + { + "epoch": 0.77, + "learning_rate": 6.440814391244097e-07, + "loss": 1.0001, + "step": 25670 + }, + { + "epoch": 0.77, + "learning_rate": 6.439180232358272e-07, + "loss": 1.0298, + "step": 25671 + }, + { + "epoch": 0.77, + "learning_rate": 6.437546250162508e-07, + "loss": 1.0765, + "step": 25672 + }, + { + "epoch": 0.77, + "learning_rate": 6.435912444672363e-07, + "loss": 1.0137, + "step": 25673 + }, + { + "epoch": 0.77, + "learning_rate": 6.434278815903392e-07, + "loss": 1.1285, + "step": 25674 + }, + { + "epoch": 0.77, + "learning_rate": 6.432645363871143e-07, + "loss": 1.1197, + "step": 25675 + }, + { + "epoch": 0.77, + "learning_rate": 6.431012088591173e-07, + "loss": 1.0876, + "step": 25676 + }, + { + "epoch": 0.77, + "learning_rate": 6.429378990079021e-07, + "loss": 1.0276, + "step": 25677 + }, + { + "epoch": 0.77, + "learning_rate": 6.427746068350238e-07, + "loss": 1.0644, + "step": 25678 + }, + { + "epoch": 0.77, + "learning_rate": 6.426113323420366e-07, + "loss": 1.0793, + "step": 25679 + }, + { + "epoch": 0.77, + "learning_rate": 6.424480755304949e-07, + "loss": 1.0209, + "step": 25680 + }, + { + "epoch": 0.77, + "learning_rate": 6.422848364019529e-07, + "loss": 1.0374, + "step": 25681 + }, + { + "epoch": 0.77, + "learning_rate": 6.421216149579645e-07, + "loss": 1.0328, + "step": 25682 + }, + { + "epoch": 0.77, + "learning_rate": 6.419584112000838e-07, + "loss": 1.0605, + "step": 25683 + }, + { + "epoch": 0.77, + "learning_rate": 6.417952251298648e-07, + "loss": 1.0743, + "step": 25684 + }, + { + "epoch": 0.77, + "learning_rate": 6.416320567488596e-07, + "loss": 1.1523, + "step": 25685 + }, + { + "epoch": 0.77, + "learning_rate": 6.414689060586221e-07, + "loss": 1.0688, + "step": 25686 + }, + { + "epoch": 0.77, + "learning_rate": 6.413057730607056e-07, + "loss": 1.171, + "step": 25687 + }, + { + "epoch": 0.77, + "learning_rate": 6.411426577566629e-07, + "loss": 1.0568, + "step": 25688 + }, + { + "epoch": 0.77, + "learning_rate": 6.409795601480475e-07, + "loss": 1.0768, + "step": 25689 + }, + { + "epoch": 0.77, + "learning_rate": 6.408164802364105e-07, + "loss": 1.1361, + "step": 25690 + }, + { + "epoch": 0.77, + "learning_rate": 6.406534180233057e-07, + "loss": 1.0474, + "step": 25691 + }, + { + "epoch": 0.77, + "learning_rate": 6.404903735102844e-07, + "loss": 1.2344, + "step": 25692 + }, + { + "epoch": 0.77, + "learning_rate": 6.403273466989001e-07, + "loss": 1.0212, + "step": 25693 + }, + { + "epoch": 0.77, + "learning_rate": 6.401643375907029e-07, + "loss": 1.0047, + "step": 25694 + }, + { + "epoch": 0.77, + "learning_rate": 6.400013461872457e-07, + "loss": 1.0799, + "step": 25695 + }, + { + "epoch": 0.77, + "learning_rate": 6.398383724900798e-07, + "loss": 1.1565, + "step": 25696 + }, + { + "epoch": 0.77, + "learning_rate": 6.396754165007577e-07, + "loss": 1.1376, + "step": 25697 + }, + { + "epoch": 0.77, + "learning_rate": 6.395124782208284e-07, + "loss": 1.1234, + "step": 25698 + }, + { + "epoch": 0.77, + "learning_rate": 6.393495576518446e-07, + "loss": 1.0785, + "step": 25699 + }, + { + "epoch": 0.77, + "learning_rate": 6.391866547953568e-07, + "loss": 1.1001, + "step": 25700 + }, + { + "epoch": 0.77, + "learning_rate": 6.390237696529162e-07, + "loss": 1.1578, + "step": 25701 + }, + { + "epoch": 0.77, + "learning_rate": 6.388609022260733e-07, + "loss": 1.0087, + "step": 25702 + }, + { + "epoch": 0.77, + "learning_rate": 6.386980525163777e-07, + "loss": 1.1346, + "step": 25703 + }, + { + "epoch": 0.77, + "learning_rate": 6.3853522052538e-07, + "loss": 1.0936, + "step": 25704 + }, + { + "epoch": 0.77, + "learning_rate": 6.38372406254631e-07, + "loss": 1.1265, + "step": 25705 + }, + { + "epoch": 0.77, + "learning_rate": 6.382096097056795e-07, + "loss": 1.159, + "step": 25706 + }, + { + "epoch": 0.77, + "learning_rate": 6.380468308800764e-07, + "loss": 1.0955, + "step": 25707 + }, + { + "epoch": 0.77, + "learning_rate": 6.378840697793703e-07, + "loss": 1.0934, + "step": 25708 + }, + { + "epoch": 0.77, + "learning_rate": 6.37721326405111e-07, + "loss": 1.0905, + "step": 25709 + }, + { + "epoch": 0.77, + "learning_rate": 6.375586007588489e-07, + "loss": 1.1417, + "step": 25710 + }, + { + "epoch": 0.77, + "learning_rate": 6.373958928421309e-07, + "loss": 1.1105, + "step": 25711 + }, + { + "epoch": 0.77, + "learning_rate": 6.37233202656507e-07, + "loss": 1.1376, + "step": 25712 + }, + { + "epoch": 0.77, + "learning_rate": 6.37070530203526e-07, + "loss": 1.0771, + "step": 25713 + }, + { + "epoch": 0.77, + "learning_rate": 6.369078754847361e-07, + "loss": 1.1614, + "step": 25714 + }, + { + "epoch": 0.77, + "learning_rate": 6.367452385016868e-07, + "loss": 1.0914, + "step": 25715 + }, + { + "epoch": 0.77, + "learning_rate": 6.365826192559249e-07, + "loss": 1.1426, + "step": 25716 + }, + { + "epoch": 0.77, + "learning_rate": 6.364200177489988e-07, + "loss": 1.0805, + "step": 25717 + }, + { + "epoch": 0.77, + "learning_rate": 6.362574339824565e-07, + "loss": 1.1544, + "step": 25718 + }, + { + "epoch": 0.77, + "learning_rate": 6.360948679578466e-07, + "loss": 1.1066, + "step": 25719 + }, + { + "epoch": 0.77, + "learning_rate": 6.359323196767153e-07, + "loss": 1.0936, + "step": 25720 + }, + { + "epoch": 0.77, + "learning_rate": 6.357697891406107e-07, + "loss": 1.0234, + "step": 25721 + }, + { + "epoch": 0.77, + "learning_rate": 6.356072763510795e-07, + "loss": 1.0993, + "step": 25722 + }, + { + "epoch": 0.77, + "learning_rate": 6.354447813096697e-07, + "loss": 1.1862, + "step": 25723 + }, + { + "epoch": 0.77, + "learning_rate": 6.352823040179273e-07, + "loss": 1.0256, + "step": 25724 + }, + { + "epoch": 0.77, + "learning_rate": 6.351198444773993e-07, + "loss": 1.226, + "step": 25725 + }, + { + "epoch": 0.77, + "learning_rate": 6.349574026896319e-07, + "loss": 1.123, + "step": 25726 + }, + { + "epoch": 0.78, + "learning_rate": 6.347949786561719e-07, + "loss": 0.9713, + "step": 25727 + }, + { + "epoch": 0.78, + "learning_rate": 6.346325723785663e-07, + "loss": 1.1149, + "step": 25728 + }, + { + "epoch": 0.78, + "learning_rate": 6.344701838583592e-07, + "loss": 1.2074, + "step": 25729 + }, + { + "epoch": 0.78, + "learning_rate": 6.343078130970976e-07, + "loss": 1.0486, + "step": 25730 + }, + { + "epoch": 0.78, + "learning_rate": 6.341454600963271e-07, + "loss": 1.077, + "step": 25731 + }, + { + "epoch": 0.78, + "learning_rate": 6.339831248575931e-07, + "loss": 1.1266, + "step": 25732 + }, + { + "epoch": 0.78, + "learning_rate": 6.33820807382442e-07, + "loss": 1.0297, + "step": 25733 + }, + { + "epoch": 0.78, + "learning_rate": 6.336585076724169e-07, + "loss": 1.1088, + "step": 25734 + }, + { + "epoch": 0.78, + "learning_rate": 6.334962257290645e-07, + "loss": 1.2001, + "step": 25735 + }, + { + "epoch": 0.78, + "learning_rate": 6.333339615539285e-07, + "loss": 1.1266, + "step": 25736 + }, + { + "epoch": 0.78, + "learning_rate": 6.331717151485545e-07, + "loss": 1.2826, + "step": 25737 + }, + { + "epoch": 0.78, + "learning_rate": 6.330094865144868e-07, + "loss": 1.2742, + "step": 25738 + }, + { + "epoch": 0.78, + "learning_rate": 6.328472756532695e-07, + "loss": 1.1186, + "step": 25739 + }, + { + "epoch": 0.78, + "learning_rate": 6.326850825664466e-07, + "loss": 0.9572, + "step": 25740 + }, + { + "epoch": 0.78, + "learning_rate": 6.325229072555634e-07, + "loss": 1.0989, + "step": 25741 + }, + { + "epoch": 0.78, + "learning_rate": 6.323607497221621e-07, + "loss": 1.2629, + "step": 25742 + }, + { + "epoch": 0.78, + "learning_rate": 6.321986099677868e-07, + "loss": 1.201, + "step": 25743 + }, + { + "epoch": 0.78, + "learning_rate": 6.320364879939811e-07, + "loss": 1.1412, + "step": 25744 + }, + { + "epoch": 0.78, + "learning_rate": 6.318743838022892e-07, + "loss": 1.1494, + "step": 25745 + }, + { + "epoch": 0.78, + "learning_rate": 6.317122973942527e-07, + "loss": 1.1309, + "step": 25746 + }, + { + "epoch": 0.78, + "learning_rate": 6.315502287714153e-07, + "loss": 1.1136, + "step": 25747 + }, + { + "epoch": 0.78, + "learning_rate": 6.313881779353198e-07, + "loss": 0.9915, + "step": 25748 + }, + { + "epoch": 0.78, + "learning_rate": 6.312261448875099e-07, + "loss": 1.1429, + "step": 25749 + }, + { + "epoch": 0.78, + "learning_rate": 6.310641296295261e-07, + "loss": 1.017, + "step": 25750 + }, + { + "epoch": 0.78, + "learning_rate": 6.309021321629116e-07, + "loss": 1.1356, + "step": 25751 + }, + { + "epoch": 0.78, + "learning_rate": 6.30740152489209e-07, + "loss": 1.0939, + "step": 25752 + }, + { + "epoch": 0.78, + "learning_rate": 6.305781906099603e-07, + "loss": 1.1353, + "step": 25753 + }, + { + "epoch": 0.78, + "learning_rate": 6.30416246526706e-07, + "loss": 1.1011, + "step": 25754 + }, + { + "epoch": 0.78, + "learning_rate": 6.302543202409888e-07, + "loss": 1.068, + "step": 25755 + }, + { + "epoch": 0.78, + "learning_rate": 6.300924117543503e-07, + "loss": 1.1882, + "step": 25756 + }, + { + "epoch": 0.78, + "learning_rate": 6.29930521068331e-07, + "loss": 1.0523, + "step": 25757 + }, + { + "epoch": 0.78, + "learning_rate": 6.297686481844734e-07, + "loss": 1.0938, + "step": 25758 + }, + { + "epoch": 0.78, + "learning_rate": 6.296067931043168e-07, + "loss": 1.0439, + "step": 25759 + }, + { + "epoch": 0.78, + "learning_rate": 6.294449558294028e-07, + "loss": 1.0481, + "step": 25760 + }, + { + "epoch": 0.78, + "learning_rate": 6.292831363612717e-07, + "loss": 1.0681, + "step": 25761 + }, + { + "epoch": 0.78, + "learning_rate": 6.291213347014641e-07, + "loss": 1.1212, + "step": 25762 + }, + { + "epoch": 0.78, + "learning_rate": 6.289595508515206e-07, + "loss": 1.0913, + "step": 25763 + }, + { + "epoch": 0.78, + "learning_rate": 6.287977848129812e-07, + "loss": 1.0662, + "step": 25764 + }, + { + "epoch": 0.78, + "learning_rate": 6.286360365873853e-07, + "loss": 1.0625, + "step": 25765 + }, + { + "epoch": 0.78, + "learning_rate": 6.284743061762741e-07, + "loss": 1.1855, + "step": 25766 + }, + { + "epoch": 0.78, + "learning_rate": 6.283125935811851e-07, + "loss": 1.1253, + "step": 25767 + }, + { + "epoch": 0.78, + "learning_rate": 6.281508988036589e-07, + "loss": 1.1608, + "step": 25768 + }, + { + "epoch": 0.78, + "learning_rate": 6.279892218452346e-07, + "loss": 1.0828, + "step": 25769 + }, + { + "epoch": 0.78, + "learning_rate": 6.278275627074515e-07, + "loss": 1.1105, + "step": 25770 + }, + { + "epoch": 0.78, + "learning_rate": 6.27665921391849e-07, + "loss": 1.0607, + "step": 25771 + }, + { + "epoch": 0.78, + "learning_rate": 6.275042978999643e-07, + "loss": 0.9916, + "step": 25772 + }, + { + "epoch": 0.78, + "learning_rate": 6.27342692233337e-07, + "loss": 1.1055, + "step": 25773 + }, + { + "epoch": 0.78, + "learning_rate": 6.271811043935055e-07, + "loss": 1.171, + "step": 25774 + }, + { + "epoch": 0.78, + "learning_rate": 6.270195343820085e-07, + "loss": 1.1201, + "step": 25775 + }, + { + "epoch": 0.78, + "learning_rate": 6.268579822003826e-07, + "loss": 1.2386, + "step": 25776 + }, + { + "epoch": 0.78, + "learning_rate": 6.266964478501666e-07, + "loss": 1.014, + "step": 25777 + }, + { + "epoch": 0.78, + "learning_rate": 6.265349313328984e-07, + "loss": 1.1761, + "step": 25778 + }, + { + "epoch": 0.78, + "learning_rate": 6.263734326501161e-07, + "loss": 1.1044, + "step": 25779 + }, + { + "epoch": 0.78, + "learning_rate": 6.262119518033555e-07, + "loss": 1.2234, + "step": 25780 + }, + { + "epoch": 0.78, + "learning_rate": 6.260504887941546e-07, + "loss": 1.0886, + "step": 25781 + }, + { + "epoch": 0.78, + "learning_rate": 6.258890436240505e-07, + "loss": 1.142, + "step": 25782 + }, + { + "epoch": 0.78, + "learning_rate": 6.257276162945802e-07, + "loss": 1.0905, + "step": 25783 + }, + { + "epoch": 0.78, + "learning_rate": 6.255662068072813e-07, + "loss": 1.0086, + "step": 25784 + }, + { + "epoch": 0.78, + "learning_rate": 6.254048151636882e-07, + "loss": 1.0783, + "step": 25785 + }, + { + "epoch": 0.78, + "learning_rate": 6.252434413653385e-07, + "loss": 1.1701, + "step": 25786 + }, + { + "epoch": 0.78, + "learning_rate": 6.250820854137685e-07, + "loss": 1.1003, + "step": 25787 + }, + { + "epoch": 0.78, + "learning_rate": 6.24920747310514e-07, + "loss": 1.1194, + "step": 25788 + }, + { + "epoch": 0.78, + "learning_rate": 6.247594270571108e-07, + "loss": 1.1495, + "step": 25789 + }, + { + "epoch": 0.78, + "learning_rate": 6.245981246550947e-07, + "loss": 1.0508, + "step": 25790 + }, + { + "epoch": 0.78, + "learning_rate": 6.244368401060013e-07, + "loss": 1.0859, + "step": 25791 + }, + { + "epoch": 0.78, + "learning_rate": 6.242755734113667e-07, + "loss": 1.0804, + "step": 25792 + }, + { + "epoch": 0.78, + "learning_rate": 6.241143245727247e-07, + "loss": 1.1221, + "step": 25793 + }, + { + "epoch": 0.78, + "learning_rate": 6.239530935916104e-07, + "loss": 1.0278, + "step": 25794 + }, + { + "epoch": 0.78, + "learning_rate": 6.237918804695594e-07, + "loss": 1.1375, + "step": 25795 + }, + { + "epoch": 0.78, + "learning_rate": 6.236306852081061e-07, + "loss": 1.0714, + "step": 25796 + }, + { + "epoch": 0.78, + "learning_rate": 6.234695078087858e-07, + "loss": 1.0688, + "step": 25797 + }, + { + "epoch": 0.78, + "learning_rate": 6.233083482731309e-07, + "loss": 1.1301, + "step": 25798 + }, + { + "epoch": 0.78, + "learning_rate": 6.23147206602677e-07, + "loss": 1.2412, + "step": 25799 + }, + { + "epoch": 0.78, + "learning_rate": 6.229860827989576e-07, + "loss": 1.3323, + "step": 25800 + }, + { + "epoch": 0.78, + "learning_rate": 6.228249768635075e-07, + "loss": 1.115, + "step": 25801 + }, + { + "epoch": 0.78, + "learning_rate": 6.226638887978589e-07, + "loss": 1.1295, + "step": 25802 + }, + { + "epoch": 0.78, + "learning_rate": 6.225028186035458e-07, + "loss": 1.0023, + "step": 25803 + }, + { + "epoch": 0.78, + "learning_rate": 6.223417662821018e-07, + "loss": 1.0391, + "step": 25804 + }, + { + "epoch": 0.78, + "learning_rate": 6.221807318350604e-07, + "loss": 1.192, + "step": 25805 + }, + { + "epoch": 0.78, + "learning_rate": 6.220197152639534e-07, + "loss": 1.139, + "step": 25806 + }, + { + "epoch": 0.78, + "learning_rate": 6.218587165703142e-07, + "loss": 1.0787, + "step": 25807 + }, + { + "epoch": 0.78, + "learning_rate": 6.216977357556755e-07, + "loss": 1.1838, + "step": 25808 + }, + { + "epoch": 0.78, + "learning_rate": 6.215367728215698e-07, + "loss": 1.1594, + "step": 25809 + }, + { + "epoch": 0.78, + "learning_rate": 6.2137582776953e-07, + "loss": 1.0472, + "step": 25810 + }, + { + "epoch": 0.78, + "learning_rate": 6.212149006010868e-07, + "loss": 1.0398, + "step": 25811 + }, + { + "epoch": 0.78, + "learning_rate": 6.210539913177729e-07, + "loss": 1.0479, + "step": 25812 + }, + { + "epoch": 0.78, + "learning_rate": 6.208930999211202e-07, + "loss": 1.0859, + "step": 25813 + }, + { + "epoch": 0.78, + "learning_rate": 6.2073222641266e-07, + "loss": 1.0715, + "step": 25814 + }, + { + "epoch": 0.78, + "learning_rate": 6.205713707939246e-07, + "loss": 1.1612, + "step": 25815 + }, + { + "epoch": 0.78, + "learning_rate": 6.204105330664439e-07, + "loss": 1.0305, + "step": 25816 + }, + { + "epoch": 0.78, + "learning_rate": 6.202497132317497e-07, + "loss": 1.0942, + "step": 25817 + }, + { + "epoch": 0.78, + "learning_rate": 6.20088911291373e-07, + "loss": 1.2167, + "step": 25818 + }, + { + "epoch": 0.78, + "learning_rate": 6.199281272468446e-07, + "loss": 1.0231, + "step": 25819 + }, + { + "epoch": 0.78, + "learning_rate": 6.197673610996946e-07, + "loss": 1.0912, + "step": 25820 + }, + { + "epoch": 0.78, + "learning_rate": 6.196066128514542e-07, + "loss": 1.04, + "step": 25821 + }, + { + "epoch": 0.78, + "learning_rate": 6.194458825036528e-07, + "loss": 1.0959, + "step": 25822 + }, + { + "epoch": 0.78, + "learning_rate": 6.192851700578218e-07, + "loss": 1.2057, + "step": 25823 + }, + { + "epoch": 0.78, + "learning_rate": 6.191244755154896e-07, + "loss": 1.1265, + "step": 25824 + }, + { + "epoch": 0.78, + "learning_rate": 6.189637988781863e-07, + "loss": 1.0633, + "step": 25825 + }, + { + "epoch": 0.78, + "learning_rate": 6.188031401474417e-07, + "loss": 1.1176, + "step": 25826 + }, + { + "epoch": 0.78, + "learning_rate": 6.186424993247861e-07, + "loss": 1.0873, + "step": 25827 + }, + { + "epoch": 0.78, + "learning_rate": 6.18481876411747e-07, + "loss": 1.1015, + "step": 25828 + }, + { + "epoch": 0.78, + "learning_rate": 6.183212714098541e-07, + "loss": 1.1682, + "step": 25829 + }, + { + "epoch": 0.78, + "learning_rate": 6.181606843206367e-07, + "loss": 1.045, + "step": 25830 + }, + { + "epoch": 0.78, + "learning_rate": 6.180001151456239e-07, + "loss": 1.1589, + "step": 25831 + }, + { + "epoch": 0.78, + "learning_rate": 6.17839563886343e-07, + "loss": 1.1059, + "step": 25832 + }, + { + "epoch": 0.78, + "learning_rate": 6.176790305443228e-07, + "loss": 1.0485, + "step": 25833 + }, + { + "epoch": 0.78, + "learning_rate": 6.175185151210917e-07, + "loss": 1.0226, + "step": 25834 + }, + { + "epoch": 0.78, + "learning_rate": 6.173580176181776e-07, + "loss": 1.0142, + "step": 25835 + }, + { + "epoch": 0.78, + "learning_rate": 6.171975380371092e-07, + "loss": 1.2344, + "step": 25836 + }, + { + "epoch": 0.78, + "learning_rate": 6.170370763794132e-07, + "loss": 1.1655, + "step": 25837 + }, + { + "epoch": 0.78, + "learning_rate": 6.168766326466169e-07, + "loss": 1.0631, + "step": 25838 + }, + { + "epoch": 0.78, + "learning_rate": 6.16716206840248e-07, + "loss": 1.0297, + "step": 25839 + }, + { + "epoch": 0.78, + "learning_rate": 6.165557989618348e-07, + "loss": 1.0469, + "step": 25840 + }, + { + "epoch": 0.78, + "learning_rate": 6.163954090129027e-07, + "loss": 1.1173, + "step": 25841 + }, + { + "epoch": 0.78, + "learning_rate": 6.162350369949787e-07, + "loss": 1.1714, + "step": 25842 + }, + { + "epoch": 0.78, + "learning_rate": 6.160746829095901e-07, + "loss": 1.0473, + "step": 25843 + }, + { + "epoch": 0.78, + "learning_rate": 6.159143467582632e-07, + "loss": 1.0911, + "step": 25844 + }, + { + "epoch": 0.78, + "learning_rate": 6.157540285425243e-07, + "loss": 1.1563, + "step": 25845 + }, + { + "epoch": 0.78, + "learning_rate": 6.155937282638997e-07, + "loss": 1.04, + "step": 25846 + }, + { + "epoch": 0.78, + "learning_rate": 6.15433445923915e-07, + "loss": 1.1257, + "step": 25847 + }, + { + "epoch": 0.78, + "learning_rate": 6.152731815240964e-07, + "loss": 1.0673, + "step": 25848 + }, + { + "epoch": 0.78, + "learning_rate": 6.151129350659702e-07, + "loss": 1.1441, + "step": 25849 + }, + { + "epoch": 0.78, + "learning_rate": 6.149527065510602e-07, + "loss": 1.1205, + "step": 25850 + }, + { + "epoch": 0.78, + "learning_rate": 6.147924959808926e-07, + "loss": 1.1669, + "step": 25851 + }, + { + "epoch": 0.78, + "learning_rate": 6.146323033569926e-07, + "loss": 0.9853, + "step": 25852 + }, + { + "epoch": 0.78, + "learning_rate": 6.144721286808855e-07, + "loss": 1.0356, + "step": 25853 + }, + { + "epoch": 0.78, + "learning_rate": 6.143119719540952e-07, + "loss": 1.2151, + "step": 25854 + }, + { + "epoch": 0.78, + "learning_rate": 6.141518331781465e-07, + "loss": 1.1058, + "step": 25855 + }, + { + "epoch": 0.78, + "learning_rate": 6.139917123545644e-07, + "loss": 1.1956, + "step": 25856 + }, + { + "epoch": 0.78, + "learning_rate": 6.138316094848734e-07, + "loss": 1.1328, + "step": 25857 + }, + { + "epoch": 0.78, + "learning_rate": 6.136715245705962e-07, + "loss": 1.0716, + "step": 25858 + }, + { + "epoch": 0.78, + "learning_rate": 6.135114576132578e-07, + "loss": 1.0956, + "step": 25859 + }, + { + "epoch": 0.78, + "learning_rate": 6.133514086143818e-07, + "loss": 1.0724, + "step": 25860 + }, + { + "epoch": 0.78, + "learning_rate": 6.131913775754916e-07, + "loss": 1.1198, + "step": 25861 + }, + { + "epoch": 0.78, + "learning_rate": 6.130313644981118e-07, + "loss": 1.0956, + "step": 25862 + }, + { + "epoch": 0.78, + "learning_rate": 6.128713693837634e-07, + "loss": 1.0813, + "step": 25863 + }, + { + "epoch": 0.78, + "learning_rate": 6.127113922339712e-07, + "loss": 1.1141, + "step": 25864 + }, + { + "epoch": 0.78, + "learning_rate": 6.125514330502572e-07, + "loss": 1.1245, + "step": 25865 + }, + { + "epoch": 0.78, + "learning_rate": 6.123914918341453e-07, + "loss": 1.0721, + "step": 25866 + }, + { + "epoch": 0.78, + "learning_rate": 6.122315685871566e-07, + "loss": 1.0533, + "step": 25867 + }, + { + "epoch": 0.78, + "learning_rate": 6.120716633108142e-07, + "loss": 1.1564, + "step": 25868 + }, + { + "epoch": 0.78, + "learning_rate": 6.119117760066406e-07, + "loss": 1.2524, + "step": 25869 + }, + { + "epoch": 0.78, + "learning_rate": 6.117519066761573e-07, + "loss": 1.0895, + "step": 25870 + }, + { + "epoch": 0.78, + "learning_rate": 6.115920553208865e-07, + "loss": 1.0918, + "step": 25871 + }, + { + "epoch": 0.78, + "learning_rate": 6.114322219423496e-07, + "loss": 1.0905, + "step": 25872 + }, + { + "epoch": 0.78, + "learning_rate": 6.112724065420686e-07, + "loss": 1.1071, + "step": 25873 + }, + { + "epoch": 0.78, + "learning_rate": 6.111126091215646e-07, + "loss": 1.1297, + "step": 25874 + }, + { + "epoch": 0.78, + "learning_rate": 6.109528296823597e-07, + "loss": 1.1851, + "step": 25875 + }, + { + "epoch": 0.78, + "learning_rate": 6.107930682259732e-07, + "loss": 1.1498, + "step": 25876 + }, + { + "epoch": 0.78, + "learning_rate": 6.106333247539268e-07, + "loss": 1.1038, + "step": 25877 + }, + { + "epoch": 0.78, + "learning_rate": 6.104735992677413e-07, + "loss": 0.971, + "step": 25878 + }, + { + "epoch": 0.78, + "learning_rate": 6.103138917689378e-07, + "loss": 1.192, + "step": 25879 + }, + { + "epoch": 0.78, + "learning_rate": 6.101542022590351e-07, + "loss": 1.2185, + "step": 25880 + }, + { + "epoch": 0.78, + "learning_rate": 6.099945307395544e-07, + "loss": 1.0319, + "step": 25881 + }, + { + "epoch": 0.78, + "learning_rate": 6.098348772120155e-07, + "loss": 1.0756, + "step": 25882 + }, + { + "epoch": 0.78, + "learning_rate": 6.09675241677939e-07, + "loss": 1.1411, + "step": 25883 + }, + { + "epoch": 0.78, + "learning_rate": 6.095156241388428e-07, + "loss": 0.9792, + "step": 25884 + }, + { + "epoch": 0.78, + "learning_rate": 6.093560245962473e-07, + "loss": 1.0338, + "step": 25885 + }, + { + "epoch": 0.78, + "learning_rate": 6.091964430516722e-07, + "loss": 1.1767, + "step": 25886 + }, + { + "epoch": 0.78, + "learning_rate": 6.090368795066362e-07, + "loss": 1.2087, + "step": 25887 + }, + { + "epoch": 0.78, + "learning_rate": 6.088773339626591e-07, + "loss": 1.0305, + "step": 25888 + }, + { + "epoch": 0.78, + "learning_rate": 6.087178064212585e-07, + "loss": 1.2272, + "step": 25889 + }, + { + "epoch": 0.78, + "learning_rate": 6.085582968839532e-07, + "loss": 0.9708, + "step": 25890 + }, + { + "epoch": 0.78, + "learning_rate": 6.083988053522621e-07, + "loss": 1.1332, + "step": 25891 + }, + { + "epoch": 0.78, + "learning_rate": 6.082393318277041e-07, + "loss": 1.1418, + "step": 25892 + }, + { + "epoch": 0.78, + "learning_rate": 6.080798763117957e-07, + "loss": 1.1729, + "step": 25893 + }, + { + "epoch": 0.78, + "learning_rate": 6.079204388060559e-07, + "loss": 1.0756, + "step": 25894 + }, + { + "epoch": 0.78, + "learning_rate": 6.07761019312002e-07, + "loss": 0.9913, + "step": 25895 + }, + { + "epoch": 0.78, + "learning_rate": 6.07601617831152e-07, + "loss": 1.1362, + "step": 25896 + }, + { + "epoch": 0.78, + "learning_rate": 6.074422343650232e-07, + "loss": 1.0371, + "step": 25897 + }, + { + "epoch": 0.78, + "learning_rate": 6.072828689151337e-07, + "loss": 1.0992, + "step": 25898 + }, + { + "epoch": 0.78, + "learning_rate": 6.071235214829988e-07, + "loss": 1.1859, + "step": 25899 + }, + { + "epoch": 0.78, + "learning_rate": 6.069641920701363e-07, + "loss": 1.1422, + "step": 25900 + }, + { + "epoch": 0.78, + "learning_rate": 6.06804880678063e-07, + "loss": 1.0961, + "step": 25901 + }, + { + "epoch": 0.78, + "learning_rate": 6.066455873082955e-07, + "loss": 1.06, + "step": 25902 + }, + { + "epoch": 0.78, + "learning_rate": 6.064863119623502e-07, + "loss": 1.104, + "step": 25903 + }, + { + "epoch": 0.78, + "learning_rate": 6.06327054641743e-07, + "loss": 1.1028, + "step": 25904 + }, + { + "epoch": 0.78, + "learning_rate": 6.061678153479914e-07, + "loss": 1.2064, + "step": 25905 + }, + { + "epoch": 0.78, + "learning_rate": 6.060085940826088e-07, + "loss": 1.0688, + "step": 25906 + }, + { + "epoch": 0.78, + "learning_rate": 6.058493908471128e-07, + "loss": 1.1351, + "step": 25907 + }, + { + "epoch": 0.78, + "learning_rate": 6.056902056430181e-07, + "loss": 1.1432, + "step": 25908 + }, + { + "epoch": 0.78, + "learning_rate": 6.055310384718408e-07, + "loss": 1.1159, + "step": 25909 + }, + { + "epoch": 0.78, + "learning_rate": 6.053718893350952e-07, + "loss": 1.1422, + "step": 25910 + }, + { + "epoch": 0.78, + "learning_rate": 6.052127582342965e-07, + "loss": 1.0759, + "step": 25911 + }, + { + "epoch": 0.78, + "learning_rate": 6.050536451709599e-07, + "loss": 1.1248, + "step": 25912 + }, + { + "epoch": 0.78, + "learning_rate": 6.048945501466e-07, + "loss": 1.1754, + "step": 25913 + }, + { + "epoch": 0.78, + "learning_rate": 6.047354731627319e-07, + "loss": 1.066, + "step": 25914 + }, + { + "epoch": 0.78, + "learning_rate": 6.045764142208685e-07, + "loss": 0.9431, + "step": 25915 + }, + { + "epoch": 0.78, + "learning_rate": 6.044173733225251e-07, + "loss": 0.9963, + "step": 25916 + }, + { + "epoch": 0.78, + "learning_rate": 6.042583504692152e-07, + "loss": 1.1232, + "step": 25917 + }, + { + "epoch": 0.78, + "learning_rate": 6.040993456624533e-07, + "loss": 0.9661, + "step": 25918 + }, + { + "epoch": 0.78, + "learning_rate": 6.039403589037521e-07, + "loss": 1.1103, + "step": 25919 + }, + { + "epoch": 0.78, + "learning_rate": 6.037813901946252e-07, + "loss": 1.0146, + "step": 25920 + }, + { + "epoch": 0.78, + "learning_rate": 6.036224395365864e-07, + "loss": 1.1989, + "step": 25921 + }, + { + "epoch": 0.78, + "learning_rate": 6.034635069311496e-07, + "loss": 1.198, + "step": 25922 + }, + { + "epoch": 0.78, + "learning_rate": 6.033045923798256e-07, + "loss": 1.1309, + "step": 25923 + }, + { + "epoch": 0.78, + "learning_rate": 6.031456958841286e-07, + "loss": 1.0716, + "step": 25924 + }, + { + "epoch": 0.78, + "learning_rate": 6.029868174455713e-07, + "loss": 1.0672, + "step": 25925 + }, + { + "epoch": 0.78, + "learning_rate": 6.028279570656657e-07, + "loss": 1.1073, + "step": 25926 + }, + { + "epoch": 0.78, + "learning_rate": 6.02669114745924e-07, + "loss": 1.2131, + "step": 25927 + }, + { + "epoch": 0.78, + "learning_rate": 6.025102904878588e-07, + "loss": 1.1324, + "step": 25928 + }, + { + "epoch": 0.78, + "learning_rate": 6.023514842929817e-07, + "loss": 1.0741, + "step": 25929 + }, + { + "epoch": 0.78, + "learning_rate": 6.021926961628044e-07, + "loss": 1.158, + "step": 25930 + }, + { + "epoch": 0.78, + "learning_rate": 6.020339260988395e-07, + "loss": 1.1228, + "step": 25931 + }, + { + "epoch": 0.78, + "learning_rate": 6.018751741025969e-07, + "loss": 1.0685, + "step": 25932 + }, + { + "epoch": 0.78, + "learning_rate": 6.017164401755882e-07, + "loss": 1.0591, + "step": 25933 + }, + { + "epoch": 0.78, + "learning_rate": 6.015577243193249e-07, + "loss": 1.1569, + "step": 25934 + }, + { + "epoch": 0.78, + "learning_rate": 6.013990265353187e-07, + "loss": 1.1447, + "step": 25935 + }, + { + "epoch": 0.78, + "learning_rate": 6.012403468250783e-07, + "loss": 1.1533, + "step": 25936 + }, + { + "epoch": 0.78, + "learning_rate": 6.010816851901155e-07, + "loss": 1.213, + "step": 25937 + }, + { + "epoch": 0.78, + "learning_rate": 6.009230416319403e-07, + "loss": 1.0702, + "step": 25938 + }, + { + "epoch": 0.78, + "learning_rate": 6.00764416152064e-07, + "loss": 1.0229, + "step": 25939 + }, + { + "epoch": 0.78, + "learning_rate": 6.00605808751995e-07, + "loss": 1.085, + "step": 25940 + }, + { + "epoch": 0.78, + "learning_rate": 6.004472194332439e-07, + "loss": 1.1147, + "step": 25941 + }, + { + "epoch": 0.78, + "learning_rate": 6.002886481973206e-07, + "loss": 1.3005, + "step": 25942 + }, + { + "epoch": 0.78, + "learning_rate": 6.001300950457343e-07, + "loss": 1.0934, + "step": 25943 + }, + { + "epoch": 0.78, + "learning_rate": 5.999715599799949e-07, + "loss": 1.2006, + "step": 25944 + }, + { + "epoch": 0.78, + "learning_rate": 5.998130430016108e-07, + "loss": 1.1932, + "step": 25945 + }, + { + "epoch": 0.78, + "learning_rate": 5.996545441120913e-07, + "loss": 0.9888, + "step": 25946 + }, + { + "epoch": 0.78, + "learning_rate": 5.994960633129454e-07, + "loss": 1.0964, + "step": 25947 + }, + { + "epoch": 0.78, + "learning_rate": 5.993376006056823e-07, + "loss": 1.0898, + "step": 25948 + }, + { + "epoch": 0.78, + "learning_rate": 5.991791559918092e-07, + "loss": 1.1793, + "step": 25949 + }, + { + "epoch": 0.78, + "learning_rate": 5.990207294728348e-07, + "loss": 1.1887, + "step": 25950 + }, + { + "epoch": 0.78, + "learning_rate": 5.988623210502678e-07, + "loss": 1.1487, + "step": 25951 + }, + { + "epoch": 0.78, + "learning_rate": 5.987039307256157e-07, + "loss": 1.0328, + "step": 25952 + }, + { + "epoch": 0.78, + "learning_rate": 5.985455585003866e-07, + "loss": 1.1907, + "step": 25953 + }, + { + "epoch": 0.78, + "learning_rate": 5.983872043760879e-07, + "loss": 1.0598, + "step": 25954 + }, + { + "epoch": 0.78, + "learning_rate": 5.982288683542273e-07, + "loss": 1.0385, + "step": 25955 + }, + { + "epoch": 0.78, + "learning_rate": 5.980705504363118e-07, + "loss": 1.059, + "step": 25956 + }, + { + "epoch": 0.78, + "learning_rate": 5.979122506238497e-07, + "loss": 1.1064, + "step": 25957 + }, + { + "epoch": 0.78, + "learning_rate": 5.977539689183459e-07, + "loss": 1.0421, + "step": 25958 + }, + { + "epoch": 0.78, + "learning_rate": 5.975957053213083e-07, + "loss": 1.0635, + "step": 25959 + }, + { + "epoch": 0.78, + "learning_rate": 5.974374598342431e-07, + "loss": 0.9929, + "step": 25960 + }, + { + "epoch": 0.78, + "learning_rate": 5.972792324586579e-07, + "loss": 1.1214, + "step": 25961 + }, + { + "epoch": 0.78, + "learning_rate": 5.971210231960572e-07, + "loss": 1.1207, + "step": 25962 + }, + { + "epoch": 0.78, + "learning_rate": 5.969628320479481e-07, + "loss": 1.0422, + "step": 25963 + }, + { + "epoch": 0.78, + "learning_rate": 5.96804659015836e-07, + "loss": 1.1382, + "step": 25964 + }, + { + "epoch": 0.78, + "learning_rate": 5.966465041012279e-07, + "loss": 1.1281, + "step": 25965 + }, + { + "epoch": 0.78, + "learning_rate": 5.964883673056277e-07, + "loss": 1.0511, + "step": 25966 + }, + { + "epoch": 0.78, + "learning_rate": 5.963302486305414e-07, + "loss": 1.1815, + "step": 25967 + }, + { + "epoch": 0.78, + "learning_rate": 5.961721480774743e-07, + "loss": 1.2411, + "step": 25968 + }, + { + "epoch": 0.78, + "learning_rate": 5.960140656479313e-07, + "loss": 1.1197, + "step": 25969 + }, + { + "epoch": 0.78, + "learning_rate": 5.958560013434183e-07, + "loss": 1.1265, + "step": 25970 + }, + { + "epoch": 0.78, + "learning_rate": 5.956979551654382e-07, + "loss": 1.1278, + "step": 25971 + }, + { + "epoch": 0.78, + "learning_rate": 5.955399271154966e-07, + "loss": 1.1201, + "step": 25972 + }, + { + "epoch": 0.78, + "learning_rate": 5.953819171950975e-07, + "loss": 0.9517, + "step": 25973 + }, + { + "epoch": 0.78, + "learning_rate": 5.952239254057463e-07, + "loss": 1.0478, + "step": 25974 + }, + { + "epoch": 0.78, + "learning_rate": 5.950659517489449e-07, + "loss": 1.1782, + "step": 25975 + }, + { + "epoch": 0.78, + "learning_rate": 5.949079962261984e-07, + "loss": 1.0281, + "step": 25976 + }, + { + "epoch": 0.78, + "learning_rate": 5.947500588390101e-07, + "loss": 1.1053, + "step": 25977 + }, + { + "epoch": 0.78, + "learning_rate": 5.945921395888837e-07, + "loss": 1.1217, + "step": 25978 + }, + { + "epoch": 0.78, + "learning_rate": 5.944342384773224e-07, + "loss": 0.989, + "step": 25979 + }, + { + "epoch": 0.78, + "learning_rate": 5.942763555058304e-07, + "loss": 1.1234, + "step": 25980 + }, + { + "epoch": 0.78, + "learning_rate": 5.941184906759087e-07, + "loss": 1.1093, + "step": 25981 + }, + { + "epoch": 0.78, + "learning_rate": 5.93960643989061e-07, + "loss": 1.0381, + "step": 25982 + }, + { + "epoch": 0.78, + "learning_rate": 5.938028154467901e-07, + "loss": 1.0372, + "step": 25983 + }, + { + "epoch": 0.78, + "learning_rate": 5.936450050505985e-07, + "loss": 0.9922, + "step": 25984 + }, + { + "epoch": 0.78, + "learning_rate": 5.934872128019881e-07, + "loss": 1.1133, + "step": 25985 + }, + { + "epoch": 0.78, + "learning_rate": 5.933294387024613e-07, + "loss": 1.186, + "step": 25986 + }, + { + "epoch": 0.78, + "learning_rate": 5.931716827535206e-07, + "loss": 1.1101, + "step": 25987 + }, + { + "epoch": 0.78, + "learning_rate": 5.930139449566663e-07, + "loss": 1.1495, + "step": 25988 + }, + { + "epoch": 0.78, + "learning_rate": 5.92856225313401e-07, + "loss": 1.0881, + "step": 25989 + }, + { + "epoch": 0.78, + "learning_rate": 5.926985238252259e-07, + "loss": 1.0665, + "step": 25990 + }, + { + "epoch": 0.78, + "learning_rate": 5.92540840493643e-07, + "loss": 1.0314, + "step": 25991 + }, + { + "epoch": 0.78, + "learning_rate": 5.92383175320152e-07, + "loss": 1.0735, + "step": 25992 + }, + { + "epoch": 0.78, + "learning_rate": 5.922255283062542e-07, + "loss": 1.2356, + "step": 25993 + }, + { + "epoch": 0.78, + "learning_rate": 5.920678994534507e-07, + "loss": 1.0327, + "step": 25994 + }, + { + "epoch": 0.78, + "learning_rate": 5.91910288763242e-07, + "loss": 1.1393, + "step": 25995 + }, + { + "epoch": 0.78, + "learning_rate": 5.917526962371289e-07, + "loss": 1.2061, + "step": 25996 + }, + { + "epoch": 0.78, + "learning_rate": 5.915951218766102e-07, + "loss": 1.1241, + "step": 25997 + }, + { + "epoch": 0.78, + "learning_rate": 5.914375656831872e-07, + "loss": 1.1635, + "step": 25998 + }, + { + "epoch": 0.78, + "learning_rate": 5.912800276583594e-07, + "loss": 1.1932, + "step": 25999 + }, + { + "epoch": 0.78, + "learning_rate": 5.91122507803627e-07, + "loss": 1.0845, + "step": 26000 + }, + { + "epoch": 0.78, + "learning_rate": 5.909650061204883e-07, + "loss": 1.1069, + "step": 26001 + }, + { + "epoch": 0.78, + "learning_rate": 5.908075226104432e-07, + "loss": 1.0489, + "step": 26002 + }, + { + "epoch": 0.78, + "learning_rate": 5.906500572749913e-07, + "loss": 1.1702, + "step": 26003 + }, + { + "epoch": 0.78, + "learning_rate": 5.904926101156316e-07, + "loss": 1.1844, + "step": 26004 + }, + { + "epoch": 0.78, + "learning_rate": 5.90335181133862e-07, + "loss": 1.1249, + "step": 26005 + }, + { + "epoch": 0.78, + "learning_rate": 5.90177770331182e-07, + "loss": 1.1841, + "step": 26006 + }, + { + "epoch": 0.78, + "learning_rate": 5.900203777090896e-07, + "loss": 1.0735, + "step": 26007 + }, + { + "epoch": 0.78, + "learning_rate": 5.898630032690833e-07, + "loss": 1.0126, + "step": 26008 + }, + { + "epoch": 0.78, + "learning_rate": 5.897056470126613e-07, + "loss": 1.1013, + "step": 26009 + }, + { + "epoch": 0.78, + "learning_rate": 5.895483089413217e-07, + "loss": 1.0939, + "step": 26010 + }, + { + "epoch": 0.78, + "learning_rate": 5.893909890565618e-07, + "loss": 1.1644, + "step": 26011 + }, + { + "epoch": 0.78, + "learning_rate": 5.892336873598798e-07, + "loss": 1.1602, + "step": 26012 + }, + { + "epoch": 0.78, + "learning_rate": 5.890764038527732e-07, + "loss": 1.0306, + "step": 26013 + }, + { + "epoch": 0.78, + "learning_rate": 5.889191385367385e-07, + "loss": 1.2174, + "step": 26014 + }, + { + "epoch": 0.78, + "learning_rate": 5.887618914132731e-07, + "loss": 1.0767, + "step": 26015 + }, + { + "epoch": 0.78, + "learning_rate": 5.88604662483874e-07, + "loss": 1.0765, + "step": 26016 + }, + { + "epoch": 0.78, + "learning_rate": 5.884474517500388e-07, + "loss": 1.2534, + "step": 26017 + }, + { + "epoch": 0.78, + "learning_rate": 5.882902592132622e-07, + "loss": 1.067, + "step": 26018 + }, + { + "epoch": 0.78, + "learning_rate": 5.881330848750419e-07, + "loss": 1.1066, + "step": 26019 + }, + { + "epoch": 0.78, + "learning_rate": 5.879759287368736e-07, + "loss": 1.0955, + "step": 26020 + }, + { + "epoch": 0.78, + "learning_rate": 5.878187908002538e-07, + "loss": 1.03, + "step": 26021 + }, + { + "epoch": 0.78, + "learning_rate": 5.876616710666788e-07, + "loss": 1.0365, + "step": 26022 + }, + { + "epoch": 0.78, + "learning_rate": 5.87504569537643e-07, + "loss": 1.1227, + "step": 26023 + }, + { + "epoch": 0.78, + "learning_rate": 5.873474862146425e-07, + "loss": 1.0478, + "step": 26024 + }, + { + "epoch": 0.78, + "learning_rate": 5.87190421099173e-07, + "loss": 0.9384, + "step": 26025 + }, + { + "epoch": 0.78, + "learning_rate": 5.870333741927301e-07, + "loss": 1.2007, + "step": 26026 + }, + { + "epoch": 0.78, + "learning_rate": 5.868763454968074e-07, + "loss": 1.0778, + "step": 26027 + }, + { + "epoch": 0.78, + "learning_rate": 5.867193350129003e-07, + "loss": 1.0749, + "step": 26028 + }, + { + "epoch": 0.78, + "learning_rate": 5.865623427425038e-07, + "loss": 1.1914, + "step": 26029 + }, + { + "epoch": 0.78, + "learning_rate": 5.864053686871129e-07, + "loss": 1.1295, + "step": 26030 + }, + { + "epoch": 0.78, + "learning_rate": 5.862484128482207e-07, + "loss": 1.178, + "step": 26031 + }, + { + "epoch": 0.78, + "learning_rate": 5.860914752273219e-07, + "loss": 1.1066, + "step": 26032 + }, + { + "epoch": 0.78, + "learning_rate": 5.859345558259106e-07, + "loss": 1.165, + "step": 26033 + }, + { + "epoch": 0.78, + "learning_rate": 5.857776546454802e-07, + "loss": 1.0042, + "step": 26034 + }, + { + "epoch": 0.78, + "learning_rate": 5.856207716875248e-07, + "loss": 1.1298, + "step": 26035 + }, + { + "epoch": 0.78, + "learning_rate": 5.854639069535376e-07, + "loss": 1.08, + "step": 26036 + }, + { + "epoch": 0.78, + "learning_rate": 5.85307060445012e-07, + "loss": 1.2631, + "step": 26037 + }, + { + "epoch": 0.78, + "learning_rate": 5.851502321634408e-07, + "loss": 1.0446, + "step": 26038 + }, + { + "epoch": 0.78, + "learning_rate": 5.849934221103182e-07, + "loss": 1.2104, + "step": 26039 + }, + { + "epoch": 0.78, + "learning_rate": 5.84836630287135e-07, + "loss": 1.0184, + "step": 26040 + }, + { + "epoch": 0.78, + "learning_rate": 5.846798566953848e-07, + "loss": 1.0602, + "step": 26041 + }, + { + "epoch": 0.78, + "learning_rate": 5.845231013365599e-07, + "loss": 1.0975, + "step": 26042 + }, + { + "epoch": 0.78, + "learning_rate": 5.843663642121533e-07, + "loss": 1.1318, + "step": 26043 + }, + { + "epoch": 0.78, + "learning_rate": 5.842096453236554e-07, + "loss": 1.0452, + "step": 26044 + }, + { + "epoch": 0.78, + "learning_rate": 5.840529446725593e-07, + "loss": 1.2138, + "step": 26045 + }, + { + "epoch": 0.78, + "learning_rate": 5.838962622603561e-07, + "loss": 1.0746, + "step": 26046 + }, + { + "epoch": 0.78, + "learning_rate": 5.83739598088538e-07, + "loss": 1.1271, + "step": 26047 + }, + { + "epoch": 0.78, + "learning_rate": 5.835829521585964e-07, + "loss": 1.1996, + "step": 26048 + }, + { + "epoch": 0.78, + "learning_rate": 5.834263244720217e-07, + "loss": 1.0549, + "step": 26049 + }, + { + "epoch": 0.78, + "learning_rate": 5.832697150303052e-07, + "loss": 0.9641, + "step": 26050 + }, + { + "epoch": 0.78, + "learning_rate": 5.831131238349378e-07, + "loss": 1.1328, + "step": 26051 + }, + { + "epoch": 0.78, + "learning_rate": 5.82956550887411e-07, + "loss": 1.0282, + "step": 26052 + }, + { + "epoch": 0.78, + "learning_rate": 5.827999961892139e-07, + "loss": 1.2624, + "step": 26053 + }, + { + "epoch": 0.78, + "learning_rate": 5.826434597418376e-07, + "loss": 1.0692, + "step": 26054 + }, + { + "epoch": 0.78, + "learning_rate": 5.824869415467718e-07, + "loss": 1.1051, + "step": 26055 + }, + { + "epoch": 0.78, + "learning_rate": 5.823304416055079e-07, + "loss": 1.1569, + "step": 26056 + }, + { + "epoch": 0.78, + "learning_rate": 5.821739599195337e-07, + "loss": 1.1078, + "step": 26057 + }, + { + "epoch": 0.78, + "learning_rate": 5.820174964903397e-07, + "loss": 1.1502, + "step": 26058 + }, + { + "epoch": 0.79, + "learning_rate": 5.818610513194156e-07, + "loss": 0.9613, + "step": 26059 + }, + { + "epoch": 0.79, + "learning_rate": 5.817046244082503e-07, + "loss": 1.1477, + "step": 26060 + }, + { + "epoch": 0.79, + "learning_rate": 5.815482157583333e-07, + "loss": 1.1564, + "step": 26061 + }, + { + "epoch": 0.79, + "learning_rate": 5.813918253711537e-07, + "loss": 1.1728, + "step": 26062 + }, + { + "epoch": 0.79, + "learning_rate": 5.812354532481995e-07, + "loss": 1.1133, + "step": 26063 + }, + { + "epoch": 0.79, + "learning_rate": 5.810790993909596e-07, + "loss": 1.1043, + "step": 26064 + }, + { + "epoch": 0.79, + "learning_rate": 5.809227638009224e-07, + "loss": 1.1418, + "step": 26065 + }, + { + "epoch": 0.79, + "learning_rate": 5.807664464795762e-07, + "loss": 1.0935, + "step": 26066 + }, + { + "epoch": 0.79, + "learning_rate": 5.80610147428409e-07, + "loss": 1.0887, + "step": 26067 + }, + { + "epoch": 0.79, + "learning_rate": 5.80453866648909e-07, + "loss": 0.9912, + "step": 26068 + }, + { + "epoch": 0.79, + "learning_rate": 5.802976041425645e-07, + "loss": 1.1503, + "step": 26069 + }, + { + "epoch": 0.79, + "learning_rate": 5.801413599108613e-07, + "loss": 1.1028, + "step": 26070 + }, + { + "epoch": 0.79, + "learning_rate": 5.799851339552878e-07, + "loss": 1.0447, + "step": 26071 + }, + { + "epoch": 0.79, + "learning_rate": 5.798289262773312e-07, + "loss": 1.0688, + "step": 26072 + }, + { + "epoch": 0.79, + "learning_rate": 5.796727368784782e-07, + "loss": 1.1498, + "step": 26073 + }, + { + "epoch": 0.79, + "learning_rate": 5.79516565760217e-07, + "loss": 1.2463, + "step": 26074 + }, + { + "epoch": 0.79, + "learning_rate": 5.793604129240321e-07, + "loss": 1.1503, + "step": 26075 + }, + { + "epoch": 0.79, + "learning_rate": 5.792042783714111e-07, + "loss": 1.1141, + "step": 26076 + }, + { + "epoch": 0.79, + "learning_rate": 5.790481621038405e-07, + "loss": 1.0234, + "step": 26077 + }, + { + "epoch": 0.79, + "learning_rate": 5.788920641228065e-07, + "loss": 1.1349, + "step": 26078 + }, + { + "epoch": 0.79, + "learning_rate": 5.787359844297946e-07, + "loss": 1.1393, + "step": 26079 + }, + { + "epoch": 0.79, + "learning_rate": 5.785799230262906e-07, + "loss": 1.1105, + "step": 26080 + }, + { + "epoch": 0.79, + "learning_rate": 5.784238799137804e-07, + "loss": 1.1648, + "step": 26081 + }, + { + "epoch": 0.79, + "learning_rate": 5.782678550937501e-07, + "loss": 1.0644, + "step": 26082 + }, + { + "epoch": 0.79, + "learning_rate": 5.781118485676834e-07, + "loss": 1.0816, + "step": 26083 + }, + { + "epoch": 0.79, + "learning_rate": 5.779558603370666e-07, + "loss": 1.002, + "step": 26084 + }, + { + "epoch": 0.79, + "learning_rate": 5.777998904033841e-07, + "loss": 1.1001, + "step": 26085 + }, + { + "epoch": 0.79, + "learning_rate": 5.776439387681209e-07, + "loss": 1.1874, + "step": 26086 + }, + { + "epoch": 0.79, + "learning_rate": 5.774880054327622e-07, + "loss": 1.0787, + "step": 26087 + }, + { + "epoch": 0.79, + "learning_rate": 5.773320903987912e-07, + "loss": 1.1006, + "step": 26088 + }, + { + "epoch": 0.79, + "learning_rate": 5.771761936676929e-07, + "loss": 1.0863, + "step": 26089 + }, + { + "epoch": 0.79, + "learning_rate": 5.770203152409506e-07, + "loss": 1.0795, + "step": 26090 + }, + { + "epoch": 0.79, + "learning_rate": 5.768644551200492e-07, + "loss": 1.0014, + "step": 26091 + }, + { + "epoch": 0.79, + "learning_rate": 5.76708613306472e-07, + "loss": 1.1823, + "step": 26092 + }, + { + "epoch": 0.79, + "learning_rate": 5.765527898017024e-07, + "loss": 1.133, + "step": 26093 + }, + { + "epoch": 0.79, + "learning_rate": 5.763969846072237e-07, + "loss": 1.2018, + "step": 26094 + }, + { + "epoch": 0.79, + "learning_rate": 5.762411977245203e-07, + "loss": 1.0336, + "step": 26095 + }, + { + "epoch": 0.79, + "learning_rate": 5.760854291550733e-07, + "loss": 1.111, + "step": 26096 + }, + { + "epoch": 0.79, + "learning_rate": 5.759296789003665e-07, + "loss": 1.0111, + "step": 26097 + }, + { + "epoch": 0.79, + "learning_rate": 5.757739469618826e-07, + "loss": 1.1553, + "step": 26098 + }, + { + "epoch": 0.79, + "learning_rate": 5.756182333411037e-07, + "loss": 1.0569, + "step": 26099 + }, + { + "epoch": 0.79, + "learning_rate": 5.754625380395132e-07, + "loss": 1.1352, + "step": 26100 + }, + { + "epoch": 0.79, + "learning_rate": 5.753068610585918e-07, + "loss": 1.074, + "step": 26101 + }, + { + "epoch": 0.79, + "learning_rate": 5.751512023998221e-07, + "loss": 1.0257, + "step": 26102 + }, + { + "epoch": 0.79, + "learning_rate": 5.749955620646858e-07, + "loss": 1.0584, + "step": 26103 + }, + { + "epoch": 0.79, + "learning_rate": 5.748399400546656e-07, + "loss": 1.053, + "step": 26104 + }, + { + "epoch": 0.79, + "learning_rate": 5.746843363712412e-07, + "loss": 1.0655, + "step": 26105 + }, + { + "epoch": 0.79, + "learning_rate": 5.745287510158945e-07, + "loss": 1.0593, + "step": 26106 + }, + { + "epoch": 0.79, + "learning_rate": 5.743731839901067e-07, + "loss": 1.0192, + "step": 26107 + }, + { + "epoch": 0.79, + "learning_rate": 5.742176352953596e-07, + "loss": 1.0673, + "step": 26108 + }, + { + "epoch": 0.79, + "learning_rate": 5.740621049331327e-07, + "loss": 1.0421, + "step": 26109 + }, + { + "epoch": 0.79, + "learning_rate": 5.739065929049065e-07, + "loss": 1.1478, + "step": 26110 + }, + { + "epoch": 0.79, + "learning_rate": 5.737510992121622e-07, + "loss": 1.1243, + "step": 26111 + }, + { + "epoch": 0.79, + "learning_rate": 5.735956238563803e-07, + "loss": 1.1654, + "step": 26112 + }, + { + "epoch": 0.79, + "learning_rate": 5.734401668390396e-07, + "loss": 1.1058, + "step": 26113 + }, + { + "epoch": 0.79, + "learning_rate": 5.732847281616208e-07, + "loss": 1.0646, + "step": 26114 + }, + { + "epoch": 0.79, + "learning_rate": 5.731293078256034e-07, + "loss": 1.0027, + "step": 26115 + }, + { + "epoch": 0.79, + "learning_rate": 5.729739058324668e-07, + "loss": 1.1167, + "step": 26116 + }, + { + "epoch": 0.79, + "learning_rate": 5.728185221836907e-07, + "loss": 0.9915, + "step": 26117 + }, + { + "epoch": 0.79, + "learning_rate": 5.726631568807539e-07, + "loss": 1.0138, + "step": 26118 + }, + { + "epoch": 0.79, + "learning_rate": 5.725078099251358e-07, + "loss": 1.0403, + "step": 26119 + }, + { + "epoch": 0.79, + "learning_rate": 5.723524813183151e-07, + "loss": 1.0764, + "step": 26120 + }, + { + "epoch": 0.79, + "learning_rate": 5.721971710617707e-07, + "loss": 1.1043, + "step": 26121 + }, + { + "epoch": 0.79, + "learning_rate": 5.720418791569804e-07, + "loss": 1.1238, + "step": 26122 + }, + { + "epoch": 0.79, + "learning_rate": 5.718866056054228e-07, + "loss": 1.105, + "step": 26123 + }, + { + "epoch": 0.79, + "learning_rate": 5.717313504085762e-07, + "loss": 1.0122, + "step": 26124 + }, + { + "epoch": 0.79, + "learning_rate": 5.71576113567919e-07, + "loss": 1.171, + "step": 26125 + }, + { + "epoch": 0.79, + "learning_rate": 5.714208950849279e-07, + "loss": 1.0531, + "step": 26126 + }, + { + "epoch": 0.79, + "learning_rate": 5.71265694961081e-07, + "loss": 1.0151, + "step": 26127 + }, + { + "epoch": 0.79, + "learning_rate": 5.711105131978558e-07, + "loss": 1.014, + "step": 26128 + }, + { + "epoch": 0.79, + "learning_rate": 5.709553497967293e-07, + "loss": 1.2077, + "step": 26129 + }, + { + "epoch": 0.79, + "learning_rate": 5.708002047591799e-07, + "loss": 1.1494, + "step": 26130 + }, + { + "epoch": 0.79, + "learning_rate": 5.706450780866823e-07, + "loss": 1.025, + "step": 26131 + }, + { + "epoch": 0.79, + "learning_rate": 5.704899697807145e-07, + "loss": 1.1014, + "step": 26132 + }, + { + "epoch": 0.79, + "learning_rate": 5.70334879842753e-07, + "loss": 1.0208, + "step": 26133 + }, + { + "epoch": 0.79, + "learning_rate": 5.701798082742749e-07, + "loss": 1.1906, + "step": 26134 + }, + { + "epoch": 0.79, + "learning_rate": 5.700247550767546e-07, + "loss": 1.0904, + "step": 26135 + }, + { + "epoch": 0.79, + "learning_rate": 5.698697202516693e-07, + "loss": 1.2463, + "step": 26136 + }, + { + "epoch": 0.79, + "learning_rate": 5.697147038004946e-07, + "loss": 1.1423, + "step": 26137 + }, + { + "epoch": 0.79, + "learning_rate": 5.695597057247071e-07, + "loss": 1.024, + "step": 26138 + }, + { + "epoch": 0.79, + "learning_rate": 5.694047260257807e-07, + "loss": 1.0969, + "step": 26139 + }, + { + "epoch": 0.79, + "learning_rate": 5.692497647051911e-07, + "loss": 1.1025, + "step": 26140 + }, + { + "epoch": 0.79, + "learning_rate": 5.690948217644143e-07, + "loss": 1.0963, + "step": 26141 + }, + { + "epoch": 0.79, + "learning_rate": 5.689398972049249e-07, + "loss": 1.0792, + "step": 26142 + }, + { + "epoch": 0.79, + "learning_rate": 5.687849910281976e-07, + "loss": 1.044, + "step": 26143 + }, + { + "epoch": 0.79, + "learning_rate": 5.686301032357075e-07, + "loss": 1.3112, + "step": 26144 + }, + { + "epoch": 0.79, + "learning_rate": 5.684752338289281e-07, + "loss": 1.1542, + "step": 26145 + }, + { + "epoch": 0.79, + "learning_rate": 5.683203828093342e-07, + "loss": 1.1219, + "step": 26146 + }, + { + "epoch": 0.79, + "learning_rate": 5.681655501784001e-07, + "loss": 1.1471, + "step": 26147 + }, + { + "epoch": 0.79, + "learning_rate": 5.680107359375994e-07, + "loss": 1.0621, + "step": 26148 + }, + { + "epoch": 0.79, + "learning_rate": 5.678559400884059e-07, + "loss": 0.9938, + "step": 26149 + }, + { + "epoch": 0.79, + "learning_rate": 5.677011626322936e-07, + "loss": 1.0375, + "step": 26150 + }, + { + "epoch": 0.79, + "learning_rate": 5.675464035707363e-07, + "loss": 1.1237, + "step": 26151 + }, + { + "epoch": 0.79, + "learning_rate": 5.673916629052057e-07, + "loss": 1.1416, + "step": 26152 + }, + { + "epoch": 0.79, + "learning_rate": 5.672369406371756e-07, + "loss": 1.0695, + "step": 26153 + }, + { + "epoch": 0.79, + "learning_rate": 5.670822367681189e-07, + "loss": 1.0014, + "step": 26154 + }, + { + "epoch": 0.79, + "learning_rate": 5.669275512995088e-07, + "loss": 1.1298, + "step": 26155 + }, + { + "epoch": 0.79, + "learning_rate": 5.667728842328177e-07, + "loss": 1.0237, + "step": 26156 + }, + { + "epoch": 0.79, + "learning_rate": 5.666182355695171e-07, + "loss": 1.1639, + "step": 26157 + }, + { + "epoch": 0.79, + "learning_rate": 5.664636053110797e-07, + "loss": 1.137, + "step": 26158 + }, + { + "epoch": 0.79, + "learning_rate": 5.663089934589777e-07, + "loss": 1.1815, + "step": 26159 + }, + { + "epoch": 0.79, + "learning_rate": 5.661544000146835e-07, + "loss": 1.0688, + "step": 26160 + }, + { + "epoch": 0.79, + "learning_rate": 5.659998249796673e-07, + "loss": 1.1661, + "step": 26161 + }, + { + "epoch": 0.79, + "learning_rate": 5.658452683554011e-07, + "loss": 1.1038, + "step": 26162 + }, + { + "epoch": 0.79, + "learning_rate": 5.656907301433565e-07, + "loss": 1.1378, + "step": 26163 + }, + { + "epoch": 0.79, + "learning_rate": 5.655362103450054e-07, + "loss": 1.1508, + "step": 26164 + }, + { + "epoch": 0.79, + "learning_rate": 5.653817089618172e-07, + "loss": 1.0761, + "step": 26165 + }, + { + "epoch": 0.79, + "learning_rate": 5.652272259952632e-07, + "loss": 1.0959, + "step": 26166 + }, + { + "epoch": 0.79, + "learning_rate": 5.650727614468143e-07, + "loss": 1.1495, + "step": 26167 + }, + { + "epoch": 0.79, + "learning_rate": 5.649183153179407e-07, + "loss": 1.1235, + "step": 26168 + }, + { + "epoch": 0.79, + "learning_rate": 5.647638876101139e-07, + "loss": 1.15, + "step": 26169 + }, + { + "epoch": 0.79, + "learning_rate": 5.646094783248018e-07, + "loss": 1.0381, + "step": 26170 + }, + { + "epoch": 0.79, + "learning_rate": 5.644550874634754e-07, + "loss": 1.1296, + "step": 26171 + }, + { + "epoch": 0.79, + "learning_rate": 5.643007150276045e-07, + "loss": 1.1469, + "step": 26172 + }, + { + "epoch": 0.79, + "learning_rate": 5.641463610186582e-07, + "loss": 0.9845, + "step": 26173 + }, + { + "epoch": 0.79, + "learning_rate": 5.639920254381065e-07, + "loss": 1.1151, + "step": 26174 + }, + { + "epoch": 0.79, + "learning_rate": 5.638377082874183e-07, + "loss": 1.1166, + "step": 26175 + }, + { + "epoch": 0.79, + "learning_rate": 5.636834095680624e-07, + "loss": 1.0969, + "step": 26176 + }, + { + "epoch": 0.79, + "learning_rate": 5.635291292815087e-07, + "loss": 1.0985, + "step": 26177 + }, + { + "epoch": 0.79, + "learning_rate": 5.633748674292244e-07, + "loss": 1.1077, + "step": 26178 + }, + { + "epoch": 0.79, + "learning_rate": 5.632206240126786e-07, + "loss": 1.0905, + "step": 26179 + }, + { + "epoch": 0.79, + "learning_rate": 5.630663990333399e-07, + "loss": 1.1127, + "step": 26180 + }, + { + "epoch": 0.79, + "learning_rate": 5.629121924926759e-07, + "loss": 1.1503, + "step": 26181 + }, + { + "epoch": 0.79, + "learning_rate": 5.627580043921558e-07, + "loss": 1.0959, + "step": 26182 + }, + { + "epoch": 0.79, + "learning_rate": 5.626038347332458e-07, + "loss": 1.2095, + "step": 26183 + }, + { + "epoch": 0.79, + "learning_rate": 5.62449683517414e-07, + "loss": 0.9807, + "step": 26184 + }, + { + "epoch": 0.79, + "learning_rate": 5.622955507461283e-07, + "loss": 0.9792, + "step": 26185 + }, + { + "epoch": 0.79, + "learning_rate": 5.621414364208563e-07, + "loss": 1.1089, + "step": 26186 + }, + { + "epoch": 0.79, + "learning_rate": 5.619873405430637e-07, + "loss": 1.1275, + "step": 26187 + }, + { + "epoch": 0.79, + "learning_rate": 5.618332631142184e-07, + "loss": 1.1021, + "step": 26188 + }, + { + "epoch": 0.79, + "learning_rate": 5.616792041357869e-07, + "loss": 1.0349, + "step": 26189 + }, + { + "epoch": 0.79, + "learning_rate": 5.615251636092367e-07, + "loss": 1.1022, + "step": 26190 + }, + { + "epoch": 0.79, + "learning_rate": 5.613711415360326e-07, + "loss": 1.1184, + "step": 26191 + }, + { + "epoch": 0.79, + "learning_rate": 5.612171379176414e-07, + "loss": 1.1976, + "step": 26192 + }, + { + "epoch": 0.79, + "learning_rate": 5.610631527555293e-07, + "loss": 1.2638, + "step": 26193 + }, + { + "epoch": 0.79, + "learning_rate": 5.609091860511622e-07, + "loss": 1.0115, + "step": 26194 + }, + { + "epoch": 0.79, + "learning_rate": 5.607552378060066e-07, + "loss": 1.1169, + "step": 26195 + }, + { + "epoch": 0.79, + "learning_rate": 5.606013080215265e-07, + "loss": 1.1156, + "step": 26196 + }, + { + "epoch": 0.79, + "learning_rate": 5.604473966991877e-07, + "loss": 1.1285, + "step": 26197 + }, + { + "epoch": 0.79, + "learning_rate": 5.602935038404555e-07, + "loss": 1.223, + "step": 26198 + }, + { + "epoch": 0.79, + "learning_rate": 5.601396294467954e-07, + "loss": 1.0921, + "step": 26199 + }, + { + "epoch": 0.79, + "learning_rate": 5.599857735196712e-07, + "loss": 1.167, + "step": 26200 + }, + { + "epoch": 0.79, + "learning_rate": 5.598319360605484e-07, + "loss": 1.213, + "step": 26201 + }, + { + "epoch": 0.79, + "learning_rate": 5.596781170708912e-07, + "loss": 1.0827, + "step": 26202 + }, + { + "epoch": 0.79, + "learning_rate": 5.595243165521644e-07, + "loss": 1.145, + "step": 26203 + }, + { + "epoch": 0.79, + "learning_rate": 5.593705345058309e-07, + "loss": 1.1005, + "step": 26204 + }, + { + "epoch": 0.79, + "learning_rate": 5.592167709333552e-07, + "loss": 1.1519, + "step": 26205 + }, + { + "epoch": 0.79, + "learning_rate": 5.590630258362012e-07, + "loss": 1.0248, + "step": 26206 + }, + { + "epoch": 0.79, + "learning_rate": 5.589092992158324e-07, + "loss": 0.9836, + "step": 26207 + }, + { + "epoch": 0.79, + "learning_rate": 5.587555910737127e-07, + "loss": 1.1057, + "step": 26208 + }, + { + "epoch": 0.79, + "learning_rate": 5.586019014113045e-07, + "loss": 1.1337, + "step": 26209 + }, + { + "epoch": 0.79, + "learning_rate": 5.584482302300708e-07, + "loss": 1.1186, + "step": 26210 + }, + { + "epoch": 0.79, + "learning_rate": 5.582945775314752e-07, + "loss": 1.1272, + "step": 26211 + }, + { + "epoch": 0.79, + "learning_rate": 5.581409433169807e-07, + "loss": 1.0214, + "step": 26212 + }, + { + "epoch": 0.79, + "learning_rate": 5.579873275880485e-07, + "loss": 1.1578, + "step": 26213 + }, + { + "epoch": 0.79, + "learning_rate": 5.578337303461414e-07, + "loss": 1.1247, + "step": 26214 + }, + { + "epoch": 0.79, + "learning_rate": 5.576801515927219e-07, + "loss": 1.0699, + "step": 26215 + }, + { + "epoch": 0.79, + "learning_rate": 5.575265913292527e-07, + "loss": 1.0325, + "step": 26216 + }, + { + "epoch": 0.79, + "learning_rate": 5.573730495571942e-07, + "loss": 1.1527, + "step": 26217 + }, + { + "epoch": 0.79, + "learning_rate": 5.572195262780086e-07, + "loss": 1.311, + "step": 26218 + }, + { + "epoch": 0.79, + "learning_rate": 5.570660214931572e-07, + "loss": 1.1538, + "step": 26219 + }, + { + "epoch": 0.79, + "learning_rate": 5.569125352041019e-07, + "loss": 1.0728, + "step": 26220 + }, + { + "epoch": 0.79, + "learning_rate": 5.567590674123038e-07, + "loss": 1.1224, + "step": 26221 + }, + { + "epoch": 0.79, + "learning_rate": 5.566056181192231e-07, + "loss": 1.0236, + "step": 26222 + }, + { + "epoch": 0.79, + "learning_rate": 5.564521873263207e-07, + "loss": 1.1493, + "step": 26223 + }, + { + "epoch": 0.79, + "learning_rate": 5.562987750350576e-07, + "loss": 1.1501, + "step": 26224 + }, + { + "epoch": 0.79, + "learning_rate": 5.561453812468939e-07, + "loss": 1.076, + "step": 26225 + }, + { + "epoch": 0.79, + "learning_rate": 5.559920059632901e-07, + "loss": 1.0897, + "step": 26226 + }, + { + "epoch": 0.79, + "learning_rate": 5.558386491857068e-07, + "loss": 1.0118, + "step": 26227 + }, + { + "epoch": 0.79, + "learning_rate": 5.556853109156024e-07, + "loss": 1.1233, + "step": 26228 + }, + { + "epoch": 0.79, + "learning_rate": 5.555319911544376e-07, + "loss": 1.073, + "step": 26229 + }, + { + "epoch": 0.79, + "learning_rate": 5.553786899036717e-07, + "loss": 1.2617, + "step": 26230 + }, + { + "epoch": 0.79, + "learning_rate": 5.552254071647642e-07, + "loss": 1.2408, + "step": 26231 + }, + { + "epoch": 0.79, + "learning_rate": 5.55072142939174e-07, + "loss": 1.0374, + "step": 26232 + }, + { + "epoch": 0.79, + "learning_rate": 5.549188972283603e-07, + "loss": 1.0569, + "step": 26233 + }, + { + "epoch": 0.79, + "learning_rate": 5.547656700337828e-07, + "loss": 0.9506, + "step": 26234 + }, + { + "epoch": 0.79, + "learning_rate": 5.546124613568984e-07, + "loss": 1.0562, + "step": 26235 + }, + { + "epoch": 0.79, + "learning_rate": 5.544592711991665e-07, + "loss": 1.0486, + "step": 26236 + }, + { + "epoch": 0.79, + "learning_rate": 5.543060995620452e-07, + "loss": 1.0347, + "step": 26237 + }, + { + "epoch": 0.79, + "learning_rate": 5.541529464469936e-07, + "loss": 1.1159, + "step": 26238 + }, + { + "epoch": 0.79, + "learning_rate": 5.539998118554682e-07, + "loss": 1.0347, + "step": 26239 + }, + { + "epoch": 0.79, + "learning_rate": 5.538466957889271e-07, + "loss": 1.057, + "step": 26240 + }, + { + "epoch": 0.79, + "learning_rate": 5.536935982488284e-07, + "loss": 0.9886, + "step": 26241 + }, + { + "epoch": 0.79, + "learning_rate": 5.535405192366298e-07, + "loss": 1.119, + "step": 26242 + }, + { + "epoch": 0.79, + "learning_rate": 5.533874587537874e-07, + "loss": 1.0532, + "step": 26243 + }, + { + "epoch": 0.79, + "learning_rate": 5.532344168017589e-07, + "loss": 1.2326, + "step": 26244 + }, + { + "epoch": 0.79, + "learning_rate": 5.530813933820012e-07, + "loss": 1.0974, + "step": 26245 + }, + { + "epoch": 0.79, + "learning_rate": 5.529283884959707e-07, + "loss": 1.099, + "step": 26246 + }, + { + "epoch": 0.79, + "learning_rate": 5.527754021451251e-07, + "loss": 1.1041, + "step": 26247 + }, + { + "epoch": 0.79, + "learning_rate": 5.526224343309191e-07, + "loss": 1.1095, + "step": 26248 + }, + { + "epoch": 0.79, + "learning_rate": 5.524694850548096e-07, + "loss": 1.0181, + "step": 26249 + }, + { + "epoch": 0.79, + "learning_rate": 5.523165543182529e-07, + "loss": 1.1248, + "step": 26250 + }, + { + "epoch": 0.79, + "learning_rate": 5.52163642122705e-07, + "loss": 1.1158, + "step": 26251 + }, + { + "epoch": 0.79, + "learning_rate": 5.520107484696205e-07, + "loss": 1.1063, + "step": 26252 + }, + { + "epoch": 0.79, + "learning_rate": 5.518578733604554e-07, + "loss": 1.1225, + "step": 26253 + }, + { + "epoch": 0.79, + "learning_rate": 5.517050167966653e-07, + "loss": 0.9852, + "step": 26254 + }, + { + "epoch": 0.79, + "learning_rate": 5.515521787797048e-07, + "loss": 1.1434, + "step": 26255 + }, + { + "epoch": 0.79, + "learning_rate": 5.513993593110295e-07, + "loss": 1.0984, + "step": 26256 + }, + { + "epoch": 0.79, + "learning_rate": 5.512465583920937e-07, + "loss": 1.0445, + "step": 26257 + }, + { + "epoch": 0.79, + "learning_rate": 5.510937760243521e-07, + "loss": 1.0941, + "step": 26258 + }, + { + "epoch": 0.79, + "learning_rate": 5.50941012209259e-07, + "loss": 1.1241, + "step": 26259 + }, + { + "epoch": 0.79, + "learning_rate": 5.507882669482695e-07, + "loss": 1.0413, + "step": 26260 + }, + { + "epoch": 0.79, + "learning_rate": 5.506355402428362e-07, + "loss": 1.0664, + "step": 26261 + }, + { + "epoch": 0.79, + "learning_rate": 5.504828320944139e-07, + "loss": 1.067, + "step": 26262 + }, + { + "epoch": 0.79, + "learning_rate": 5.50330142504456e-07, + "loss": 1.0811, + "step": 26263 + }, + { + "epoch": 0.79, + "learning_rate": 5.501774714744168e-07, + "loss": 1.1682, + "step": 26264 + }, + { + "epoch": 0.79, + "learning_rate": 5.500248190057483e-07, + "loss": 1.0726, + "step": 26265 + }, + { + "epoch": 0.79, + "learning_rate": 5.498721850999045e-07, + "loss": 1.0935, + "step": 26266 + }, + { + "epoch": 0.79, + "learning_rate": 5.497195697583383e-07, + "loss": 1.1347, + "step": 26267 + }, + { + "epoch": 0.79, + "learning_rate": 5.495669729825032e-07, + "loss": 1.1324, + "step": 26268 + }, + { + "epoch": 0.79, + "learning_rate": 5.494143947738504e-07, + "loss": 1.0867, + "step": 26269 + }, + { + "epoch": 0.79, + "learning_rate": 5.49261835133833e-07, + "loss": 1.1094, + "step": 26270 + }, + { + "epoch": 0.79, + "learning_rate": 5.491092940639037e-07, + "loss": 1.0449, + "step": 26271 + }, + { + "epoch": 0.79, + "learning_rate": 5.489567715655142e-07, + "loss": 1.0198, + "step": 26272 + }, + { + "epoch": 0.79, + "learning_rate": 5.48804267640117e-07, + "loss": 1.1438, + "step": 26273 + }, + { + "epoch": 0.79, + "learning_rate": 5.486517822891632e-07, + "loss": 1.1507, + "step": 26274 + }, + { + "epoch": 0.79, + "learning_rate": 5.484993155141044e-07, + "loss": 0.9999, + "step": 26275 + }, + { + "epoch": 0.79, + "learning_rate": 5.483468673163922e-07, + "loss": 1.076, + "step": 26276 + }, + { + "epoch": 0.79, + "learning_rate": 5.481944376974787e-07, + "loss": 1.2587, + "step": 26277 + }, + { + "epoch": 0.79, + "learning_rate": 5.480420266588135e-07, + "loss": 1.0526, + "step": 26278 + }, + { + "epoch": 0.79, + "learning_rate": 5.478896342018478e-07, + "loss": 1.1592, + "step": 26279 + }, + { + "epoch": 0.79, + "learning_rate": 5.477372603280329e-07, + "loss": 1.1308, + "step": 26280 + }, + { + "epoch": 0.79, + "learning_rate": 5.47584905038819e-07, + "loss": 1.0997, + "step": 26281 + }, + { + "epoch": 0.79, + "learning_rate": 5.474325683356563e-07, + "loss": 1.0466, + "step": 26282 + }, + { + "epoch": 0.79, + "learning_rate": 5.472802502199953e-07, + "loss": 1.1276, + "step": 26283 + }, + { + "epoch": 0.79, + "learning_rate": 5.471279506932859e-07, + "loss": 1.0934, + "step": 26284 + }, + { + "epoch": 0.79, + "learning_rate": 5.469756697569778e-07, + "loss": 1.0628, + "step": 26285 + }, + { + "epoch": 0.79, + "learning_rate": 5.468234074125214e-07, + "loss": 1.0786, + "step": 26286 + }, + { + "epoch": 0.79, + "learning_rate": 5.46671163661365e-07, + "loss": 1.1591, + "step": 26287 + }, + { + "epoch": 0.79, + "learning_rate": 5.465189385049582e-07, + "loss": 1.059, + "step": 26288 + }, + { + "epoch": 0.79, + "learning_rate": 5.463667319447503e-07, + "loss": 1.0919, + "step": 26289 + }, + { + "epoch": 0.79, + "learning_rate": 5.462145439821909e-07, + "loss": 1.1288, + "step": 26290 + }, + { + "epoch": 0.79, + "learning_rate": 5.460623746187271e-07, + "loss": 1.0714, + "step": 26291 + }, + { + "epoch": 0.79, + "learning_rate": 5.459102238558089e-07, + "loss": 1.0832, + "step": 26292 + }, + { + "epoch": 0.79, + "learning_rate": 5.457580916948841e-07, + "loss": 1.2238, + "step": 26293 + }, + { + "epoch": 0.79, + "learning_rate": 5.456059781374016e-07, + "loss": 1.1151, + "step": 26294 + }, + { + "epoch": 0.79, + "learning_rate": 5.454538831848083e-07, + "loss": 1.1715, + "step": 26295 + }, + { + "epoch": 0.79, + "learning_rate": 5.453018068385526e-07, + "loss": 1.1923, + "step": 26296 + }, + { + "epoch": 0.79, + "learning_rate": 5.451497491000826e-07, + "loss": 1.0456, + "step": 26297 + }, + { + "epoch": 0.79, + "learning_rate": 5.449977099708459e-07, + "loss": 1.183, + "step": 26298 + }, + { + "epoch": 0.79, + "learning_rate": 5.448456894522888e-07, + "loss": 0.9645, + "step": 26299 + }, + { + "epoch": 0.79, + "learning_rate": 5.446936875458592e-07, + "loss": 1.0872, + "step": 26300 + }, + { + "epoch": 0.79, + "learning_rate": 5.445417042530041e-07, + "loss": 1.123, + "step": 26301 + }, + { + "epoch": 0.79, + "learning_rate": 5.443897395751699e-07, + "loss": 1.1412, + "step": 26302 + }, + { + "epoch": 0.79, + "learning_rate": 5.442377935138044e-07, + "loss": 1.063, + "step": 26303 + }, + { + "epoch": 0.79, + "learning_rate": 5.440858660703524e-07, + "loss": 1.0454, + "step": 26304 + }, + { + "epoch": 0.79, + "learning_rate": 5.43933957246261e-07, + "loss": 1.0517, + "step": 26305 + }, + { + "epoch": 0.79, + "learning_rate": 5.437820670429761e-07, + "loss": 1.2324, + "step": 26306 + }, + { + "epoch": 0.79, + "learning_rate": 5.436301954619438e-07, + "loss": 1.1418, + "step": 26307 + }, + { + "epoch": 0.79, + "learning_rate": 5.4347834250461e-07, + "loss": 1.0497, + "step": 26308 + }, + { + "epoch": 0.79, + "learning_rate": 5.433265081724209e-07, + "loss": 1.0864, + "step": 26309 + }, + { + "epoch": 0.79, + "learning_rate": 5.431746924668202e-07, + "loss": 1.1268, + "step": 26310 + }, + { + "epoch": 0.79, + "learning_rate": 5.430228953892539e-07, + "loss": 1.1505, + "step": 26311 + }, + { + "epoch": 0.79, + "learning_rate": 5.428711169411671e-07, + "loss": 1.0836, + "step": 26312 + }, + { + "epoch": 0.79, + "learning_rate": 5.42719357124005e-07, + "loss": 1.1451, + "step": 26313 + }, + { + "epoch": 0.79, + "learning_rate": 5.425676159392116e-07, + "loss": 1.158, + "step": 26314 + }, + { + "epoch": 0.79, + "learning_rate": 5.42415893388232e-07, + "loss": 1.0579, + "step": 26315 + }, + { + "epoch": 0.79, + "learning_rate": 5.422641894725109e-07, + "loss": 1.1528, + "step": 26316 + }, + { + "epoch": 0.79, + "learning_rate": 5.42112504193491e-07, + "loss": 1.1533, + "step": 26317 + }, + { + "epoch": 0.79, + "learning_rate": 5.419608375526172e-07, + "loss": 1.1246, + "step": 26318 + }, + { + "epoch": 0.79, + "learning_rate": 5.418091895513334e-07, + "loss": 1.1003, + "step": 26319 + }, + { + "epoch": 0.79, + "learning_rate": 5.416575601910837e-07, + "loss": 1.1191, + "step": 26320 + }, + { + "epoch": 0.79, + "learning_rate": 5.415059494733099e-07, + "loss": 1.0104, + "step": 26321 + }, + { + "epoch": 0.79, + "learning_rate": 5.413543573994564e-07, + "loss": 1.132, + "step": 26322 + }, + { + "epoch": 0.79, + "learning_rate": 5.412027839709661e-07, + "loss": 1.0577, + "step": 26323 + }, + { + "epoch": 0.79, + "learning_rate": 5.410512291892825e-07, + "loss": 1.0344, + "step": 26324 + }, + { + "epoch": 0.79, + "learning_rate": 5.408996930558469e-07, + "loss": 1.1421, + "step": 26325 + }, + { + "epoch": 0.79, + "learning_rate": 5.407481755721031e-07, + "loss": 1.0636, + "step": 26326 + }, + { + "epoch": 0.79, + "learning_rate": 5.405966767394927e-07, + "loss": 1.142, + "step": 26327 + }, + { + "epoch": 0.79, + "learning_rate": 5.404451965594585e-07, + "loss": 1.058, + "step": 26328 + }, + { + "epoch": 0.79, + "learning_rate": 5.402937350334427e-07, + "loss": 1.0614, + "step": 26329 + }, + { + "epoch": 0.79, + "learning_rate": 5.401422921628863e-07, + "loss": 1.128, + "step": 26330 + }, + { + "epoch": 0.79, + "learning_rate": 5.399908679492313e-07, + "loss": 1.1846, + "step": 26331 + }, + { + "epoch": 0.79, + "learning_rate": 5.39839462393919e-07, + "loss": 1.1201, + "step": 26332 + }, + { + "epoch": 0.79, + "learning_rate": 5.396880754983921e-07, + "loss": 1.0847, + "step": 26333 + }, + { + "epoch": 0.79, + "learning_rate": 5.395367072640898e-07, + "loss": 1.1094, + "step": 26334 + }, + { + "epoch": 0.79, + "learning_rate": 5.393853576924535e-07, + "loss": 1.1905, + "step": 26335 + }, + { + "epoch": 0.79, + "learning_rate": 5.392340267849247e-07, + "loss": 1.1326, + "step": 26336 + }, + { + "epoch": 0.79, + "learning_rate": 5.390827145429436e-07, + "loss": 1.0775, + "step": 26337 + }, + { + "epoch": 0.79, + "learning_rate": 5.389314209679505e-07, + "loss": 1.2273, + "step": 26338 + }, + { + "epoch": 0.79, + "learning_rate": 5.387801460613859e-07, + "loss": 1.0679, + "step": 26339 + }, + { + "epoch": 0.79, + "learning_rate": 5.386288898246897e-07, + "loss": 1.1761, + "step": 26340 + }, + { + "epoch": 0.79, + "learning_rate": 5.384776522593019e-07, + "loss": 1.019, + "step": 26341 + }, + { + "epoch": 0.79, + "learning_rate": 5.383264333666627e-07, + "loss": 1.1043, + "step": 26342 + }, + { + "epoch": 0.79, + "learning_rate": 5.381752331482104e-07, + "loss": 1.0598, + "step": 26343 + }, + { + "epoch": 0.79, + "learning_rate": 5.380240516053853e-07, + "loss": 1.0053, + "step": 26344 + }, + { + "epoch": 0.79, + "learning_rate": 5.378728887396259e-07, + "loss": 1.1342, + "step": 26345 + }, + { + "epoch": 0.79, + "learning_rate": 5.377217445523725e-07, + "loss": 1.0276, + "step": 26346 + }, + { + "epoch": 0.79, + "learning_rate": 5.375706190450625e-07, + "loss": 1.1155, + "step": 26347 + }, + { + "epoch": 0.79, + "learning_rate": 5.374195122191347e-07, + "loss": 1.0553, + "step": 26348 + }, + { + "epoch": 0.79, + "learning_rate": 5.372684240760285e-07, + "loss": 1.2493, + "step": 26349 + }, + { + "epoch": 0.79, + "learning_rate": 5.371173546171817e-07, + "loss": 1.1731, + "step": 26350 + }, + { + "epoch": 0.79, + "learning_rate": 5.369663038440321e-07, + "loss": 1.0629, + "step": 26351 + }, + { + "epoch": 0.79, + "learning_rate": 5.368152717580174e-07, + "loss": 1.2584, + "step": 26352 + }, + { + "epoch": 0.79, + "learning_rate": 5.366642583605763e-07, + "loss": 1.0189, + "step": 26353 + }, + { + "epoch": 0.79, + "learning_rate": 5.365132636531456e-07, + "loss": 1.2773, + "step": 26354 + }, + { + "epoch": 0.79, + "learning_rate": 5.363622876371638e-07, + "loss": 1.075, + "step": 26355 + }, + { + "epoch": 0.79, + "learning_rate": 5.362113303140664e-07, + "loss": 0.9967, + "step": 26356 + }, + { + "epoch": 0.79, + "learning_rate": 5.360603916852916e-07, + "loss": 1.0202, + "step": 26357 + }, + { + "epoch": 0.79, + "learning_rate": 5.359094717522759e-07, + "loss": 1.0887, + "step": 26358 + }, + { + "epoch": 0.79, + "learning_rate": 5.357585705164567e-07, + "loss": 1.0095, + "step": 26359 + }, + { + "epoch": 0.79, + "learning_rate": 5.356076879792693e-07, + "loss": 1.1438, + "step": 26360 + }, + { + "epoch": 0.79, + "learning_rate": 5.354568241421504e-07, + "loss": 1.144, + "step": 26361 + }, + { + "epoch": 0.79, + "learning_rate": 5.353059790065368e-07, + "loss": 1.0241, + "step": 26362 + }, + { + "epoch": 0.79, + "learning_rate": 5.351551525738638e-07, + "loss": 1.053, + "step": 26363 + }, + { + "epoch": 0.79, + "learning_rate": 5.350043448455674e-07, + "loss": 1.1162, + "step": 26364 + }, + { + "epoch": 0.79, + "learning_rate": 5.348535558230833e-07, + "loss": 1.1075, + "step": 26365 + }, + { + "epoch": 0.79, + "learning_rate": 5.347027855078471e-07, + "loss": 1.1873, + "step": 26366 + }, + { + "epoch": 0.79, + "learning_rate": 5.345520339012936e-07, + "loss": 1.1246, + "step": 26367 + }, + { + "epoch": 0.79, + "learning_rate": 5.344013010048588e-07, + "loss": 1.1957, + "step": 26368 + }, + { + "epoch": 0.79, + "learning_rate": 5.342505868199765e-07, + "loss": 1.2139, + "step": 26369 + }, + { + "epoch": 0.79, + "learning_rate": 5.340998913480819e-07, + "loss": 1.095, + "step": 26370 + }, + { + "epoch": 0.79, + "learning_rate": 5.339492145906092e-07, + "loss": 1.0399, + "step": 26371 + }, + { + "epoch": 0.79, + "learning_rate": 5.33798556548994e-07, + "loss": 1.1459, + "step": 26372 + }, + { + "epoch": 0.79, + "learning_rate": 5.33647917224669e-07, + "loss": 1.2216, + "step": 26373 + }, + { + "epoch": 0.79, + "learning_rate": 5.334972966190685e-07, + "loss": 1.2341, + "step": 26374 + }, + { + "epoch": 0.79, + "learning_rate": 5.333466947336269e-07, + "loss": 1.0153, + "step": 26375 + }, + { + "epoch": 0.79, + "learning_rate": 5.331961115697781e-07, + "loss": 0.9824, + "step": 26376 + }, + { + "epoch": 0.79, + "learning_rate": 5.330455471289545e-07, + "loss": 1.1543, + "step": 26377 + }, + { + "epoch": 0.79, + "learning_rate": 5.328950014125899e-07, + "loss": 1.0616, + "step": 26378 + }, + { + "epoch": 0.79, + "learning_rate": 5.327444744221178e-07, + "loss": 1.1725, + "step": 26379 + }, + { + "epoch": 0.79, + "learning_rate": 5.325939661589704e-07, + "loss": 1.2048, + "step": 26380 + }, + { + "epoch": 0.79, + "learning_rate": 5.324434766245817e-07, + "loss": 1.2656, + "step": 26381 + }, + { + "epoch": 0.79, + "learning_rate": 5.322930058203829e-07, + "loss": 1.073, + "step": 26382 + }, + { + "epoch": 0.79, + "learning_rate": 5.32142553747807e-07, + "loss": 1.0491, + "step": 26383 + }, + { + "epoch": 0.79, + "learning_rate": 5.319921204082865e-07, + "loss": 1.0196, + "step": 26384 + }, + { + "epoch": 0.79, + "learning_rate": 5.318417058032535e-07, + "loss": 1.0792, + "step": 26385 + }, + { + "epoch": 0.79, + "learning_rate": 5.316913099341389e-07, + "loss": 1.1011, + "step": 26386 + }, + { + "epoch": 0.79, + "learning_rate": 5.315409328023752e-07, + "loss": 1.1673, + "step": 26387 + }, + { + "epoch": 0.79, + "learning_rate": 5.313905744093936e-07, + "loss": 1.1415, + "step": 26388 + }, + { + "epoch": 0.79, + "learning_rate": 5.312402347566259e-07, + "loss": 1.1246, + "step": 26389 + }, + { + "epoch": 0.79, + "learning_rate": 5.310899138455028e-07, + "loss": 1.1038, + "step": 26390 + }, + { + "epoch": 0.8, + "learning_rate": 5.309396116774562e-07, + "loss": 1.1155, + "step": 26391 + }, + { + "epoch": 0.8, + "learning_rate": 5.307893282539153e-07, + "loss": 1.2275, + "step": 26392 + }, + { + "epoch": 0.8, + "learning_rate": 5.306390635763118e-07, + "loss": 1.2374, + "step": 26393 + }, + { + "epoch": 0.8, + "learning_rate": 5.30488817646076e-07, + "loss": 1.1155, + "step": 26394 + }, + { + "epoch": 0.8, + "learning_rate": 5.303385904646377e-07, + "loss": 0.9977, + "step": 26395 + }, + { + "epoch": 0.8, + "learning_rate": 5.301883820334278e-07, + "loss": 1.1349, + "step": 26396 + }, + { + "epoch": 0.8, + "learning_rate": 5.300381923538755e-07, + "loss": 1.0352, + "step": 26397 + }, + { + "epoch": 0.8, + "learning_rate": 5.298880214274118e-07, + "loss": 1.0829, + "step": 26398 + }, + { + "epoch": 0.8, + "learning_rate": 5.297378692554647e-07, + "loss": 1.2068, + "step": 26399 + }, + { + "epoch": 0.8, + "learning_rate": 5.295877358394638e-07, + "loss": 1.0445, + "step": 26400 + }, + { + "epoch": 0.8, + "learning_rate": 5.294376211808388e-07, + "loss": 1.0908, + "step": 26401 + }, + { + "epoch": 0.8, + "learning_rate": 5.292875252810195e-07, + "loss": 1.0714, + "step": 26402 + }, + { + "epoch": 0.8, + "learning_rate": 5.29137448141433e-07, + "loss": 0.9523, + "step": 26403 + }, + { + "epoch": 0.8, + "learning_rate": 5.289873897635086e-07, + "loss": 1.1414, + "step": 26404 + }, + { + "epoch": 0.8, + "learning_rate": 5.288373501486754e-07, + "loss": 1.1476, + "step": 26405 + }, + { + "epoch": 0.8, + "learning_rate": 5.28687329298361e-07, + "loss": 1.1286, + "step": 26406 + }, + { + "epoch": 0.8, + "learning_rate": 5.285373272139946e-07, + "loss": 1.1348, + "step": 26407 + }, + { + "epoch": 0.8, + "learning_rate": 5.283873438970024e-07, + "loss": 1.1277, + "step": 26408 + }, + { + "epoch": 0.8, + "learning_rate": 5.282373793488135e-07, + "loss": 1.1381, + "step": 26409 + }, + { + "epoch": 0.8, + "learning_rate": 5.280874335708549e-07, + "loss": 1.101, + "step": 26410 + }, + { + "epoch": 0.8, + "learning_rate": 5.27937506564555e-07, + "loss": 1.2411, + "step": 26411 + }, + { + "epoch": 0.8, + "learning_rate": 5.277875983313397e-07, + "loss": 1.1623, + "step": 26412 + }, + { + "epoch": 0.8, + "learning_rate": 5.276377088726361e-07, + "loss": 1.0715, + "step": 26413 + }, + { + "epoch": 0.8, + "learning_rate": 5.274878381898721e-07, + "loss": 0.9903, + "step": 26414 + }, + { + "epoch": 0.8, + "learning_rate": 5.273379862844744e-07, + "loss": 1.1605, + "step": 26415 + }, + { + "epoch": 0.8, + "learning_rate": 5.271881531578682e-07, + "loss": 0.9769, + "step": 26416 + }, + { + "epoch": 0.8, + "learning_rate": 5.270383388114808e-07, + "loss": 1.1737, + "step": 26417 + }, + { + "epoch": 0.8, + "learning_rate": 5.268885432467383e-07, + "loss": 1.0851, + "step": 26418 + }, + { + "epoch": 0.8, + "learning_rate": 5.267387664650664e-07, + "loss": 1.0342, + "step": 26419 + }, + { + "epoch": 0.8, + "learning_rate": 5.265890084678913e-07, + "loss": 1.1188, + "step": 26420 + }, + { + "epoch": 0.8, + "learning_rate": 5.264392692566381e-07, + "loss": 1.1259, + "step": 26421 + }, + { + "epoch": 0.8, + "learning_rate": 5.262895488327327e-07, + "loss": 1.0898, + "step": 26422 + }, + { + "epoch": 0.8, + "learning_rate": 5.261398471976003e-07, + "loss": 1.1078, + "step": 26423 + }, + { + "epoch": 0.8, + "learning_rate": 5.259901643526666e-07, + "loss": 1.2524, + "step": 26424 + }, + { + "epoch": 0.8, + "learning_rate": 5.25840500299355e-07, + "loss": 1.0533, + "step": 26425 + }, + { + "epoch": 0.8, + "learning_rate": 5.25690855039091e-07, + "loss": 1.1774, + "step": 26426 + }, + { + "epoch": 0.8, + "learning_rate": 5.255412285732995e-07, + "loss": 1.1307, + "step": 26427 + }, + { + "epoch": 0.8, + "learning_rate": 5.253916209034049e-07, + "loss": 1.026, + "step": 26428 + }, + { + "epoch": 0.8, + "learning_rate": 5.252420320308307e-07, + "loss": 1.041, + "step": 26429 + }, + { + "epoch": 0.8, + "learning_rate": 5.25092461957001e-07, + "loss": 1.0313, + "step": 26430 + }, + { + "epoch": 0.8, + "learning_rate": 5.249429106833401e-07, + "loss": 1.0322, + "step": 26431 + }, + { + "epoch": 0.8, + "learning_rate": 5.247933782112716e-07, + "loss": 1.1243, + "step": 26432 + }, + { + "epoch": 0.8, + "learning_rate": 5.246438645422191e-07, + "loss": 1.1309, + "step": 26433 + }, + { + "epoch": 0.8, + "learning_rate": 5.244943696776053e-07, + "loss": 1.0612, + "step": 26434 + }, + { + "epoch": 0.8, + "learning_rate": 5.243448936188536e-07, + "loss": 0.9391, + "step": 26435 + }, + { + "epoch": 0.8, + "learning_rate": 5.24195436367387e-07, + "loss": 1.1807, + "step": 26436 + }, + { + "epoch": 0.8, + "learning_rate": 5.24045997924629e-07, + "loss": 1.1188, + "step": 26437 + }, + { + "epoch": 0.8, + "learning_rate": 5.238965782920005e-07, + "loss": 1.0748, + "step": 26438 + }, + { + "epoch": 0.8, + "learning_rate": 5.237471774709252e-07, + "loss": 1.1996, + "step": 26439 + }, + { + "epoch": 0.8, + "learning_rate": 5.235977954628249e-07, + "loss": 1.0681, + "step": 26440 + }, + { + "epoch": 0.8, + "learning_rate": 5.234484322691221e-07, + "loss": 1.1228, + "step": 26441 + }, + { + "epoch": 0.8, + "learning_rate": 5.232990878912381e-07, + "loss": 1.0036, + "step": 26442 + }, + { + "epoch": 0.8, + "learning_rate": 5.231497623305942e-07, + "loss": 1.2256, + "step": 26443 + }, + { + "epoch": 0.8, + "learning_rate": 5.230004555886128e-07, + "loss": 1.0963, + "step": 26444 + }, + { + "epoch": 0.8, + "learning_rate": 5.22851167666715e-07, + "loss": 1.05, + "step": 26445 + }, + { + "epoch": 0.8, + "learning_rate": 5.227018985663218e-07, + "loss": 1.0901, + "step": 26446 + }, + { + "epoch": 0.8, + "learning_rate": 5.225526482888541e-07, + "loss": 1.0321, + "step": 26447 + }, + { + "epoch": 0.8, + "learning_rate": 5.224034168357329e-07, + "loss": 1.0811, + "step": 26448 + }, + { + "epoch": 0.8, + "learning_rate": 5.222542042083786e-07, + "loss": 0.9818, + "step": 26449 + }, + { + "epoch": 0.8, + "learning_rate": 5.221050104082126e-07, + "loss": 1.086, + "step": 26450 + }, + { + "epoch": 0.8, + "learning_rate": 5.219558354366536e-07, + "loss": 1.1136, + "step": 26451 + }, + { + "epoch": 0.8, + "learning_rate": 5.218066792951224e-07, + "loss": 1.0304, + "step": 26452 + }, + { + "epoch": 0.8, + "learning_rate": 5.216575419850389e-07, + "loss": 1.1576, + "step": 26453 + }, + { + "epoch": 0.8, + "learning_rate": 5.215084235078233e-07, + "loss": 1.1412, + "step": 26454 + }, + { + "epoch": 0.8, + "learning_rate": 5.213593238648943e-07, + "loss": 1.0572, + "step": 26455 + }, + { + "epoch": 0.8, + "learning_rate": 5.212102430576713e-07, + "loss": 1.0668, + "step": 26456 + }, + { + "epoch": 0.8, + "learning_rate": 5.210611810875738e-07, + "loss": 1.155, + "step": 26457 + }, + { + "epoch": 0.8, + "learning_rate": 5.209121379560208e-07, + "loss": 1.0743, + "step": 26458 + }, + { + "epoch": 0.8, + "learning_rate": 5.207631136644317e-07, + "loss": 1.0897, + "step": 26459 + }, + { + "epoch": 0.8, + "learning_rate": 5.206141082142241e-07, + "loss": 1.0643, + "step": 26460 + }, + { + "epoch": 0.8, + "learning_rate": 5.204651216068166e-07, + "loss": 0.9096, + "step": 26461 + }, + { + "epoch": 0.8, + "learning_rate": 5.203161538436279e-07, + "loss": 1.0261, + "step": 26462 + }, + { + "epoch": 0.8, + "learning_rate": 5.201672049260767e-07, + "loss": 0.9612, + "step": 26463 + }, + { + "epoch": 0.8, + "learning_rate": 5.200182748555793e-07, + "loss": 1.0782, + "step": 26464 + }, + { + "epoch": 0.8, + "learning_rate": 5.198693636335544e-07, + "loss": 1.0778, + "step": 26465 + }, + { + "epoch": 0.8, + "learning_rate": 5.197204712614196e-07, + "loss": 0.9937, + "step": 26466 + }, + { + "epoch": 0.8, + "learning_rate": 5.195715977405929e-07, + "loss": 1.1365, + "step": 26467 + }, + { + "epoch": 0.8, + "learning_rate": 5.194227430724899e-07, + "loss": 1.1455, + "step": 26468 + }, + { + "epoch": 0.8, + "learning_rate": 5.192739072585287e-07, + "loss": 1.2615, + "step": 26469 + }, + { + "epoch": 0.8, + "learning_rate": 5.191250903001258e-07, + "loss": 1.1892, + "step": 26470 + }, + { + "epoch": 0.8, + "learning_rate": 5.189762921986983e-07, + "loss": 1.0469, + "step": 26471 + }, + { + "epoch": 0.8, + "learning_rate": 5.188275129556622e-07, + "loss": 1.1715, + "step": 26472 + }, + { + "epoch": 0.8, + "learning_rate": 5.186787525724338e-07, + "loss": 1.1873, + "step": 26473 + }, + { + "epoch": 0.8, + "learning_rate": 5.185300110504304e-07, + "loss": 0.933, + "step": 26474 + }, + { + "epoch": 0.8, + "learning_rate": 5.183812883910663e-07, + "loss": 1.1335, + "step": 26475 + }, + { + "epoch": 0.8, + "learning_rate": 5.182325845957578e-07, + "loss": 1.0049, + "step": 26476 + }, + { + "epoch": 0.8, + "learning_rate": 5.180838996659207e-07, + "loss": 1.2094, + "step": 26477 + }, + { + "epoch": 0.8, + "learning_rate": 5.179352336029705e-07, + "loss": 1.1592, + "step": 26478 + }, + { + "epoch": 0.8, + "learning_rate": 5.177865864083221e-07, + "loss": 1.1995, + "step": 26479 + }, + { + "epoch": 0.8, + "learning_rate": 5.176379580833915e-07, + "loss": 1.124, + "step": 26480 + }, + { + "epoch": 0.8, + "learning_rate": 5.174893486295921e-07, + "loss": 1.0143, + "step": 26481 + }, + { + "epoch": 0.8, + "learning_rate": 5.173407580483392e-07, + "loss": 1.0646, + "step": 26482 + }, + { + "epoch": 0.8, + "learning_rate": 5.171921863410476e-07, + "loss": 1.1096, + "step": 26483 + }, + { + "epoch": 0.8, + "learning_rate": 5.17043633509132e-07, + "loss": 1.1071, + "step": 26484 + }, + { + "epoch": 0.8, + "learning_rate": 5.168950995540054e-07, + "loss": 1.0851, + "step": 26485 + }, + { + "epoch": 0.8, + "learning_rate": 5.167465844770822e-07, + "loss": 1.0455, + "step": 26486 + }, + { + "epoch": 0.8, + "learning_rate": 5.165980882797764e-07, + "loss": 1.1796, + "step": 26487 + }, + { + "epoch": 0.8, + "learning_rate": 5.164496109635015e-07, + "loss": 1.0919, + "step": 26488 + }, + { + "epoch": 0.8, + "learning_rate": 5.163011525296718e-07, + "loss": 1.0374, + "step": 26489 + }, + { + "epoch": 0.8, + "learning_rate": 5.16152712979699e-07, + "loss": 0.9885, + "step": 26490 + }, + { + "epoch": 0.8, + "learning_rate": 5.160042923149969e-07, + "loss": 1.1141, + "step": 26491 + }, + { + "epoch": 0.8, + "learning_rate": 5.158558905369784e-07, + "loss": 1.1041, + "step": 26492 + }, + { + "epoch": 0.8, + "learning_rate": 5.15707507647057e-07, + "loss": 1.1447, + "step": 26493 + }, + { + "epoch": 0.8, + "learning_rate": 5.155591436466437e-07, + "loss": 1.1255, + "step": 26494 + }, + { + "epoch": 0.8, + "learning_rate": 5.154107985371517e-07, + "loss": 1.1162, + "step": 26495 + }, + { + "epoch": 0.8, + "learning_rate": 5.152624723199928e-07, + "loss": 1.0646, + "step": 26496 + }, + { + "epoch": 0.8, + "learning_rate": 5.151141649965805e-07, + "loss": 1.1342, + "step": 26497 + }, + { + "epoch": 0.8, + "learning_rate": 5.149658765683244e-07, + "loss": 1.2705, + "step": 26498 + }, + { + "epoch": 0.8, + "learning_rate": 5.14817607036637e-07, + "loss": 1.0936, + "step": 26499 + }, + { + "epoch": 0.8, + "learning_rate": 5.146693564029301e-07, + "loss": 1.224, + "step": 26500 + }, + { + "epoch": 0.8, + "learning_rate": 5.145211246686146e-07, + "loss": 1.066, + "step": 26501 + }, + { + "epoch": 0.8, + "learning_rate": 5.143729118351018e-07, + "loss": 1.0957, + "step": 26502 + }, + { + "epoch": 0.8, + "learning_rate": 5.142247179038027e-07, + "loss": 1.1, + "step": 26503 + }, + { + "epoch": 0.8, + "learning_rate": 5.140765428761277e-07, + "loss": 1.0883, + "step": 26504 + }, + { + "epoch": 0.8, + "learning_rate": 5.139283867534878e-07, + "loss": 1.029, + "step": 26505 + }, + { + "epoch": 0.8, + "learning_rate": 5.137802495372934e-07, + "loss": 1.1457, + "step": 26506 + }, + { + "epoch": 0.8, + "learning_rate": 5.136321312289541e-07, + "loss": 1.2058, + "step": 26507 + }, + { + "epoch": 0.8, + "learning_rate": 5.134840318298803e-07, + "loss": 1.0349, + "step": 26508 + }, + { + "epoch": 0.8, + "learning_rate": 5.133359513414815e-07, + "loss": 1.1097, + "step": 26509 + }, + { + "epoch": 0.8, + "learning_rate": 5.131878897651685e-07, + "loss": 1.1035, + "step": 26510 + }, + { + "epoch": 0.8, + "learning_rate": 5.130398471023492e-07, + "loss": 1.0613, + "step": 26511 + }, + { + "epoch": 0.8, + "learning_rate": 5.128918233544336e-07, + "loss": 1.0175, + "step": 26512 + }, + { + "epoch": 0.8, + "learning_rate": 5.127438185228309e-07, + "loss": 1.1235, + "step": 26513 + }, + { + "epoch": 0.8, + "learning_rate": 5.125958326089498e-07, + "loss": 1.0873, + "step": 26514 + }, + { + "epoch": 0.8, + "learning_rate": 5.124478656141998e-07, + "loss": 1.0804, + "step": 26515 + }, + { + "epoch": 0.8, + "learning_rate": 5.122999175399884e-07, + "loss": 1.0408, + "step": 26516 + }, + { + "epoch": 0.8, + "learning_rate": 5.121519883877243e-07, + "loss": 1.1288, + "step": 26517 + }, + { + "epoch": 0.8, + "learning_rate": 5.120040781588162e-07, + "loss": 1.1123, + "step": 26518 + }, + { + "epoch": 0.8, + "learning_rate": 5.118561868546724e-07, + "loss": 1.125, + "step": 26519 + }, + { + "epoch": 0.8, + "learning_rate": 5.117083144766993e-07, + "loss": 1.1632, + "step": 26520 + }, + { + "epoch": 0.8, + "learning_rate": 5.115604610263056e-07, + "loss": 1.0914, + "step": 26521 + }, + { + "epoch": 0.8, + "learning_rate": 5.114126265048985e-07, + "loss": 1.0988, + "step": 26522 + }, + { + "epoch": 0.8, + "learning_rate": 5.112648109138862e-07, + "loss": 0.9608, + "step": 26523 + }, + { + "epoch": 0.8, + "learning_rate": 5.111170142546745e-07, + "loss": 1.2146, + "step": 26524 + }, + { + "epoch": 0.8, + "learning_rate": 5.109692365286709e-07, + "loss": 1.0374, + "step": 26525 + }, + { + "epoch": 0.8, + "learning_rate": 5.108214777372822e-07, + "loss": 1.1069, + "step": 26526 + }, + { + "epoch": 0.8, + "learning_rate": 5.106737378819152e-07, + "loss": 1.1495, + "step": 26527 + }, + { + "epoch": 0.8, + "learning_rate": 5.105260169639759e-07, + "loss": 1.0236, + "step": 26528 + }, + { + "epoch": 0.8, + "learning_rate": 5.103783149848706e-07, + "loss": 1.0825, + "step": 26529 + }, + { + "epoch": 0.8, + "learning_rate": 5.102306319460059e-07, + "loss": 1.0878, + "step": 26530 + }, + { + "epoch": 0.8, + "learning_rate": 5.10082967848787e-07, + "loss": 1.2156, + "step": 26531 + }, + { + "epoch": 0.8, + "learning_rate": 5.099353226946208e-07, + "loss": 1.1407, + "step": 26532 + }, + { + "epoch": 0.8, + "learning_rate": 5.09787696484911e-07, + "loss": 1.1236, + "step": 26533 + }, + { + "epoch": 0.8, + "learning_rate": 5.096400892210637e-07, + "loss": 0.9695, + "step": 26534 + }, + { + "epoch": 0.8, + "learning_rate": 5.094925009044843e-07, + "loss": 1.0109, + "step": 26535 + }, + { + "epoch": 0.8, + "learning_rate": 5.093449315365784e-07, + "loss": 1.2082, + "step": 26536 + }, + { + "epoch": 0.8, + "learning_rate": 5.091973811187492e-07, + "loss": 1.2191, + "step": 26537 + }, + { + "epoch": 0.8, + "learning_rate": 5.090498496524024e-07, + "loss": 0.9481, + "step": 26538 + }, + { + "epoch": 0.8, + "learning_rate": 5.089023371389418e-07, + "loss": 1.102, + "step": 26539 + }, + { + "epoch": 0.8, + "learning_rate": 5.087548435797723e-07, + "loss": 1.0886, + "step": 26540 + }, + { + "epoch": 0.8, + "learning_rate": 5.086073689762983e-07, + "loss": 1.0286, + "step": 26541 + }, + { + "epoch": 0.8, + "learning_rate": 5.084599133299222e-07, + "loss": 1.076, + "step": 26542 + }, + { + "epoch": 0.8, + "learning_rate": 5.083124766420486e-07, + "loss": 1.0686, + "step": 26543 + }, + { + "epoch": 0.8, + "learning_rate": 5.081650589140811e-07, + "loss": 1.1048, + "step": 26544 + }, + { + "epoch": 0.8, + "learning_rate": 5.080176601474235e-07, + "loss": 1.2372, + "step": 26545 + }, + { + "epoch": 0.8, + "learning_rate": 5.078702803434779e-07, + "loss": 1.1254, + "step": 26546 + }, + { + "epoch": 0.8, + "learning_rate": 5.077229195036476e-07, + "loss": 1.1266, + "step": 26547 + }, + { + "epoch": 0.8, + "learning_rate": 5.075755776293356e-07, + "loss": 1.1453, + "step": 26548 + }, + { + "epoch": 0.8, + "learning_rate": 5.074282547219452e-07, + "loss": 1.0429, + "step": 26549 + }, + { + "epoch": 0.8, + "learning_rate": 5.072809507828778e-07, + "loss": 1.0894, + "step": 26550 + }, + { + "epoch": 0.8, + "learning_rate": 5.071336658135357e-07, + "loss": 1.1555, + "step": 26551 + }, + { + "epoch": 0.8, + "learning_rate": 5.069863998153213e-07, + "loss": 1.0958, + "step": 26552 + }, + { + "epoch": 0.8, + "learning_rate": 5.068391527896366e-07, + "loss": 1.0743, + "step": 26553 + }, + { + "epoch": 0.8, + "learning_rate": 5.066919247378832e-07, + "loss": 1.2765, + "step": 26554 + }, + { + "epoch": 0.8, + "learning_rate": 5.065447156614628e-07, + "loss": 1.0628, + "step": 26555 + }, + { + "epoch": 0.8, + "learning_rate": 5.06397525561777e-07, + "loss": 1.0798, + "step": 26556 + }, + { + "epoch": 0.8, + "learning_rate": 5.062503544402261e-07, + "loss": 1.1554, + "step": 26557 + }, + { + "epoch": 0.8, + "learning_rate": 5.061032022982115e-07, + "loss": 1.0253, + "step": 26558 + }, + { + "epoch": 0.8, + "learning_rate": 5.059560691371343e-07, + "loss": 1.0947, + "step": 26559 + }, + { + "epoch": 0.8, + "learning_rate": 5.05808954958395e-07, + "loss": 1.2061, + "step": 26560 + }, + { + "epoch": 0.8, + "learning_rate": 5.056618597633939e-07, + "loss": 1.0081, + "step": 26561 + }, + { + "epoch": 0.8, + "learning_rate": 5.05514783553532e-07, + "loss": 1.1285, + "step": 26562 + }, + { + "epoch": 0.8, + "learning_rate": 5.053677263302082e-07, + "loss": 1.1461, + "step": 26563 + }, + { + "epoch": 0.8, + "learning_rate": 5.052206880948229e-07, + "loss": 1.0767, + "step": 26564 + }, + { + "epoch": 0.8, + "learning_rate": 5.050736688487762e-07, + "loss": 1.0685, + "step": 26565 + }, + { + "epoch": 0.8, + "learning_rate": 5.04926668593467e-07, + "loss": 1.1021, + "step": 26566 + }, + { + "epoch": 0.8, + "learning_rate": 5.04779687330296e-07, + "loss": 1.1604, + "step": 26567 + }, + { + "epoch": 0.8, + "learning_rate": 5.046327250606606e-07, + "loss": 1.1337, + "step": 26568 + }, + { + "epoch": 0.8, + "learning_rate": 5.044857817859608e-07, + "loss": 0.996, + "step": 26569 + }, + { + "epoch": 0.8, + "learning_rate": 5.043388575075953e-07, + "loss": 1.0599, + "step": 26570 + }, + { + "epoch": 0.8, + "learning_rate": 5.041919522269631e-07, + "loss": 1.0679, + "step": 26571 + }, + { + "epoch": 0.8, + "learning_rate": 5.04045065945462e-07, + "loss": 1.0239, + "step": 26572 + }, + { + "epoch": 0.8, + "learning_rate": 5.038981986644903e-07, + "loss": 1.1609, + "step": 26573 + }, + { + "epoch": 0.8, + "learning_rate": 5.037513503854465e-07, + "loss": 1.1208, + "step": 26574 + }, + { + "epoch": 0.8, + "learning_rate": 5.036045211097293e-07, + "loss": 1.1061, + "step": 26575 + }, + { + "epoch": 0.8, + "learning_rate": 5.034577108387348e-07, + "loss": 1.1243, + "step": 26576 + }, + { + "epoch": 0.8, + "learning_rate": 5.033109195738611e-07, + "loss": 1.1032, + "step": 26577 + }, + { + "epoch": 0.8, + "learning_rate": 5.031641473165061e-07, + "loss": 1.0242, + "step": 26578 + }, + { + "epoch": 0.8, + "learning_rate": 5.030173940680666e-07, + "loss": 1.1288, + "step": 26579 + }, + { + "epoch": 0.8, + "learning_rate": 5.028706598299402e-07, + "loss": 1.0972, + "step": 26580 + }, + { + "epoch": 0.8, + "learning_rate": 5.027239446035228e-07, + "loss": 1.1516, + "step": 26581 + }, + { + "epoch": 0.8, + "learning_rate": 5.025772483902114e-07, + "loss": 1.0814, + "step": 26582 + }, + { + "epoch": 0.8, + "learning_rate": 5.024305711914026e-07, + "loss": 1.1888, + "step": 26583 + }, + { + "epoch": 0.8, + "learning_rate": 5.02283913008493e-07, + "loss": 1.1403, + "step": 26584 + }, + { + "epoch": 0.8, + "learning_rate": 5.021372738428782e-07, + "loss": 1.1315, + "step": 26585 + }, + { + "epoch": 0.8, + "learning_rate": 5.019906536959542e-07, + "loss": 1.1039, + "step": 26586 + }, + { + "epoch": 0.8, + "learning_rate": 5.01844052569117e-07, + "loss": 1.0626, + "step": 26587 + }, + { + "epoch": 0.8, + "learning_rate": 5.016974704637629e-07, + "loss": 1.0563, + "step": 26588 + }, + { + "epoch": 0.8, + "learning_rate": 5.015509073812857e-07, + "loss": 1.0476, + "step": 26589 + }, + { + "epoch": 0.8, + "learning_rate": 5.014043633230814e-07, + "loss": 1.0573, + "step": 26590 + }, + { + "epoch": 0.8, + "learning_rate": 5.01257838290545e-07, + "loss": 1.0923, + "step": 26591 + }, + { + "epoch": 0.8, + "learning_rate": 5.011113322850714e-07, + "loss": 1.1656, + "step": 26592 + }, + { + "epoch": 0.8, + "learning_rate": 5.009648453080556e-07, + "loss": 1.118, + "step": 26593 + }, + { + "epoch": 0.8, + "learning_rate": 5.008183773608913e-07, + "loss": 1.1957, + "step": 26594 + }, + { + "epoch": 0.8, + "learning_rate": 5.006719284449732e-07, + "loss": 0.9793, + "step": 26595 + }, + { + "epoch": 0.8, + "learning_rate": 5.005254985616953e-07, + "loss": 1.083, + "step": 26596 + }, + { + "epoch": 0.8, + "learning_rate": 5.003790877124526e-07, + "loss": 1.0811, + "step": 26597 + }, + { + "epoch": 0.8, + "learning_rate": 5.00232695898637e-07, + "loss": 1.0984, + "step": 26598 + }, + { + "epoch": 0.8, + "learning_rate": 5.000863231216433e-07, + "loss": 1.2212, + "step": 26599 + }, + { + "epoch": 0.8, + "learning_rate": 4.999399693828641e-07, + "loss": 1.1971, + "step": 26600 + }, + { + "epoch": 0.8, + "learning_rate": 4.997936346836943e-07, + "loss": 1.0867, + "step": 26601 + }, + { + "epoch": 0.8, + "learning_rate": 4.99647319025525e-07, + "loss": 1.0501, + "step": 26602 + }, + { + "epoch": 0.8, + "learning_rate": 4.995010224097496e-07, + "loss": 1.0167, + "step": 26603 + }, + { + "epoch": 0.8, + "learning_rate": 4.993547448377611e-07, + "loss": 1.0903, + "step": 26604 + }, + { + "epoch": 0.8, + "learning_rate": 4.992084863109519e-07, + "loss": 0.9753, + "step": 26605 + }, + { + "epoch": 0.8, + "learning_rate": 4.990622468307149e-07, + "loss": 1.0917, + "step": 26606 + }, + { + "epoch": 0.8, + "learning_rate": 4.98916026398441e-07, + "loss": 1.0113, + "step": 26607 + }, + { + "epoch": 0.8, + "learning_rate": 4.98769825015523e-07, + "loss": 1.0452, + "step": 26608 + }, + { + "epoch": 0.8, + "learning_rate": 4.986236426833521e-07, + "loss": 1.0274, + "step": 26609 + }, + { + "epoch": 0.8, + "learning_rate": 4.984774794033207e-07, + "loss": 1.0813, + "step": 26610 + }, + { + "epoch": 0.8, + "learning_rate": 4.983313351768193e-07, + "loss": 1.1136, + "step": 26611 + }, + { + "epoch": 0.8, + "learning_rate": 4.981852100052395e-07, + "loss": 1.08, + "step": 26612 + }, + { + "epoch": 0.8, + "learning_rate": 4.980391038899727e-07, + "loss": 1.2363, + "step": 26613 + }, + { + "epoch": 0.8, + "learning_rate": 4.9789301683241e-07, + "loss": 1.0733, + "step": 26614 + }, + { + "epoch": 0.8, + "learning_rate": 4.977469488339406e-07, + "loss": 1.0422, + "step": 26615 + }, + { + "epoch": 0.8, + "learning_rate": 4.976008998959564e-07, + "loss": 1.0977, + "step": 26616 + }, + { + "epoch": 0.8, + "learning_rate": 4.97454870019847e-07, + "loss": 1.0081, + "step": 26617 + }, + { + "epoch": 0.8, + "learning_rate": 4.973088592070027e-07, + "loss": 1.0223, + "step": 26618 + }, + { + "epoch": 0.8, + "learning_rate": 4.971628674588144e-07, + "loss": 1.1136, + "step": 26619 + }, + { + "epoch": 0.8, + "learning_rate": 4.970168947766702e-07, + "loss": 1.042, + "step": 26620 + }, + { + "epoch": 0.8, + "learning_rate": 4.968709411619604e-07, + "loss": 1.2106, + "step": 26621 + }, + { + "epoch": 0.8, + "learning_rate": 4.967250066160747e-07, + "loss": 1.1032, + "step": 26622 + }, + { + "epoch": 0.8, + "learning_rate": 4.965790911404025e-07, + "loss": 1.0847, + "step": 26623 + }, + { + "epoch": 0.8, + "learning_rate": 4.964331947363321e-07, + "loss": 1.1041, + "step": 26624 + }, + { + "epoch": 0.8, + "learning_rate": 4.962873174052526e-07, + "loss": 1.194, + "step": 26625 + }, + { + "epoch": 0.8, + "learning_rate": 4.96141459148553e-07, + "loss": 1.0407, + "step": 26626 + }, + { + "epoch": 0.8, + "learning_rate": 4.959956199676222e-07, + "loss": 1.204, + "step": 26627 + }, + { + "epoch": 0.8, + "learning_rate": 4.958497998638473e-07, + "loss": 1.053, + "step": 26628 + }, + { + "epoch": 0.8, + "learning_rate": 4.95703998838617e-07, + "loss": 1.2064, + "step": 26629 + }, + { + "epoch": 0.8, + "learning_rate": 4.955582168933193e-07, + "loss": 1.0875, + "step": 26630 + }, + { + "epoch": 0.8, + "learning_rate": 4.95412454029342e-07, + "loss": 1.028, + "step": 26631 + }, + { + "epoch": 0.8, + "learning_rate": 4.952667102480732e-07, + "loss": 1.1951, + "step": 26632 + }, + { + "epoch": 0.8, + "learning_rate": 4.951209855508996e-07, + "loss": 1.0355, + "step": 26633 + }, + { + "epoch": 0.8, + "learning_rate": 4.949752799392083e-07, + "loss": 1.087, + "step": 26634 + }, + { + "epoch": 0.8, + "learning_rate": 4.948295934143865e-07, + "loss": 1.0961, + "step": 26635 + }, + { + "epoch": 0.8, + "learning_rate": 4.946839259778216e-07, + "loss": 1.1357, + "step": 26636 + }, + { + "epoch": 0.8, + "learning_rate": 4.945382776308999e-07, + "loss": 1.0746, + "step": 26637 + }, + { + "epoch": 0.8, + "learning_rate": 4.943926483750084e-07, + "loss": 1.1583, + "step": 26638 + }, + { + "epoch": 0.8, + "learning_rate": 4.942470382115324e-07, + "loss": 1.1035, + "step": 26639 + }, + { + "epoch": 0.8, + "learning_rate": 4.941014471418587e-07, + "loss": 1.175, + "step": 26640 + }, + { + "epoch": 0.8, + "learning_rate": 4.939558751673732e-07, + "loss": 1.1282, + "step": 26641 + }, + { + "epoch": 0.8, + "learning_rate": 4.938103222894613e-07, + "loss": 1.2959, + "step": 26642 + }, + { + "epoch": 0.8, + "learning_rate": 4.936647885095092e-07, + "loss": 1.2157, + "step": 26643 + }, + { + "epoch": 0.8, + "learning_rate": 4.935192738289018e-07, + "loss": 1.042, + "step": 26644 + }, + { + "epoch": 0.8, + "learning_rate": 4.933737782490252e-07, + "loss": 1.0693, + "step": 26645 + }, + { + "epoch": 0.8, + "learning_rate": 4.932283017712636e-07, + "loss": 1.0978, + "step": 26646 + }, + { + "epoch": 0.8, + "learning_rate": 4.930828443970015e-07, + "loss": 1.0382, + "step": 26647 + }, + { + "epoch": 0.8, + "learning_rate": 4.929374061276246e-07, + "loss": 1.2322, + "step": 26648 + }, + { + "epoch": 0.8, + "learning_rate": 4.927919869645173e-07, + "loss": 1.218, + "step": 26649 + }, + { + "epoch": 0.8, + "learning_rate": 4.926465869090632e-07, + "loss": 1.0464, + "step": 26650 + }, + { + "epoch": 0.8, + "learning_rate": 4.925012059626466e-07, + "loss": 1.1028, + "step": 26651 + }, + { + "epoch": 0.8, + "learning_rate": 4.923558441266518e-07, + "loss": 1.0266, + "step": 26652 + }, + { + "epoch": 0.8, + "learning_rate": 4.92210501402463e-07, + "loss": 1.1301, + "step": 26653 + }, + { + "epoch": 0.8, + "learning_rate": 4.920651777914625e-07, + "loss": 1.2329, + "step": 26654 + }, + { + "epoch": 0.8, + "learning_rate": 4.919198732950348e-07, + "loss": 1.1173, + "step": 26655 + }, + { + "epoch": 0.8, + "learning_rate": 4.917745879145625e-07, + "loss": 1.1777, + "step": 26656 + }, + { + "epoch": 0.8, + "learning_rate": 4.916293216514289e-07, + "loss": 1.0613, + "step": 26657 + }, + { + "epoch": 0.8, + "learning_rate": 4.91484074507018e-07, + "loss": 1.1031, + "step": 26658 + }, + { + "epoch": 0.8, + "learning_rate": 4.913388464827102e-07, + "loss": 1.1342, + "step": 26659 + }, + { + "epoch": 0.8, + "learning_rate": 4.911936375798893e-07, + "loss": 1.1245, + "step": 26660 + }, + { + "epoch": 0.8, + "learning_rate": 4.910484477999375e-07, + "loss": 1.1357, + "step": 26661 + }, + { + "epoch": 0.8, + "learning_rate": 4.909032771442376e-07, + "loss": 1.0288, + "step": 26662 + }, + { + "epoch": 0.8, + "learning_rate": 4.907581256141705e-07, + "loss": 1.1141, + "step": 26663 + }, + { + "epoch": 0.8, + "learning_rate": 4.906129932111181e-07, + "loss": 1.0637, + "step": 26664 + }, + { + "epoch": 0.8, + "learning_rate": 4.90467879936462e-07, + "loss": 1.1397, + "step": 26665 + }, + { + "epoch": 0.8, + "learning_rate": 4.903227857915843e-07, + "loss": 1.0149, + "step": 26666 + }, + { + "epoch": 0.8, + "learning_rate": 4.901777107778657e-07, + "loss": 1.1617, + "step": 26667 + }, + { + "epoch": 0.8, + "learning_rate": 4.900326548966871e-07, + "loss": 1.1689, + "step": 26668 + }, + { + "epoch": 0.8, + "learning_rate": 4.8988761814943e-07, + "loss": 1.0139, + "step": 26669 + }, + { + "epoch": 0.8, + "learning_rate": 4.89742600537475e-07, + "loss": 1.085, + "step": 26670 + }, + { + "epoch": 0.8, + "learning_rate": 4.895976020622018e-07, + "loss": 1.0521, + "step": 26671 + }, + { + "epoch": 0.8, + "learning_rate": 4.89452622724991e-07, + "loss": 1.0351, + "step": 26672 + }, + { + "epoch": 0.8, + "learning_rate": 4.893076625272228e-07, + "loss": 1.1569, + "step": 26673 + }, + { + "epoch": 0.8, + "learning_rate": 4.891627214702777e-07, + "loss": 1.0633, + "step": 26674 + }, + { + "epoch": 0.8, + "learning_rate": 4.890177995555353e-07, + "loss": 0.9084, + "step": 26675 + }, + { + "epoch": 0.8, + "learning_rate": 4.888728967843745e-07, + "loss": 1.0567, + "step": 26676 + }, + { + "epoch": 0.8, + "learning_rate": 4.887280131581751e-07, + "loss": 1.1077, + "step": 26677 + }, + { + "epoch": 0.8, + "learning_rate": 4.885831486783163e-07, + "loss": 1.074, + "step": 26678 + }, + { + "epoch": 0.8, + "learning_rate": 4.884383033461779e-07, + "loss": 1.1755, + "step": 26679 + }, + { + "epoch": 0.8, + "learning_rate": 4.882934771631373e-07, + "loss": 1.1857, + "step": 26680 + }, + { + "epoch": 0.8, + "learning_rate": 4.881486701305738e-07, + "loss": 1.0934, + "step": 26681 + }, + { + "epoch": 0.8, + "learning_rate": 4.880038822498662e-07, + "loss": 1.1019, + "step": 26682 + }, + { + "epoch": 0.8, + "learning_rate": 4.878591135223934e-07, + "loss": 1.0472, + "step": 26683 + }, + { + "epoch": 0.8, + "learning_rate": 4.877143639495319e-07, + "loss": 1.0364, + "step": 26684 + }, + { + "epoch": 0.8, + "learning_rate": 4.875696335326608e-07, + "loss": 1.2593, + "step": 26685 + }, + { + "epoch": 0.8, + "learning_rate": 4.874249222731573e-07, + "loss": 1.1403, + "step": 26686 + }, + { + "epoch": 0.8, + "learning_rate": 4.872802301723992e-07, + "loss": 1.0743, + "step": 26687 + }, + { + "epoch": 0.8, + "learning_rate": 4.871355572317648e-07, + "loss": 1.0808, + "step": 26688 + }, + { + "epoch": 0.8, + "learning_rate": 4.869909034526296e-07, + "loss": 1.0662, + "step": 26689 + }, + { + "epoch": 0.8, + "learning_rate": 4.868462688363717e-07, + "loss": 1.0548, + "step": 26690 + }, + { + "epoch": 0.8, + "learning_rate": 4.867016533843677e-07, + "loss": 1.0464, + "step": 26691 + }, + { + "epoch": 0.8, + "learning_rate": 4.865570570979944e-07, + "loss": 1.0463, + "step": 26692 + }, + { + "epoch": 0.8, + "learning_rate": 4.86412479978628e-07, + "loss": 1.2435, + "step": 26693 + }, + { + "epoch": 0.8, + "learning_rate": 4.86267922027645e-07, + "loss": 1.0678, + "step": 26694 + }, + { + "epoch": 0.8, + "learning_rate": 4.861233832464218e-07, + "loss": 1.0805, + "step": 26695 + }, + { + "epoch": 0.8, + "learning_rate": 4.859788636363346e-07, + "loss": 1.1094, + "step": 26696 + }, + { + "epoch": 0.8, + "learning_rate": 4.858343631987581e-07, + "loss": 0.9767, + "step": 26697 + }, + { + "epoch": 0.8, + "learning_rate": 4.85689881935068e-07, + "loss": 1.1155, + "step": 26698 + }, + { + "epoch": 0.8, + "learning_rate": 4.855454198466405e-07, + "loss": 0.9399, + "step": 26699 + }, + { + "epoch": 0.8, + "learning_rate": 4.854009769348502e-07, + "loss": 0.9948, + "step": 26700 + }, + { + "epoch": 0.8, + "learning_rate": 4.852565532010731e-07, + "loss": 1.1743, + "step": 26701 + }, + { + "epoch": 0.8, + "learning_rate": 4.851121486466828e-07, + "loss": 1.12, + "step": 26702 + }, + { + "epoch": 0.8, + "learning_rate": 4.84967763273054e-07, + "loss": 1.0994, + "step": 26703 + }, + { + "epoch": 0.8, + "learning_rate": 4.848233970815619e-07, + "loss": 1.3264, + "step": 26704 + }, + { + "epoch": 0.8, + "learning_rate": 4.846790500735812e-07, + "loss": 1.1763, + "step": 26705 + }, + { + "epoch": 0.8, + "learning_rate": 4.845347222504845e-07, + "loss": 1.0808, + "step": 26706 + }, + { + "epoch": 0.8, + "learning_rate": 4.843904136136468e-07, + "loss": 0.9594, + "step": 26707 + }, + { + "epoch": 0.8, + "learning_rate": 4.842461241644414e-07, + "loss": 1.1879, + "step": 26708 + }, + { + "epoch": 0.8, + "learning_rate": 4.84101853904243e-07, + "loss": 1.13, + "step": 26709 + }, + { + "epoch": 0.8, + "learning_rate": 4.839576028344232e-07, + "loss": 1.133, + "step": 26710 + }, + { + "epoch": 0.8, + "learning_rate": 4.838133709563561e-07, + "loss": 1.0695, + "step": 26711 + }, + { + "epoch": 0.8, + "learning_rate": 4.836691582714145e-07, + "loss": 0.9899, + "step": 26712 + }, + { + "epoch": 0.8, + "learning_rate": 4.835249647809717e-07, + "loss": 1.0833, + "step": 26713 + }, + { + "epoch": 0.8, + "learning_rate": 4.833807904864005e-07, + "loss": 1.0747, + "step": 26714 + }, + { + "epoch": 0.8, + "learning_rate": 4.832366353890724e-07, + "loss": 1.082, + "step": 26715 + }, + { + "epoch": 0.8, + "learning_rate": 4.830924994903602e-07, + "loss": 0.9834, + "step": 26716 + }, + { + "epoch": 0.8, + "learning_rate": 4.829483827916362e-07, + "loss": 1.1937, + "step": 26717 + }, + { + "epoch": 0.8, + "learning_rate": 4.828042852942719e-07, + "loss": 0.9649, + "step": 26718 + }, + { + "epoch": 0.8, + "learning_rate": 4.826602069996394e-07, + "loss": 1.0088, + "step": 26719 + }, + { + "epoch": 0.8, + "learning_rate": 4.8251614790911e-07, + "loss": 1.1026, + "step": 26720 + }, + { + "epoch": 0.8, + "learning_rate": 4.823721080240562e-07, + "loss": 1.0761, + "step": 26721 + }, + { + "epoch": 0.81, + "learning_rate": 4.822280873458474e-07, + "loss": 1.0041, + "step": 26722 + }, + { + "epoch": 0.81, + "learning_rate": 4.820840858758552e-07, + "loss": 1.1349, + "step": 26723 + }, + { + "epoch": 0.81, + "learning_rate": 4.819401036154508e-07, + "loss": 1.2547, + "step": 26724 + }, + { + "epoch": 0.81, + "learning_rate": 4.817961405660046e-07, + "loss": 1.0748, + "step": 26725 + }, + { + "epoch": 0.81, + "learning_rate": 4.816521967288873e-07, + "loss": 1.0695, + "step": 26726 + }, + { + "epoch": 0.81, + "learning_rate": 4.815082721054698e-07, + "loss": 1.0894, + "step": 26727 + }, + { + "epoch": 0.81, + "learning_rate": 4.813643666971205e-07, + "loss": 1.1099, + "step": 26728 + }, + { + "epoch": 0.81, + "learning_rate": 4.812204805052101e-07, + "loss": 1.1324, + "step": 26729 + }, + { + "epoch": 0.81, + "learning_rate": 4.810766135311087e-07, + "loss": 1.1479, + "step": 26730 + }, + { + "epoch": 0.81, + "learning_rate": 4.809327657761861e-07, + "loss": 1.2925, + "step": 26731 + }, + { + "epoch": 0.81, + "learning_rate": 4.807889372418107e-07, + "loss": 1.1049, + "step": 26732 + }, + { + "epoch": 0.81, + "learning_rate": 4.80645127929352e-07, + "loss": 1.0289, + "step": 26733 + }, + { + "epoch": 0.81, + "learning_rate": 4.80501337840179e-07, + "loss": 0.9136, + "step": 26734 + }, + { + "epoch": 0.81, + "learning_rate": 4.803575669756616e-07, + "loss": 1.061, + "step": 26735 + }, + { + "epoch": 0.81, + "learning_rate": 4.802138153371666e-07, + "loss": 1.0251, + "step": 26736 + }, + { + "epoch": 0.81, + "learning_rate": 4.800700829260635e-07, + "loss": 1.2432, + "step": 26737 + }, + { + "epoch": 0.81, + "learning_rate": 4.799263697437201e-07, + "loss": 1.0213, + "step": 26738 + }, + { + "epoch": 0.81, + "learning_rate": 4.797826757915051e-07, + "loss": 1.0154, + "step": 26739 + }, + { + "epoch": 0.81, + "learning_rate": 4.796390010707863e-07, + "loss": 1.1151, + "step": 26740 + }, + { + "epoch": 0.81, + "learning_rate": 4.794953455829307e-07, + "loss": 1.2255, + "step": 26741 + }, + { + "epoch": 0.81, + "learning_rate": 4.793517093293063e-07, + "loss": 0.9701, + "step": 26742 + }, + { + "epoch": 0.81, + "learning_rate": 4.792080923112805e-07, + "loss": 1.0781, + "step": 26743 + }, + { + "epoch": 0.81, + "learning_rate": 4.790644945302212e-07, + "loss": 1.0479, + "step": 26744 + }, + { + "epoch": 0.81, + "learning_rate": 4.789209159874936e-07, + "loss": 1.0458, + "step": 26745 + }, + { + "epoch": 0.81, + "learning_rate": 4.787773566844658e-07, + "loss": 1.1274, + "step": 26746 + }, + { + "epoch": 0.81, + "learning_rate": 4.786338166225041e-07, + "loss": 1.2301, + "step": 26747 + }, + { + "epoch": 0.81, + "learning_rate": 4.784902958029746e-07, + "loss": 1.0396, + "step": 26748 + }, + { + "epoch": 0.81, + "learning_rate": 4.783467942272444e-07, + "loss": 1.093, + "step": 26749 + }, + { + "epoch": 0.81, + "learning_rate": 4.782033118966786e-07, + "loss": 1.1595, + "step": 26750 + }, + { + "epoch": 0.81, + "learning_rate": 4.780598488126437e-07, + "loss": 1.074, + "step": 26751 + }, + { + "epoch": 0.81, + "learning_rate": 4.779164049765053e-07, + "loss": 1.1156, + "step": 26752 + }, + { + "epoch": 0.81, + "learning_rate": 4.777729803896295e-07, + "loss": 1.1522, + "step": 26753 + }, + { + "epoch": 0.81, + "learning_rate": 4.776295750533802e-07, + "loss": 1.0342, + "step": 26754 + }, + { + "epoch": 0.81, + "learning_rate": 4.774861889691235e-07, + "loss": 1.1772, + "step": 26755 + }, + { + "epoch": 0.81, + "learning_rate": 4.773428221382242e-07, + "loss": 1.1407, + "step": 26756 + }, + { + "epoch": 0.81, + "learning_rate": 4.771994745620476e-07, + "loss": 1.1052, + "step": 26757 + }, + { + "epoch": 0.81, + "learning_rate": 4.770561462419573e-07, + "loss": 1.0309, + "step": 26758 + }, + { + "epoch": 0.81, + "learning_rate": 4.769128371793181e-07, + "loss": 1.0909, + "step": 26759 + }, + { + "epoch": 0.81, + "learning_rate": 4.7676954737549436e-07, + "loss": 1.0845, + "step": 26760 + }, + { + "epoch": 0.81, + "learning_rate": 4.766262768318508e-07, + "loss": 1.1458, + "step": 26761 + }, + { + "epoch": 0.81, + "learning_rate": 4.764830255497499e-07, + "loss": 1.2075, + "step": 26762 + }, + { + "epoch": 0.81, + "learning_rate": 4.763397935305561e-07, + "loss": 1.0466, + "step": 26763 + }, + { + "epoch": 0.81, + "learning_rate": 4.7619658077563275e-07, + "loss": 1.108, + "step": 26764 + }, + { + "epoch": 0.81, + "learning_rate": 4.7605338728634323e-07, + "loss": 1.1584, + "step": 26765 + }, + { + "epoch": 0.81, + "learning_rate": 4.7591021306405137e-07, + "loss": 1.0999, + "step": 26766 + }, + { + "epoch": 0.81, + "learning_rate": 4.75767058110119e-07, + "loss": 1.1898, + "step": 26767 + }, + { + "epoch": 0.81, + "learning_rate": 4.7562392242590903e-07, + "loss": 1.2347, + "step": 26768 + }, + { + "epoch": 0.81, + "learning_rate": 4.754808060127844e-07, + "loss": 1.1545, + "step": 26769 + }, + { + "epoch": 0.81, + "learning_rate": 4.7533770887210837e-07, + "loss": 1.0637, + "step": 26770 + }, + { + "epoch": 0.81, + "learning_rate": 4.751946310052413e-07, + "loss": 1.1127, + "step": 26771 + }, + { + "epoch": 0.81, + "learning_rate": 4.7505157241354625e-07, + "loss": 1.0452, + "step": 26772 + }, + { + "epoch": 0.81, + "learning_rate": 4.749085330983852e-07, + "loss": 1.2263, + "step": 26773 + }, + { + "epoch": 0.81, + "learning_rate": 4.7476551306111924e-07, + "loss": 1.0388, + "step": 26774 + }, + { + "epoch": 0.81, + "learning_rate": 4.746225123031104e-07, + "loss": 1.2545, + "step": 26775 + }, + { + "epoch": 0.81, + "learning_rate": 4.744795308257197e-07, + "loss": 1.1263, + "step": 26776 + }, + { + "epoch": 0.81, + "learning_rate": 4.7433656863030833e-07, + "loss": 1.0969, + "step": 26777 + }, + { + "epoch": 0.81, + "learning_rate": 4.741936257182375e-07, + "loss": 1.1104, + "step": 26778 + }, + { + "epoch": 0.81, + "learning_rate": 4.74050702090868e-07, + "loss": 1.0707, + "step": 26779 + }, + { + "epoch": 0.81, + "learning_rate": 4.7390779774955956e-07, + "loss": 1.1014, + "step": 26780 + }, + { + "epoch": 0.81, + "learning_rate": 4.737649126956731e-07, + "loss": 1.1329, + "step": 26781 + }, + { + "epoch": 0.81, + "learning_rate": 4.7362204693056886e-07, + "loss": 1.1418, + "step": 26782 + }, + { + "epoch": 0.81, + "learning_rate": 4.734792004556074e-07, + "loss": 1.0622, + "step": 26783 + }, + { + "epoch": 0.81, + "learning_rate": 4.7333637327214745e-07, + "loss": 1.0623, + "step": 26784 + }, + { + "epoch": 0.81, + "learning_rate": 4.7319356538154893e-07, + "loss": 1.0541, + "step": 26785 + }, + { + "epoch": 0.81, + "learning_rate": 4.730507767851716e-07, + "loss": 1.04, + "step": 26786 + }, + { + "epoch": 0.81, + "learning_rate": 4.729080074843753e-07, + "loss": 1.2128, + "step": 26787 + }, + { + "epoch": 0.81, + "learning_rate": 4.727652574805178e-07, + "loss": 1.0996, + "step": 26788 + }, + { + "epoch": 0.81, + "learning_rate": 4.726225267749587e-07, + "loss": 1.1866, + "step": 26789 + }, + { + "epoch": 0.81, + "learning_rate": 4.7247981536905683e-07, + "loss": 1.0277, + "step": 26790 + }, + { + "epoch": 0.81, + "learning_rate": 4.7233712326417046e-07, + "loss": 0.9565, + "step": 26791 + }, + { + "epoch": 0.81, + "learning_rate": 4.721944504616588e-07, + "loss": 1.1855, + "step": 26792 + }, + { + "epoch": 0.81, + "learning_rate": 4.720517969628788e-07, + "loss": 1.07, + "step": 26793 + }, + { + "epoch": 0.81, + "learning_rate": 4.7190916276918906e-07, + "loss": 0.9344, + "step": 26794 + }, + { + "epoch": 0.81, + "learning_rate": 4.717665478819472e-07, + "loss": 1.0919, + "step": 26795 + }, + { + "epoch": 0.81, + "learning_rate": 4.716239523025118e-07, + "loss": 1.0865, + "step": 26796 + }, + { + "epoch": 0.81, + "learning_rate": 4.714813760322387e-07, + "loss": 1.153, + "step": 26797 + }, + { + "epoch": 0.81, + "learning_rate": 4.7133881907248573e-07, + "loss": 1.1696, + "step": 26798 + }, + { + "epoch": 0.81, + "learning_rate": 4.711962814246104e-07, + "loss": 1.0848, + "step": 26799 + }, + { + "epoch": 0.81, + "learning_rate": 4.710537630899695e-07, + "loss": 1.0505, + "step": 26800 + }, + { + "epoch": 0.81, + "learning_rate": 4.709112640699193e-07, + "loss": 1.1852, + "step": 26801 + }, + { + "epoch": 0.81, + "learning_rate": 4.707687843658168e-07, + "loss": 1.0508, + "step": 26802 + }, + { + "epoch": 0.81, + "learning_rate": 4.7062632397901876e-07, + "loss": 1.1682, + "step": 26803 + }, + { + "epoch": 0.81, + "learning_rate": 4.7048388291087987e-07, + "loss": 1.094, + "step": 26804 + }, + { + "epoch": 0.81, + "learning_rate": 4.703414611627574e-07, + "loss": 1.2061, + "step": 26805 + }, + { + "epoch": 0.81, + "learning_rate": 4.701990587360064e-07, + "loss": 1.1042, + "step": 26806 + }, + { + "epoch": 0.81, + "learning_rate": 4.70056675631983e-07, + "loss": 1.0348, + "step": 26807 + }, + { + "epoch": 0.81, + "learning_rate": 4.6991431185204217e-07, + "loss": 1.15, + "step": 26808 + }, + { + "epoch": 0.81, + "learning_rate": 4.697719673975401e-07, + "loss": 1.1415, + "step": 26809 + }, + { + "epoch": 0.81, + "learning_rate": 4.696296422698304e-07, + "loss": 1.0345, + "step": 26810 + }, + { + "epoch": 0.81, + "learning_rate": 4.6948733647026875e-07, + "loss": 1.2621, + "step": 26811 + }, + { + "epoch": 0.81, + "learning_rate": 4.6934505000020974e-07, + "loss": 1.0931, + "step": 26812 + }, + { + "epoch": 0.81, + "learning_rate": 4.692027828610082e-07, + "loss": 1.1641, + "step": 26813 + }, + { + "epoch": 0.81, + "learning_rate": 4.690605350540178e-07, + "loss": 1.1707, + "step": 26814 + }, + { + "epoch": 0.81, + "learning_rate": 4.68918306580593e-07, + "loss": 1.0214, + "step": 26815 + }, + { + "epoch": 0.81, + "learning_rate": 4.6877609744208743e-07, + "loss": 1.0663, + "step": 26816 + }, + { + "epoch": 0.81, + "learning_rate": 4.686339076398555e-07, + "loss": 1.2599, + "step": 26817 + }, + { + "epoch": 0.81, + "learning_rate": 4.684917371752506e-07, + "loss": 1.0677, + "step": 26818 + }, + { + "epoch": 0.81, + "learning_rate": 4.6834958604962566e-07, + "loss": 1.116, + "step": 26819 + }, + { + "epoch": 0.81, + "learning_rate": 4.6820745426433416e-07, + "loss": 1.0701, + "step": 26820 + }, + { + "epoch": 0.81, + "learning_rate": 4.68065341820729e-07, + "loss": 1.0383, + "step": 26821 + }, + { + "epoch": 0.81, + "learning_rate": 4.6792324872016403e-07, + "loss": 1.0956, + "step": 26822 + }, + { + "epoch": 0.81, + "learning_rate": 4.6778117496399046e-07, + "loss": 1.1339, + "step": 26823 + }, + { + "epoch": 0.81, + "learning_rate": 4.67639120553561e-07, + "loss": 1.2478, + "step": 26824 + }, + { + "epoch": 0.81, + "learning_rate": 4.674970854902286e-07, + "loss": 1.125, + "step": 26825 + }, + { + "epoch": 0.81, + "learning_rate": 4.673550697753454e-07, + "loss": 1.1268, + "step": 26826 + }, + { + "epoch": 0.81, + "learning_rate": 4.6721307341026257e-07, + "loss": 1.0191, + "step": 26827 + }, + { + "epoch": 0.81, + "learning_rate": 4.6707109639633235e-07, + "loss": 1.118, + "step": 26828 + }, + { + "epoch": 0.81, + "learning_rate": 4.669291387349059e-07, + "loss": 1.127, + "step": 26829 + }, + { + "epoch": 0.81, + "learning_rate": 4.6678720042733524e-07, + "loss": 1.1537, + "step": 26830 + }, + { + "epoch": 0.81, + "learning_rate": 4.6664528147497086e-07, + "loss": 1.1399, + "step": 26831 + }, + { + "epoch": 0.81, + "learning_rate": 4.665033818791642e-07, + "loss": 1.1581, + "step": 26832 + }, + { + "epoch": 0.81, + "learning_rate": 4.663615016412662e-07, + "loss": 1.061, + "step": 26833 + }, + { + "epoch": 0.81, + "learning_rate": 4.662196407626271e-07, + "loss": 0.9205, + "step": 26834 + }, + { + "epoch": 0.81, + "learning_rate": 4.660777992445981e-07, + "loss": 1.1005, + "step": 26835 + }, + { + "epoch": 0.81, + "learning_rate": 4.659359770885283e-07, + "loss": 1.1554, + "step": 26836 + }, + { + "epoch": 0.81, + "learning_rate": 4.6579417429576833e-07, + "loss": 1.1378, + "step": 26837 + }, + { + "epoch": 0.81, + "learning_rate": 4.656523908676683e-07, + "loss": 1.1924, + "step": 26838 + }, + { + "epoch": 0.81, + "learning_rate": 4.6551062680557813e-07, + "loss": 1.1608, + "step": 26839 + }, + { + "epoch": 0.81, + "learning_rate": 4.6536888211084624e-07, + "loss": 1.0491, + "step": 26840 + }, + { + "epoch": 0.81, + "learning_rate": 4.6522715678482293e-07, + "loss": 1.0574, + "step": 26841 + }, + { + "epoch": 0.81, + "learning_rate": 4.6508545082885716e-07, + "loss": 1.2547, + "step": 26842 + }, + { + "epoch": 0.81, + "learning_rate": 4.649437642442975e-07, + "loss": 1.1743, + "step": 26843 + }, + { + "epoch": 0.81, + "learning_rate": 4.64802097032494e-07, + "loss": 1.175, + "step": 26844 + }, + { + "epoch": 0.81, + "learning_rate": 4.6466044919479367e-07, + "loss": 1.0856, + "step": 26845 + }, + { + "epoch": 0.81, + "learning_rate": 4.6451882073254574e-07, + "loss": 1.1652, + "step": 26846 + }, + { + "epoch": 0.81, + "learning_rate": 4.6437721164709794e-07, + "loss": 1.0463, + "step": 26847 + }, + { + "epoch": 0.81, + "learning_rate": 4.6423562193979976e-07, + "loss": 1.0406, + "step": 26848 + }, + { + "epoch": 0.81, + "learning_rate": 4.6409405161199713e-07, + "loss": 1.0656, + "step": 26849 + }, + { + "epoch": 0.81, + "learning_rate": 4.639525006650386e-07, + "loss": 1.1301, + "step": 26850 + }, + { + "epoch": 0.81, + "learning_rate": 4.6381096910027154e-07, + "loss": 1.1573, + "step": 26851 + }, + { + "epoch": 0.81, + "learning_rate": 4.636694569190442e-07, + "loss": 1.0746, + "step": 26852 + }, + { + "epoch": 0.81, + "learning_rate": 4.6352796412270225e-07, + "loss": 1.1177, + "step": 26853 + }, + { + "epoch": 0.81, + "learning_rate": 4.6338649071259346e-07, + "loss": 1.1565, + "step": 26854 + }, + { + "epoch": 0.81, + "learning_rate": 4.6324503669006426e-07, + "loss": 0.9729, + "step": 26855 + }, + { + "epoch": 0.81, + "learning_rate": 4.6310360205646136e-07, + "loss": 1.04, + "step": 26856 + }, + { + "epoch": 0.81, + "learning_rate": 4.6296218681313093e-07, + "loss": 1.0792, + "step": 26857 + }, + { + "epoch": 0.81, + "learning_rate": 4.6282079096141963e-07, + "loss": 1.0981, + "step": 26858 + }, + { + "epoch": 0.81, + "learning_rate": 4.6267941450267335e-07, + "loss": 1.105, + "step": 26859 + }, + { + "epoch": 0.81, + "learning_rate": 4.625380574382379e-07, + "loss": 1.0643, + "step": 26860 + }, + { + "epoch": 0.81, + "learning_rate": 4.6239671976945926e-07, + "loss": 1.2139, + "step": 26861 + }, + { + "epoch": 0.81, + "learning_rate": 4.622554014976821e-07, + "loss": 1.0301, + "step": 26862 + }, + { + "epoch": 0.81, + "learning_rate": 4.6211410262425175e-07, + "loss": 1.1536, + "step": 26863 + }, + { + "epoch": 0.81, + "learning_rate": 4.619728231505141e-07, + "loss": 1.1456, + "step": 26864 + }, + { + "epoch": 0.81, + "learning_rate": 4.618315630778139e-07, + "loss": 0.9985, + "step": 26865 + }, + { + "epoch": 0.81, + "learning_rate": 4.6169032240749506e-07, + "loss": 1.0538, + "step": 26866 + }, + { + "epoch": 0.81, + "learning_rate": 4.615491011409029e-07, + "loss": 1.2155, + "step": 26867 + }, + { + "epoch": 0.81, + "learning_rate": 4.614078992793813e-07, + "loss": 1.1308, + "step": 26868 + }, + { + "epoch": 0.81, + "learning_rate": 4.6126671682427545e-07, + "loss": 1.1678, + "step": 26869 + }, + { + "epoch": 0.81, + "learning_rate": 4.611255537769277e-07, + "loss": 1.1752, + "step": 26870 + }, + { + "epoch": 0.81, + "learning_rate": 4.609844101386829e-07, + "loss": 1.0362, + "step": 26871 + }, + { + "epoch": 0.81, + "learning_rate": 4.6084328591088467e-07, + "loss": 1.0161, + "step": 26872 + }, + { + "epoch": 0.81, + "learning_rate": 4.6070218109487586e-07, + "loss": 1.1476, + "step": 26873 + }, + { + "epoch": 0.81, + "learning_rate": 4.605610956920012e-07, + "loss": 1.0309, + "step": 26874 + }, + { + "epoch": 0.81, + "learning_rate": 4.6042002970360183e-07, + "loss": 1.2559, + "step": 26875 + }, + { + "epoch": 0.81, + "learning_rate": 4.6027898313102144e-07, + "loss": 1.1044, + "step": 26876 + }, + { + "epoch": 0.81, + "learning_rate": 4.601379559756028e-07, + "loss": 0.9716, + "step": 26877 + }, + { + "epoch": 0.81, + "learning_rate": 4.59996948238689e-07, + "loss": 1.0435, + "step": 26878 + }, + { + "epoch": 0.81, + "learning_rate": 4.5985595992162123e-07, + "loss": 1.0705, + "step": 26879 + }, + { + "epoch": 0.81, + "learning_rate": 4.59714991025742e-07, + "loss": 1.2331, + "step": 26880 + }, + { + "epoch": 0.81, + "learning_rate": 4.595740415523936e-07, + "loss": 1.2541, + "step": 26881 + }, + { + "epoch": 0.81, + "learning_rate": 4.5943311150291744e-07, + "loss": 1.0819, + "step": 26882 + }, + { + "epoch": 0.81, + "learning_rate": 4.5929220087865546e-07, + "loss": 1.0897, + "step": 26883 + }, + { + "epoch": 0.81, + "learning_rate": 4.5915130968094854e-07, + "loss": 1.0803, + "step": 26884 + }, + { + "epoch": 0.81, + "learning_rate": 4.590104379111393e-07, + "loss": 1.0375, + "step": 26885 + }, + { + "epoch": 0.81, + "learning_rate": 4.5886958557056685e-07, + "loss": 1.0094, + "step": 26886 + }, + { + "epoch": 0.81, + "learning_rate": 4.58728752660573e-07, + "loss": 1.252, + "step": 26887 + }, + { + "epoch": 0.81, + "learning_rate": 4.5858793918249825e-07, + "loss": 1.129, + "step": 26888 + }, + { + "epoch": 0.81, + "learning_rate": 4.584471451376832e-07, + "loss": 1.1033, + "step": 26889 + }, + { + "epoch": 0.81, + "learning_rate": 4.583063705274679e-07, + "loss": 1.1409, + "step": 26890 + }, + { + "epoch": 0.81, + "learning_rate": 4.5816561535319353e-07, + "loss": 1.0768, + "step": 26891 + }, + { + "epoch": 0.81, + "learning_rate": 4.5802487961619845e-07, + "loss": 1.0822, + "step": 26892 + }, + { + "epoch": 0.81, + "learning_rate": 4.57884163317823e-07, + "loss": 1.0539, + "step": 26893 + }, + { + "epoch": 0.81, + "learning_rate": 4.577434664594069e-07, + "loss": 0.9732, + "step": 26894 + }, + { + "epoch": 0.81, + "learning_rate": 4.576027890422899e-07, + "loss": 1.0386, + "step": 26895 + }, + { + "epoch": 0.81, + "learning_rate": 4.5746213106781014e-07, + "loss": 1.1501, + "step": 26896 + }, + { + "epoch": 0.81, + "learning_rate": 4.5732149253730707e-07, + "loss": 1.0229, + "step": 26897 + }, + { + "epoch": 0.81, + "learning_rate": 4.571808734521196e-07, + "loss": 1.1439, + "step": 26898 + }, + { + "epoch": 0.81, + "learning_rate": 4.5704027381358653e-07, + "loss": 1.1054, + "step": 26899 + }, + { + "epoch": 0.81, + "learning_rate": 4.568996936230466e-07, + "loss": 1.1147, + "step": 26900 + }, + { + "epoch": 0.81, + "learning_rate": 4.5675913288183716e-07, + "loss": 1.0793, + "step": 26901 + }, + { + "epoch": 0.81, + "learning_rate": 4.5661859159129654e-07, + "loss": 1.1259, + "step": 26902 + }, + { + "epoch": 0.81, + "learning_rate": 4.5647806975276295e-07, + "loss": 1.0418, + "step": 26903 + }, + { + "epoch": 0.81, + "learning_rate": 4.563375673675743e-07, + "loss": 1.0876, + "step": 26904 + }, + { + "epoch": 0.81, + "learning_rate": 4.5619708443706723e-07, + "loss": 1.0693, + "step": 26905 + }, + { + "epoch": 0.81, + "learning_rate": 4.5605662096257967e-07, + "loss": 1.1941, + "step": 26906 + }, + { + "epoch": 0.81, + "learning_rate": 4.559161769454487e-07, + "loss": 0.9527, + "step": 26907 + }, + { + "epoch": 0.81, + "learning_rate": 4.557757523870118e-07, + "loss": 1.0644, + "step": 26908 + }, + { + "epoch": 0.81, + "learning_rate": 4.5563534728860464e-07, + "loss": 1.0621, + "step": 26909 + }, + { + "epoch": 0.81, + "learning_rate": 4.5549496165156443e-07, + "loss": 1.0721, + "step": 26910 + }, + { + "epoch": 0.81, + "learning_rate": 4.553545954772273e-07, + "loss": 1.1893, + "step": 26911 + }, + { + "epoch": 0.81, + "learning_rate": 4.5521424876693006e-07, + "loss": 1.1827, + "step": 26912 + }, + { + "epoch": 0.81, + "learning_rate": 4.550739215220082e-07, + "loss": 1.1478, + "step": 26913 + }, + { + "epoch": 0.81, + "learning_rate": 4.549336137437976e-07, + "loss": 1.102, + "step": 26914 + }, + { + "epoch": 0.81, + "learning_rate": 4.5479332543363397e-07, + "loss": 1.1525, + "step": 26915 + }, + { + "epoch": 0.81, + "learning_rate": 4.5465305659285306e-07, + "loss": 1.1483, + "step": 26916 + }, + { + "epoch": 0.81, + "learning_rate": 4.5451280722279055e-07, + "loss": 1.1174, + "step": 26917 + }, + { + "epoch": 0.81, + "learning_rate": 4.5437257732478064e-07, + "loss": 1.0838, + "step": 26918 + }, + { + "epoch": 0.81, + "learning_rate": 4.5423236690015834e-07, + "loss": 1.1396, + "step": 26919 + }, + { + "epoch": 0.81, + "learning_rate": 4.540921759502584e-07, + "loss": 1.1346, + "step": 26920 + }, + { + "epoch": 0.81, + "learning_rate": 4.5395200447641646e-07, + "loss": 1.0469, + "step": 26921 + }, + { + "epoch": 0.81, + "learning_rate": 4.538118524799656e-07, + "loss": 1.0513, + "step": 26922 + }, + { + "epoch": 0.81, + "learning_rate": 4.5367171996224007e-07, + "loss": 1.1741, + "step": 26923 + }, + { + "epoch": 0.81, + "learning_rate": 4.5353160692457433e-07, + "loss": 1.2139, + "step": 26924 + }, + { + "epoch": 0.81, + "learning_rate": 4.533915133683023e-07, + "loss": 1.0376, + "step": 26925 + }, + { + "epoch": 0.81, + "learning_rate": 4.532514392947576e-07, + "loss": 1.084, + "step": 26926 + }, + { + "epoch": 0.81, + "learning_rate": 4.5311138470527315e-07, + "loss": 1.0602, + "step": 26927 + }, + { + "epoch": 0.81, + "learning_rate": 4.5297134960118257e-07, + "loss": 1.1161, + "step": 26928 + }, + { + "epoch": 0.81, + "learning_rate": 4.5283133398381863e-07, + "loss": 0.9973, + "step": 26929 + }, + { + "epoch": 0.81, + "learning_rate": 4.5269133785451505e-07, + "loss": 1.1378, + "step": 26930 + }, + { + "epoch": 0.81, + "learning_rate": 4.5255136121460345e-07, + "loss": 1.1055, + "step": 26931 + }, + { + "epoch": 0.81, + "learning_rate": 4.524114040654168e-07, + "loss": 1.1993, + "step": 26932 + }, + { + "epoch": 0.81, + "learning_rate": 4.5227146640828723e-07, + "loss": 1.1249, + "step": 26933 + }, + { + "epoch": 0.81, + "learning_rate": 4.521315482445479e-07, + "loss": 1.0305, + "step": 26934 + }, + { + "epoch": 0.81, + "learning_rate": 4.5199164957552915e-07, + "loss": 1.1716, + "step": 26935 + }, + { + "epoch": 0.81, + "learning_rate": 4.5185177040256376e-07, + "loss": 1.0891, + "step": 26936 + }, + { + "epoch": 0.81, + "learning_rate": 4.51711910726983e-07, + "loss": 1.1487, + "step": 26937 + }, + { + "epoch": 0.81, + "learning_rate": 4.5157207055011836e-07, + "loss": 1.1089, + "step": 26938 + }, + { + "epoch": 0.81, + "learning_rate": 4.5143224987330094e-07, + "loss": 1.1023, + "step": 26939 + }, + { + "epoch": 0.81, + "learning_rate": 4.5129244869786203e-07, + "loss": 1.1308, + "step": 26940 + }, + { + "epoch": 0.81, + "learning_rate": 4.5115266702513205e-07, + "loss": 0.9907, + "step": 26941 + }, + { + "epoch": 0.81, + "learning_rate": 4.510129048564421e-07, + "loss": 1.1149, + "step": 26942 + }, + { + "epoch": 0.81, + "learning_rate": 4.508731621931234e-07, + "loss": 1.1107, + "step": 26943 + }, + { + "epoch": 0.81, + "learning_rate": 4.5073343903650426e-07, + "loss": 0.9819, + "step": 26944 + }, + { + "epoch": 0.81, + "learning_rate": 4.5059373538791585e-07, + "loss": 1.1106, + "step": 26945 + }, + { + "epoch": 0.81, + "learning_rate": 4.5045405124868823e-07, + "loss": 1.1476, + "step": 26946 + }, + { + "epoch": 0.81, + "learning_rate": 4.5031438662015146e-07, + "loss": 1.1009, + "step": 26947 + }, + { + "epoch": 0.81, + "learning_rate": 4.5017474150363394e-07, + "loss": 1.1396, + "step": 26948 + }, + { + "epoch": 0.81, + "learning_rate": 4.500351159004657e-07, + "loss": 1.1128, + "step": 26949 + }, + { + "epoch": 0.81, + "learning_rate": 4.498955098119759e-07, + "loss": 1.1456, + "step": 26950 + }, + { + "epoch": 0.81, + "learning_rate": 4.4975592323949354e-07, + "loss": 1.041, + "step": 26951 + }, + { + "epoch": 0.81, + "learning_rate": 4.496163561843478e-07, + "loss": 1.0252, + "step": 26952 + }, + { + "epoch": 0.81, + "learning_rate": 4.4947680864786627e-07, + "loss": 0.9406, + "step": 26953 + }, + { + "epoch": 0.81, + "learning_rate": 4.493372806313781e-07, + "loss": 1.1495, + "step": 26954 + }, + { + "epoch": 0.81, + "learning_rate": 4.491977721362112e-07, + "loss": 1.0377, + "step": 26955 + }, + { + "epoch": 0.81, + "learning_rate": 4.4905828316369445e-07, + "loss": 1.0936, + "step": 26956 + }, + { + "epoch": 0.81, + "learning_rate": 4.4891881371515453e-07, + "loss": 1.0861, + "step": 26957 + }, + { + "epoch": 0.81, + "learning_rate": 4.487793637919197e-07, + "loss": 1.1281, + "step": 26958 + }, + { + "epoch": 0.81, + "learning_rate": 4.486399333953173e-07, + "loss": 1.2089, + "step": 26959 + }, + { + "epoch": 0.81, + "learning_rate": 4.4850052252667557e-07, + "loss": 1.1499, + "step": 26960 + }, + { + "epoch": 0.81, + "learning_rate": 4.483611311873201e-07, + "loss": 1.1607, + "step": 26961 + }, + { + "epoch": 0.81, + "learning_rate": 4.482217593785784e-07, + "loss": 1.0571, + "step": 26962 + }, + { + "epoch": 0.81, + "learning_rate": 4.480824071017778e-07, + "loss": 1.1245, + "step": 26963 + }, + { + "epoch": 0.81, + "learning_rate": 4.479430743582441e-07, + "loss": 1.1641, + "step": 26964 + }, + { + "epoch": 0.81, + "learning_rate": 4.478037611493041e-07, + "loss": 0.9814, + "step": 26965 + }, + { + "epoch": 0.81, + "learning_rate": 4.4766446747628396e-07, + "loss": 1.1105, + "step": 26966 + }, + { + "epoch": 0.81, + "learning_rate": 4.475251933405095e-07, + "loss": 1.1024, + "step": 26967 + }, + { + "epoch": 0.81, + "learning_rate": 4.4738593874330743e-07, + "loss": 1.1589, + "step": 26968 + }, + { + "epoch": 0.81, + "learning_rate": 4.47246703686002e-07, + "loss": 1.1387, + "step": 26969 + }, + { + "epoch": 0.81, + "learning_rate": 4.4710748816991945e-07, + "loss": 1.0789, + "step": 26970 + }, + { + "epoch": 0.81, + "learning_rate": 4.4696829219638473e-07, + "loss": 1.0017, + "step": 26971 + }, + { + "epoch": 0.81, + "learning_rate": 4.4682911576672316e-07, + "loss": 1.0539, + "step": 26972 + }, + { + "epoch": 0.81, + "learning_rate": 4.466899588822604e-07, + "loss": 1.0059, + "step": 26973 + }, + { + "epoch": 0.81, + "learning_rate": 4.465508215443193e-07, + "loss": 1.1957, + "step": 26974 + }, + { + "epoch": 0.81, + "learning_rate": 4.4641170375422563e-07, + "loss": 1.1277, + "step": 26975 + }, + { + "epoch": 0.81, + "learning_rate": 4.4627260551330346e-07, + "loss": 1.1609, + "step": 26976 + }, + { + "epoch": 0.81, + "learning_rate": 4.4613352682287696e-07, + "loss": 1.0602, + "step": 26977 + }, + { + "epoch": 0.81, + "learning_rate": 4.459944676842709e-07, + "loss": 1.101, + "step": 26978 + }, + { + "epoch": 0.81, + "learning_rate": 4.4585542809880754e-07, + "loss": 1.1329, + "step": 26979 + }, + { + "epoch": 0.81, + "learning_rate": 4.457164080678111e-07, + "loss": 1.2139, + "step": 26980 + }, + { + "epoch": 0.81, + "learning_rate": 4.45577407592605e-07, + "loss": 1.1497, + "step": 26981 + }, + { + "epoch": 0.81, + "learning_rate": 4.4543842667451346e-07, + "loss": 1.1351, + "step": 26982 + }, + { + "epoch": 0.81, + "learning_rate": 4.452994653148579e-07, + "loss": 1.0786, + "step": 26983 + }, + { + "epoch": 0.81, + "learning_rate": 4.451605235149617e-07, + "loss": 1.0556, + "step": 26984 + }, + { + "epoch": 0.81, + "learning_rate": 4.450216012761477e-07, + "loss": 1.0057, + "step": 26985 + }, + { + "epoch": 0.81, + "learning_rate": 4.4488269859973897e-07, + "loss": 1.1713, + "step": 26986 + }, + { + "epoch": 0.81, + "learning_rate": 4.4474381548705646e-07, + "loss": 1.0757, + "step": 26987 + }, + { + "epoch": 0.81, + "learning_rate": 4.446049519394233e-07, + "loss": 1.0864, + "step": 26988 + }, + { + "epoch": 0.81, + "learning_rate": 4.4446610795816083e-07, + "loss": 1.1102, + "step": 26989 + }, + { + "epoch": 0.81, + "learning_rate": 4.443272835445911e-07, + "loss": 1.0675, + "step": 26990 + }, + { + "epoch": 0.81, + "learning_rate": 4.4418847870003614e-07, + "loss": 1.1464, + "step": 26991 + }, + { + "epoch": 0.81, + "learning_rate": 4.4404969342581623e-07, + "loss": 1.0543, + "step": 26992 + }, + { + "epoch": 0.81, + "learning_rate": 4.4391092772325283e-07, + "loss": 1.0486, + "step": 26993 + }, + { + "epoch": 0.81, + "learning_rate": 4.437721815936674e-07, + "loss": 1.0999, + "step": 26994 + }, + { + "epoch": 0.81, + "learning_rate": 4.436334550383803e-07, + "loss": 1.0648, + "step": 26995 + }, + { + "epoch": 0.81, + "learning_rate": 4.4349474805871265e-07, + "loss": 1.0408, + "step": 26996 + }, + { + "epoch": 0.81, + "learning_rate": 4.433560606559842e-07, + "loss": 0.9823, + "step": 26997 + }, + { + "epoch": 0.81, + "learning_rate": 4.432173928315156e-07, + "loss": 1.1385, + "step": 26998 + }, + { + "epoch": 0.81, + "learning_rate": 4.4307874458662777e-07, + "loss": 1.269, + "step": 26999 + }, + { + "epoch": 0.81, + "learning_rate": 4.4294011592263875e-07, + "loss": 1.1118, + "step": 27000 + }, + { + "epoch": 0.81, + "learning_rate": 4.428015068408692e-07, + "loss": 1.1505, + "step": 27001 + }, + { + "epoch": 0.81, + "learning_rate": 4.4266291734263834e-07, + "loss": 1.0375, + "step": 27002 + }, + { + "epoch": 0.81, + "learning_rate": 4.4252434742926594e-07, + "loss": 1.1792, + "step": 27003 + }, + { + "epoch": 0.81, + "learning_rate": 4.423857971020712e-07, + "loss": 1.2328, + "step": 27004 + }, + { + "epoch": 0.81, + "learning_rate": 4.4224726636237225e-07, + "loss": 1.1528, + "step": 27005 + }, + { + "epoch": 0.81, + "learning_rate": 4.4210875521148805e-07, + "loss": 1.0798, + "step": 27006 + }, + { + "epoch": 0.81, + "learning_rate": 4.4197026365073754e-07, + "loss": 1.1119, + "step": 27007 + }, + { + "epoch": 0.81, + "learning_rate": 4.418317916814396e-07, + "loss": 1.0832, + "step": 27008 + }, + { + "epoch": 0.81, + "learning_rate": 4.416933393049111e-07, + "loss": 1.1408, + "step": 27009 + }, + { + "epoch": 0.81, + "learning_rate": 4.415549065224709e-07, + "loss": 1.2321, + "step": 27010 + }, + { + "epoch": 0.81, + "learning_rate": 4.414164933354362e-07, + "loss": 1.2134, + "step": 27011 + }, + { + "epoch": 0.81, + "learning_rate": 4.41278099745126e-07, + "loss": 1.1138, + "step": 27012 + }, + { + "epoch": 0.81, + "learning_rate": 4.41139725752856e-07, + "loss": 1.1254, + "step": 27013 + }, + { + "epoch": 0.81, + "learning_rate": 4.4100137135994426e-07, + "loss": 1.1276, + "step": 27014 + }, + { + "epoch": 0.81, + "learning_rate": 4.4086303656770773e-07, + "loss": 1.1044, + "step": 27015 + }, + { + "epoch": 0.81, + "learning_rate": 4.4072472137746347e-07, + "loss": 1.1011, + "step": 27016 + }, + { + "epoch": 0.81, + "learning_rate": 4.4058642579052876e-07, + "loss": 1.1229, + "step": 27017 + }, + { + "epoch": 0.81, + "learning_rate": 4.404481498082186e-07, + "loss": 1.1173, + "step": 27018 + }, + { + "epoch": 0.81, + "learning_rate": 4.403098934318503e-07, + "loss": 1.1015, + "step": 27019 + }, + { + "epoch": 0.81, + "learning_rate": 4.4017165666273984e-07, + "loss": 1.0784, + "step": 27020 + }, + { + "epoch": 0.81, + "learning_rate": 4.400334395022032e-07, + "loss": 1.071, + "step": 27021 + }, + { + "epoch": 0.81, + "learning_rate": 4.398952419515559e-07, + "loss": 1.008, + "step": 27022 + }, + { + "epoch": 0.81, + "learning_rate": 4.3975706401211406e-07, + "loss": 1.1263, + "step": 27023 + }, + { + "epoch": 0.81, + "learning_rate": 4.396189056851924e-07, + "loss": 1.1864, + "step": 27024 + }, + { + "epoch": 0.81, + "learning_rate": 4.3948076697210714e-07, + "loss": 1.1687, + "step": 27025 + }, + { + "epoch": 0.81, + "learning_rate": 4.393426478741722e-07, + "loss": 1.1165, + "step": 27026 + }, + { + "epoch": 0.81, + "learning_rate": 4.3920454839270236e-07, + "loss": 1.1138, + "step": 27027 + }, + { + "epoch": 0.81, + "learning_rate": 4.39066468529013e-07, + "loss": 1.0297, + "step": 27028 + }, + { + "epoch": 0.81, + "learning_rate": 4.3892840828441833e-07, + "loss": 1.0535, + "step": 27029 + }, + { + "epoch": 0.81, + "learning_rate": 4.3879036766023315e-07, + "loss": 1.0936, + "step": 27030 + }, + { + "epoch": 0.81, + "learning_rate": 4.386523466577702e-07, + "loss": 1.1849, + "step": 27031 + }, + { + "epoch": 0.81, + "learning_rate": 4.3851434527834414e-07, + "loss": 1.1535, + "step": 27032 + }, + { + "epoch": 0.81, + "learning_rate": 4.3837636352326877e-07, + "loss": 1.1644, + "step": 27033 + }, + { + "epoch": 0.81, + "learning_rate": 4.3823840139385815e-07, + "loss": 1.0534, + "step": 27034 + }, + { + "epoch": 0.81, + "learning_rate": 4.381004588914245e-07, + "loss": 1.1121, + "step": 27035 + }, + { + "epoch": 0.81, + "learning_rate": 4.3796253601728125e-07, + "loss": 1.2239, + "step": 27036 + }, + { + "epoch": 0.81, + "learning_rate": 4.3782463277274144e-07, + "loss": 1.1803, + "step": 27037 + }, + { + "epoch": 0.81, + "learning_rate": 4.376867491591186e-07, + "loss": 1.0832, + "step": 27038 + }, + { + "epoch": 0.81, + "learning_rate": 4.3754888517772406e-07, + "loss": 1.0711, + "step": 27039 + }, + { + "epoch": 0.81, + "learning_rate": 4.3741104082987096e-07, + "loss": 1.0601, + "step": 27040 + }, + { + "epoch": 0.81, + "learning_rate": 4.3727321611687135e-07, + "loss": 1.115, + "step": 27041 + }, + { + "epoch": 0.81, + "learning_rate": 4.3713541104003775e-07, + "loss": 1.058, + "step": 27042 + }, + { + "epoch": 0.81, + "learning_rate": 4.369976256006811e-07, + "loss": 1.1208, + "step": 27043 + }, + { + "epoch": 0.81, + "learning_rate": 4.368598598001134e-07, + "loss": 1.0795, + "step": 27044 + }, + { + "epoch": 0.81, + "learning_rate": 4.36722113639646e-07, + "loss": 1.196, + "step": 27045 + }, + { + "epoch": 0.81, + "learning_rate": 4.365843871205905e-07, + "loss": 1.0977, + "step": 27046 + }, + { + "epoch": 0.81, + "learning_rate": 4.3644668024425793e-07, + "loss": 1.0753, + "step": 27047 + }, + { + "epoch": 0.81, + "learning_rate": 4.3630899301195907e-07, + "loss": 1.0671, + "step": 27048 + }, + { + "epoch": 0.81, + "learning_rate": 4.3617132542500467e-07, + "loss": 1.1186, + "step": 27049 + }, + { + "epoch": 0.81, + "learning_rate": 4.36033677484706e-07, + "loss": 1.0723, + "step": 27050 + }, + { + "epoch": 0.81, + "learning_rate": 4.358960491923719e-07, + "loss": 1.0941, + "step": 27051 + }, + { + "epoch": 0.81, + "learning_rate": 4.3575844054931345e-07, + "loss": 1.0944, + "step": 27052 + }, + { + "epoch": 0.81, + "learning_rate": 4.356208515568405e-07, + "loss": 1.1443, + "step": 27053 + }, + { + "epoch": 0.82, + "learning_rate": 4.3548328221626273e-07, + "loss": 1.0264, + "step": 27054 + }, + { + "epoch": 0.82, + "learning_rate": 4.353457325288904e-07, + "loss": 1.189, + "step": 27055 + }, + { + "epoch": 0.82, + "learning_rate": 4.3520820249603163e-07, + "loss": 1.1103, + "step": 27056 + }, + { + "epoch": 0.82, + "learning_rate": 4.350706921189965e-07, + "loss": 1.0487, + "step": 27057 + }, + { + "epoch": 0.82, + "learning_rate": 4.3493320139909393e-07, + "loss": 1.0269, + "step": 27058 + }, + { + "epoch": 0.82, + "learning_rate": 4.347957303376324e-07, + "loss": 1.204, + "step": 27059 + }, + { + "epoch": 0.82, + "learning_rate": 4.346582789359219e-07, + "loss": 1.0586, + "step": 27060 + }, + { + "epoch": 0.82, + "learning_rate": 4.345208471952689e-07, + "loss": 1.188, + "step": 27061 + }, + { + "epoch": 0.82, + "learning_rate": 4.343834351169829e-07, + "loss": 1.1209, + "step": 27062 + }, + { + "epoch": 0.82, + "learning_rate": 4.3424604270237174e-07, + "loss": 1.0604, + "step": 27063 + }, + { + "epoch": 0.82, + "learning_rate": 4.341086699527439e-07, + "loss": 1.0864, + "step": 27064 + }, + { + "epoch": 0.82, + "learning_rate": 4.3397131686940597e-07, + "loss": 1.1166, + "step": 27065 + }, + { + "epoch": 0.82, + "learning_rate": 4.338339834536659e-07, + "loss": 0.9448, + "step": 27066 + }, + { + "epoch": 0.82, + "learning_rate": 4.336966697068315e-07, + "loss": 1.0906, + "step": 27067 + }, + { + "epoch": 0.82, + "learning_rate": 4.3355937563021007e-07, + "loss": 1.119, + "step": 27068 + }, + { + "epoch": 0.82, + "learning_rate": 4.3342210122510745e-07, + "loss": 1.1813, + "step": 27069 + }, + { + "epoch": 0.82, + "learning_rate": 4.332848464928313e-07, + "loss": 1.0589, + "step": 27070 + }, + { + "epoch": 0.82, + "learning_rate": 4.3314761143468804e-07, + "loss": 1.1098, + "step": 27071 + }, + { + "epoch": 0.82, + "learning_rate": 4.330103960519841e-07, + "loss": 1.1064, + "step": 27072 + }, + { + "epoch": 0.82, + "learning_rate": 4.328732003460262e-07, + "loss": 1.1564, + "step": 27073 + }, + { + "epoch": 0.82, + "learning_rate": 4.3273602431811945e-07, + "loss": 0.9699, + "step": 27074 + }, + { + "epoch": 0.82, + "learning_rate": 4.3259886796957e-07, + "loss": 0.9443, + "step": 27075 + }, + { + "epoch": 0.82, + "learning_rate": 4.324617313016835e-07, + "loss": 1.0331, + "step": 27076 + }, + { + "epoch": 0.82, + "learning_rate": 4.323246143157656e-07, + "loss": 1.0004, + "step": 27077 + }, + { + "epoch": 0.82, + "learning_rate": 4.3218751701312176e-07, + "loss": 1.1273, + "step": 27078 + }, + { + "epoch": 0.82, + "learning_rate": 4.320504393950567e-07, + "loss": 1.1094, + "step": 27079 + }, + { + "epoch": 0.82, + "learning_rate": 4.319133814628754e-07, + "loss": 1.1915, + "step": 27080 + }, + { + "epoch": 0.82, + "learning_rate": 4.3177634321788344e-07, + "loss": 1.1069, + "step": 27081 + }, + { + "epoch": 0.82, + "learning_rate": 4.31639324661384e-07, + "loss": 1.0731, + "step": 27082 + }, + { + "epoch": 0.82, + "learning_rate": 4.315023257946821e-07, + "loss": 1.0909, + "step": 27083 + }, + { + "epoch": 0.82, + "learning_rate": 4.3136534661908175e-07, + "loss": 1.0859, + "step": 27084 + }, + { + "epoch": 0.82, + "learning_rate": 4.312283871358869e-07, + "loss": 1.0506, + "step": 27085 + }, + { + "epoch": 0.82, + "learning_rate": 4.310914473464023e-07, + "loss": 1.0809, + "step": 27086 + }, + { + "epoch": 0.82, + "learning_rate": 4.3095452725193e-07, + "loss": 1.0547, + "step": 27087 + }, + { + "epoch": 0.82, + "learning_rate": 4.308176268537739e-07, + "loss": 1.1318, + "step": 27088 + }, + { + "epoch": 0.82, + "learning_rate": 4.306807461532375e-07, + "loss": 1.1456, + "step": 27089 + }, + { + "epoch": 0.82, + "learning_rate": 4.305438851516247e-07, + "loss": 0.9782, + "step": 27090 + }, + { + "epoch": 0.82, + "learning_rate": 4.3040704385023666e-07, + "loss": 0.9838, + "step": 27091 + }, + { + "epoch": 0.82, + "learning_rate": 4.3027022225037655e-07, + "loss": 1.1391, + "step": 27092 + }, + { + "epoch": 0.82, + "learning_rate": 4.301334203533475e-07, + "loss": 1.1516, + "step": 27093 + }, + { + "epoch": 0.82, + "learning_rate": 4.2999663816045175e-07, + "loss": 1.158, + "step": 27094 + }, + { + "epoch": 0.82, + "learning_rate": 4.298598756729905e-07, + "loss": 1.0255, + "step": 27095 + }, + { + "epoch": 0.82, + "learning_rate": 4.297231328922663e-07, + "loss": 1.0664, + "step": 27096 + }, + { + "epoch": 0.82, + "learning_rate": 4.295864098195807e-07, + "loss": 1.0786, + "step": 27097 + }, + { + "epoch": 0.82, + "learning_rate": 4.2944970645623557e-07, + "loss": 0.9858, + "step": 27098 + }, + { + "epoch": 0.82, + "learning_rate": 4.293130228035322e-07, + "loss": 1.1181, + "step": 27099 + }, + { + "epoch": 0.82, + "learning_rate": 4.2917635886277146e-07, + "loss": 1.2001, + "step": 27100 + }, + { + "epoch": 0.82, + "learning_rate": 4.29039714635254e-07, + "loss": 1.0974, + "step": 27101 + }, + { + "epoch": 0.82, + "learning_rate": 4.2890309012228124e-07, + "loss": 1.0214, + "step": 27102 + }, + { + "epoch": 0.82, + "learning_rate": 4.2876648532515356e-07, + "loss": 1.0841, + "step": 27103 + }, + { + "epoch": 0.82, + "learning_rate": 4.2862990024517157e-07, + "loss": 1.0984, + "step": 27104 + }, + { + "epoch": 0.82, + "learning_rate": 4.284933348836351e-07, + "loss": 1.0012, + "step": 27105 + }, + { + "epoch": 0.82, + "learning_rate": 4.2835678924184443e-07, + "loss": 1.1397, + "step": 27106 + }, + { + "epoch": 0.82, + "learning_rate": 4.2822026332110024e-07, + "loss": 1.019, + "step": 27107 + }, + { + "epoch": 0.82, + "learning_rate": 4.2808375712270064e-07, + "loss": 1.1047, + "step": 27108 + }, + { + "epoch": 0.82, + "learning_rate": 4.2794727064794565e-07, + "loss": 1.0671, + "step": 27109 + }, + { + "epoch": 0.82, + "learning_rate": 4.278108038981346e-07, + "loss": 1.0622, + "step": 27110 + }, + { + "epoch": 0.82, + "learning_rate": 4.27674356874567e-07, + "loss": 1.1036, + "step": 27111 + }, + { + "epoch": 0.82, + "learning_rate": 4.27537929578542e-07, + "loss": 1.228, + "step": 27112 + }, + { + "epoch": 0.82, + "learning_rate": 4.27401522011357e-07, + "loss": 1.1338, + "step": 27113 + }, + { + "epoch": 0.82, + "learning_rate": 4.272651341743114e-07, + "loss": 1.1777, + "step": 27114 + }, + { + "epoch": 0.82, + "learning_rate": 4.2712876606870344e-07, + "loss": 1.1267, + "step": 27115 + }, + { + "epoch": 0.82, + "learning_rate": 4.2699241769583203e-07, + "loss": 0.9857, + "step": 27116 + }, + { + "epoch": 0.82, + "learning_rate": 4.2685608905699367e-07, + "loss": 1.1601, + "step": 27117 + }, + { + "epoch": 0.82, + "learning_rate": 4.2671978015348697e-07, + "loss": 1.1301, + "step": 27118 + }, + { + "epoch": 0.82, + "learning_rate": 4.2658349098660927e-07, + "loss": 1.1014, + "step": 27119 + }, + { + "epoch": 0.82, + "learning_rate": 4.26447221557659e-07, + "loss": 1.1682, + "step": 27120 + }, + { + "epoch": 0.82, + "learning_rate": 4.263109718679317e-07, + "loss": 1.0314, + "step": 27121 + }, + { + "epoch": 0.82, + "learning_rate": 4.261747419187254e-07, + "loss": 1.122, + "step": 27122 + }, + { + "epoch": 0.82, + "learning_rate": 4.260385317113366e-07, + "loss": 1.1727, + "step": 27123 + }, + { + "epoch": 0.82, + "learning_rate": 4.2590234124706224e-07, + "loss": 1.0546, + "step": 27124 + }, + { + "epoch": 0.82, + "learning_rate": 4.2576617052719925e-07, + "loss": 1.0007, + "step": 27125 + }, + { + "epoch": 0.82, + "learning_rate": 4.2563001955304274e-07, + "loss": 1.0249, + "step": 27126 + }, + { + "epoch": 0.82, + "learning_rate": 4.254938883258894e-07, + "loss": 1.1091, + "step": 27127 + }, + { + "epoch": 0.82, + "learning_rate": 4.2535777684703514e-07, + "loss": 1.0764, + "step": 27128 + }, + { + "epoch": 0.82, + "learning_rate": 4.2522168511777566e-07, + "loss": 1.1454, + "step": 27129 + }, + { + "epoch": 0.82, + "learning_rate": 4.250856131394063e-07, + "loss": 1.2022, + "step": 27130 + }, + { + "epoch": 0.82, + "learning_rate": 4.2494956091322285e-07, + "loss": 1.1426, + "step": 27131 + }, + { + "epoch": 0.82, + "learning_rate": 4.248135284405208e-07, + "loss": 1.1206, + "step": 27132 + }, + { + "epoch": 0.82, + "learning_rate": 4.246775157225938e-07, + "loss": 1.1181, + "step": 27133 + }, + { + "epoch": 0.82, + "learning_rate": 4.2454152276073716e-07, + "loss": 1.0668, + "step": 27134 + }, + { + "epoch": 0.82, + "learning_rate": 4.2440554955624603e-07, + "loss": 1.003, + "step": 27135 + }, + { + "epoch": 0.82, + "learning_rate": 4.24269596110414e-07, + "loss": 1.1906, + "step": 27136 + }, + { + "epoch": 0.82, + "learning_rate": 4.2413366242453595e-07, + "loss": 1.1066, + "step": 27137 + }, + { + "epoch": 0.82, + "learning_rate": 4.2399774849990637e-07, + "loss": 1.0156, + "step": 27138 + }, + { + "epoch": 0.82, + "learning_rate": 4.238618543378176e-07, + "loss": 1.126, + "step": 27139 + }, + { + "epoch": 0.82, + "learning_rate": 4.2372597993956433e-07, + "loss": 1.1505, + "step": 27140 + }, + { + "epoch": 0.82, + "learning_rate": 4.235901253064395e-07, + "loss": 0.9897, + "step": 27141 + }, + { + "epoch": 0.82, + "learning_rate": 4.2345429043973736e-07, + "loss": 1.0466, + "step": 27142 + }, + { + "epoch": 0.82, + "learning_rate": 4.233184753407496e-07, + "loss": 1.1919, + "step": 27143 + }, + { + "epoch": 0.82, + "learning_rate": 4.2318268001076996e-07, + "loss": 1.1886, + "step": 27144 + }, + { + "epoch": 0.82, + "learning_rate": 4.230469044510907e-07, + "loss": 1.1035, + "step": 27145 + }, + { + "epoch": 0.82, + "learning_rate": 4.229111486630055e-07, + "loss": 1.1196, + "step": 27146 + }, + { + "epoch": 0.82, + "learning_rate": 4.227754126478051e-07, + "loss": 0.9929, + "step": 27147 + }, + { + "epoch": 0.82, + "learning_rate": 4.226396964067822e-07, + "loss": 0.9839, + "step": 27148 + }, + { + "epoch": 0.82, + "learning_rate": 4.225039999412289e-07, + "loss": 1.111, + "step": 27149 + }, + { + "epoch": 0.82, + "learning_rate": 4.2236832325243725e-07, + "loss": 1.0511, + "step": 27150 + }, + { + "epoch": 0.82, + "learning_rate": 4.2223266634169894e-07, + "loss": 1.1196, + "step": 27151 + }, + { + "epoch": 0.82, + "learning_rate": 4.220970292103044e-07, + "loss": 1.0779, + "step": 27152 + }, + { + "epoch": 0.82, + "learning_rate": 4.2196141185954525e-07, + "loss": 1.0248, + "step": 27153 + }, + { + "epoch": 0.82, + "learning_rate": 4.218258142907128e-07, + "loss": 1.1003, + "step": 27154 + }, + { + "epoch": 0.82, + "learning_rate": 4.216902365050984e-07, + "loss": 1.1252, + "step": 27155 + }, + { + "epoch": 0.82, + "learning_rate": 4.2155467850399116e-07, + "loss": 1.1118, + "step": 27156 + }, + { + "epoch": 0.82, + "learning_rate": 4.2141914028868246e-07, + "loss": 1.0788, + "step": 27157 + }, + { + "epoch": 0.82, + "learning_rate": 4.212836218604627e-07, + "loss": 1.2299, + "step": 27158 + }, + { + "epoch": 0.82, + "learning_rate": 4.2114812322062133e-07, + "loss": 1.1241, + "step": 27159 + }, + { + "epoch": 0.82, + "learning_rate": 4.21012644370449e-07, + "loss": 1.1095, + "step": 27160 + }, + { + "epoch": 0.82, + "learning_rate": 4.208771853112348e-07, + "loss": 1.1295, + "step": 27161 + }, + { + "epoch": 0.82, + "learning_rate": 4.2074174604426835e-07, + "loss": 1.2723, + "step": 27162 + }, + { + "epoch": 0.82, + "learning_rate": 4.2060632657083934e-07, + "loss": 1.0617, + "step": 27163 + }, + { + "epoch": 0.82, + "learning_rate": 4.204709268922369e-07, + "loss": 0.973, + "step": 27164 + }, + { + "epoch": 0.82, + "learning_rate": 4.2033554700974947e-07, + "loss": 1.116, + "step": 27165 + }, + { + "epoch": 0.82, + "learning_rate": 4.202001869246658e-07, + "loss": 1.1108, + "step": 27166 + }, + { + "epoch": 0.82, + "learning_rate": 4.200648466382748e-07, + "loss": 1.1685, + "step": 27167 + }, + { + "epoch": 0.82, + "learning_rate": 4.199295261518652e-07, + "loss": 1.0364, + "step": 27168 + }, + { + "epoch": 0.82, + "learning_rate": 4.197942254667242e-07, + "loss": 1.0461, + "step": 27169 + }, + { + "epoch": 0.82, + "learning_rate": 4.1965894458414036e-07, + "loss": 1.1354, + "step": 27170 + }, + { + "epoch": 0.82, + "learning_rate": 4.1952368350540117e-07, + "loss": 0.9888, + "step": 27171 + }, + { + "epoch": 0.82, + "learning_rate": 4.1938844223179534e-07, + "loss": 1.1194, + "step": 27172 + }, + { + "epoch": 0.82, + "learning_rate": 4.192532207646091e-07, + "loss": 1.0716, + "step": 27173 + }, + { + "epoch": 0.82, + "learning_rate": 4.1911801910512973e-07, + "loss": 0.9416, + "step": 27174 + }, + { + "epoch": 0.82, + "learning_rate": 4.1898283725464476e-07, + "loss": 1.0424, + "step": 27175 + }, + { + "epoch": 0.82, + "learning_rate": 4.18847675214441e-07, + "loss": 1.0499, + "step": 27176 + }, + { + "epoch": 0.82, + "learning_rate": 4.1871253298580547e-07, + "loss": 1.0367, + "step": 27177 + }, + { + "epoch": 0.82, + "learning_rate": 4.185774105700238e-07, + "loss": 1.119, + "step": 27178 + }, + { + "epoch": 0.82, + "learning_rate": 4.1844230796838247e-07, + "loss": 1.1487, + "step": 27179 + }, + { + "epoch": 0.82, + "learning_rate": 4.183072251821682e-07, + "loss": 1.1607, + "step": 27180 + }, + { + "epoch": 0.82, + "learning_rate": 4.1817216221266694e-07, + "loss": 1.0422, + "step": 27181 + }, + { + "epoch": 0.82, + "learning_rate": 4.1803711906116375e-07, + "loss": 1.0858, + "step": 27182 + }, + { + "epoch": 0.82, + "learning_rate": 4.1790209572894425e-07, + "loss": 1.1036, + "step": 27183 + }, + { + "epoch": 0.82, + "learning_rate": 4.177670922172938e-07, + "loss": 1.002, + "step": 27184 + }, + { + "epoch": 0.82, + "learning_rate": 4.176321085274981e-07, + "loss": 1.0524, + "step": 27185 + }, + { + "epoch": 0.82, + "learning_rate": 4.1749714466084197e-07, + "loss": 1.0755, + "step": 27186 + }, + { + "epoch": 0.82, + "learning_rate": 4.173622006186098e-07, + "loss": 1.0737, + "step": 27187 + }, + { + "epoch": 0.82, + "learning_rate": 4.1722727640208654e-07, + "loss": 1.0276, + "step": 27188 + }, + { + "epoch": 0.82, + "learning_rate": 4.170923720125564e-07, + "loss": 1.0167, + "step": 27189 + }, + { + "epoch": 0.82, + "learning_rate": 4.169574874513044e-07, + "loss": 1.1257, + "step": 27190 + }, + { + "epoch": 0.82, + "learning_rate": 4.168226227196132e-07, + "loss": 1.0867, + "step": 27191 + }, + { + "epoch": 0.82, + "learning_rate": 4.166877778187675e-07, + "loss": 1.174, + "step": 27192 + }, + { + "epoch": 0.82, + "learning_rate": 4.165529527500506e-07, + "loss": 0.9932, + "step": 27193 + }, + { + "epoch": 0.82, + "learning_rate": 4.164181475147469e-07, + "loss": 1.1373, + "step": 27194 + }, + { + "epoch": 0.82, + "learning_rate": 4.162833621141385e-07, + "loss": 1.1265, + "step": 27195 + }, + { + "epoch": 0.82, + "learning_rate": 4.161485965495088e-07, + "loss": 1.0965, + "step": 27196 + }, + { + "epoch": 0.82, + "learning_rate": 4.1601385082214063e-07, + "loss": 1.1298, + "step": 27197 + }, + { + "epoch": 0.82, + "learning_rate": 4.1587912493331775e-07, + "loss": 1.1588, + "step": 27198 + }, + { + "epoch": 0.82, + "learning_rate": 4.1574441888432127e-07, + "loss": 1.1644, + "step": 27199 + }, + { + "epoch": 0.82, + "learning_rate": 4.156097326764338e-07, + "loss": 1.1696, + "step": 27200 + }, + { + "epoch": 0.82, + "learning_rate": 4.1547506631093834e-07, + "loss": 1.1514, + "step": 27201 + }, + { + "epoch": 0.82, + "learning_rate": 4.153404197891159e-07, + "loss": 1.1045, + "step": 27202 + }, + { + "epoch": 0.82, + "learning_rate": 4.152057931122494e-07, + "loss": 1.0527, + "step": 27203 + }, + { + "epoch": 0.82, + "learning_rate": 4.1507118628161896e-07, + "loss": 1.0818, + "step": 27204 + }, + { + "epoch": 0.82, + "learning_rate": 4.149365992985069e-07, + "loss": 1.1552, + "step": 27205 + }, + { + "epoch": 0.82, + "learning_rate": 4.1480203216419405e-07, + "loss": 1.1291, + "step": 27206 + }, + { + "epoch": 0.82, + "learning_rate": 4.146674848799623e-07, + "loss": 1.0309, + "step": 27207 + }, + { + "epoch": 0.82, + "learning_rate": 4.1453295744709107e-07, + "loss": 1.064, + "step": 27208 + }, + { + "epoch": 0.82, + "learning_rate": 4.1439844986686156e-07, + "loss": 1.0745, + "step": 27209 + }, + { + "epoch": 0.82, + "learning_rate": 4.1426396214055445e-07, + "loss": 1.1539, + "step": 27210 + }, + { + "epoch": 0.82, + "learning_rate": 4.1412949426945016e-07, + "loss": 1.2448, + "step": 27211 + }, + { + "epoch": 0.82, + "learning_rate": 4.139950462548281e-07, + "loss": 1.0363, + "step": 27212 + }, + { + "epoch": 0.82, + "learning_rate": 4.138606180979687e-07, + "loss": 1.1435, + "step": 27213 + }, + { + "epoch": 0.82, + "learning_rate": 4.137262098001521e-07, + "loss": 1.1573, + "step": 27214 + }, + { + "epoch": 0.82, + "learning_rate": 4.1359182136265665e-07, + "loss": 1.1705, + "step": 27215 + }, + { + "epoch": 0.82, + "learning_rate": 4.134574527867621e-07, + "loss": 1.013, + "step": 27216 + }, + { + "epoch": 0.82, + "learning_rate": 4.1332310407374786e-07, + "loss": 1.1932, + "step": 27217 + }, + { + "epoch": 0.82, + "learning_rate": 4.1318877522489255e-07, + "loss": 1.2822, + "step": 27218 + }, + { + "epoch": 0.82, + "learning_rate": 4.1305446624147513e-07, + "loss": 1.0361, + "step": 27219 + }, + { + "epoch": 0.82, + "learning_rate": 4.129201771247748e-07, + "loss": 1.1974, + "step": 27220 + }, + { + "epoch": 0.82, + "learning_rate": 4.127859078760685e-07, + "loss": 1.1211, + "step": 27221 + }, + { + "epoch": 0.82, + "learning_rate": 4.12651658496635e-07, + "loss": 1.1622, + "step": 27222 + }, + { + "epoch": 0.82, + "learning_rate": 4.125174289877526e-07, + "loss": 1.1458, + "step": 27223 + }, + { + "epoch": 0.82, + "learning_rate": 4.1238321935069935e-07, + "loss": 1.1435, + "step": 27224 + }, + { + "epoch": 0.82, + "learning_rate": 4.1224902958675177e-07, + "loss": 1.1462, + "step": 27225 + }, + { + "epoch": 0.82, + "learning_rate": 4.12114859697188e-07, + "loss": 1.1698, + "step": 27226 + }, + { + "epoch": 0.82, + "learning_rate": 4.119807096832854e-07, + "loss": 1.0814, + "step": 27227 + }, + { + "epoch": 0.82, + "learning_rate": 4.118465795463211e-07, + "loss": 1.042, + "step": 27228 + }, + { + "epoch": 0.82, + "learning_rate": 4.1171246928757153e-07, + "loss": 1.142, + "step": 27229 + }, + { + "epoch": 0.82, + "learning_rate": 4.1157837890831306e-07, + "loss": 1.299, + "step": 27230 + }, + { + "epoch": 0.82, + "learning_rate": 4.114443084098227e-07, + "loss": 1.1469, + "step": 27231 + }, + { + "epoch": 0.82, + "learning_rate": 4.1131025779337667e-07, + "loss": 1.0613, + "step": 27232 + }, + { + "epoch": 0.82, + "learning_rate": 4.1117622706025176e-07, + "loss": 1.1192, + "step": 27233 + }, + { + "epoch": 0.82, + "learning_rate": 4.110422162117225e-07, + "loss": 1.0684, + "step": 27234 + }, + { + "epoch": 0.82, + "learning_rate": 4.109082252490651e-07, + "loss": 1.0757, + "step": 27235 + }, + { + "epoch": 0.82, + "learning_rate": 4.1077425417355545e-07, + "loss": 1.0445, + "step": 27236 + }, + { + "epoch": 0.82, + "learning_rate": 4.106403029864692e-07, + "loss": 1.1371, + "step": 27237 + }, + { + "epoch": 0.82, + "learning_rate": 4.105063716890806e-07, + "loss": 1.1046, + "step": 27238 + }, + { + "epoch": 0.82, + "learning_rate": 4.1037246028266476e-07, + "loss": 1.1334, + "step": 27239 + }, + { + "epoch": 0.82, + "learning_rate": 4.102385687684968e-07, + "loss": 1.0466, + "step": 27240 + }, + { + "epoch": 0.82, + "learning_rate": 4.101046971478512e-07, + "loss": 1.1721, + "step": 27241 + }, + { + "epoch": 0.82, + "learning_rate": 4.099708454220022e-07, + "loss": 1.1763, + "step": 27242 + }, + { + "epoch": 0.82, + "learning_rate": 4.0983701359222414e-07, + "loss": 1.1102, + "step": 27243 + }, + { + "epoch": 0.82, + "learning_rate": 4.0970320165979127e-07, + "loss": 1.1658, + "step": 27244 + }, + { + "epoch": 0.82, + "learning_rate": 4.0956940962597726e-07, + "loss": 1.0859, + "step": 27245 + }, + { + "epoch": 0.82, + "learning_rate": 4.0943563749205604e-07, + "loss": 1.029, + "step": 27246 + }, + { + "epoch": 0.82, + "learning_rate": 4.093018852593003e-07, + "loss": 1.2042, + "step": 27247 + }, + { + "epoch": 0.82, + "learning_rate": 4.091681529289837e-07, + "loss": 1.1036, + "step": 27248 + }, + { + "epoch": 0.82, + "learning_rate": 4.090344405023791e-07, + "loss": 1.1203, + "step": 27249 + }, + { + "epoch": 0.82, + "learning_rate": 4.0890074798076026e-07, + "loss": 1.2432, + "step": 27250 + }, + { + "epoch": 0.82, + "learning_rate": 4.087670753653986e-07, + "loss": 1.1016, + "step": 27251 + }, + { + "epoch": 0.82, + "learning_rate": 4.0863342265756724e-07, + "loss": 0.9697, + "step": 27252 + }, + { + "epoch": 0.82, + "learning_rate": 4.0849978985853853e-07, + "loss": 1.0797, + "step": 27253 + }, + { + "epoch": 0.82, + "learning_rate": 4.0836617696958516e-07, + "loss": 1.0789, + "step": 27254 + }, + { + "epoch": 0.82, + "learning_rate": 4.0823258399197764e-07, + "loss": 1.0188, + "step": 27255 + }, + { + "epoch": 0.82, + "learning_rate": 4.0809901092698864e-07, + "loss": 1.0656, + "step": 27256 + }, + { + "epoch": 0.82, + "learning_rate": 4.0796545777588933e-07, + "loss": 1.115, + "step": 27257 + }, + { + "epoch": 0.82, + "learning_rate": 4.078319245399515e-07, + "loss": 1.1968, + "step": 27258 + }, + { + "epoch": 0.82, + "learning_rate": 4.0769841122044656e-07, + "loss": 1.048, + "step": 27259 + }, + { + "epoch": 0.82, + "learning_rate": 4.075649178186447e-07, + "loss": 1.0458, + "step": 27260 + }, + { + "epoch": 0.82, + "learning_rate": 4.0743144433581684e-07, + "loss": 1.0073, + "step": 27261 + }, + { + "epoch": 0.82, + "learning_rate": 4.0729799077323384e-07, + "loss": 1.1761, + "step": 27262 + }, + { + "epoch": 0.82, + "learning_rate": 4.0716455713216696e-07, + "loss": 1.0452, + "step": 27263 + }, + { + "epoch": 0.82, + "learning_rate": 4.0703114341388463e-07, + "loss": 1.2622, + "step": 27264 + }, + { + "epoch": 0.82, + "learning_rate": 4.06897749619658e-07, + "loss": 1.0404, + "step": 27265 + }, + { + "epoch": 0.82, + "learning_rate": 4.0676437575075665e-07, + "loss": 1.0165, + "step": 27266 + }, + { + "epoch": 0.82, + "learning_rate": 4.066310218084504e-07, + "loss": 1.1597, + "step": 27267 + }, + { + "epoch": 0.82, + "learning_rate": 4.0649768779400855e-07, + "loss": 1.2313, + "step": 27268 + }, + { + "epoch": 0.82, + "learning_rate": 4.063643737087003e-07, + "loss": 1.051, + "step": 27269 + }, + { + "epoch": 0.82, + "learning_rate": 4.062310795537952e-07, + "loss": 1.0306, + "step": 27270 + }, + { + "epoch": 0.82, + "learning_rate": 4.0609780533056143e-07, + "loss": 1.1198, + "step": 27271 + }, + { + "epoch": 0.82, + "learning_rate": 4.0596455104026907e-07, + "loss": 1.1571, + "step": 27272 + }, + { + "epoch": 0.82, + "learning_rate": 4.0583131668418487e-07, + "loss": 1.1229, + "step": 27273 + }, + { + "epoch": 0.82, + "learning_rate": 4.056981022635778e-07, + "loss": 1.1238, + "step": 27274 + }, + { + "epoch": 0.82, + "learning_rate": 4.055649077797164e-07, + "loss": 1.0045, + "step": 27275 + }, + { + "epoch": 0.82, + "learning_rate": 4.054317332338689e-07, + "loss": 1.0676, + "step": 27276 + }, + { + "epoch": 0.82, + "learning_rate": 4.05298578627302e-07, + "loss": 1.1368, + "step": 27277 + }, + { + "epoch": 0.82, + "learning_rate": 4.051654439612837e-07, + "loss": 1.1428, + "step": 27278 + }, + { + "epoch": 0.82, + "learning_rate": 4.050323292370814e-07, + "loss": 1.0925, + "step": 27279 + }, + { + "epoch": 0.82, + "learning_rate": 4.04899234455963e-07, + "loss": 1.2127, + "step": 27280 + }, + { + "epoch": 0.82, + "learning_rate": 4.047661596191943e-07, + "loss": 1.1545, + "step": 27281 + }, + { + "epoch": 0.82, + "learning_rate": 4.0463310472804274e-07, + "loss": 1.0645, + "step": 27282 + }, + { + "epoch": 0.82, + "learning_rate": 4.0450006978377477e-07, + "loss": 1.1379, + "step": 27283 + }, + { + "epoch": 0.82, + "learning_rate": 4.0436705478765686e-07, + "loss": 1.0991, + "step": 27284 + }, + { + "epoch": 0.82, + "learning_rate": 4.042340597409558e-07, + "loss": 1.0224, + "step": 27285 + }, + { + "epoch": 0.82, + "learning_rate": 4.041010846449367e-07, + "loss": 1.1141, + "step": 27286 + }, + { + "epoch": 0.82, + "learning_rate": 4.03968129500866e-07, + "loss": 0.9696, + "step": 27287 + }, + { + "epoch": 0.82, + "learning_rate": 4.0383519431000885e-07, + "loss": 1.0662, + "step": 27288 + }, + { + "epoch": 0.82, + "learning_rate": 4.0370227907363194e-07, + "loss": 1.019, + "step": 27289 + }, + { + "epoch": 0.82, + "learning_rate": 4.0356938379299907e-07, + "loss": 1.0726, + "step": 27290 + }, + { + "epoch": 0.82, + "learning_rate": 4.0343650846937616e-07, + "loss": 1.1193, + "step": 27291 + }, + { + "epoch": 0.82, + "learning_rate": 4.033036531040277e-07, + "loss": 1.2072, + "step": 27292 + }, + { + "epoch": 0.82, + "learning_rate": 4.031708176982188e-07, + "loss": 1.2008, + "step": 27293 + }, + { + "epoch": 0.82, + "learning_rate": 4.0303800225321377e-07, + "loss": 1.0909, + "step": 27294 + }, + { + "epoch": 0.82, + "learning_rate": 4.029052067702771e-07, + "loss": 1.0766, + "step": 27295 + }, + { + "epoch": 0.82, + "learning_rate": 4.0277243125067255e-07, + "loss": 1.0428, + "step": 27296 + }, + { + "epoch": 0.82, + "learning_rate": 4.0263967569566546e-07, + "loss": 1.0815, + "step": 27297 + }, + { + "epoch": 0.82, + "learning_rate": 4.0250694010651766e-07, + "loss": 1.0214, + "step": 27298 + }, + { + "epoch": 0.82, + "learning_rate": 4.023742244844936e-07, + "loss": 1.1971, + "step": 27299 + }, + { + "epoch": 0.82, + "learning_rate": 4.0224152883085675e-07, + "loss": 1.1899, + "step": 27300 + }, + { + "epoch": 0.82, + "learning_rate": 4.0210885314687034e-07, + "loss": 1.073, + "step": 27301 + }, + { + "epoch": 0.82, + "learning_rate": 4.019761974337977e-07, + "loss": 1.0847, + "step": 27302 + }, + { + "epoch": 0.82, + "learning_rate": 4.0184356169290064e-07, + "loss": 1.103, + "step": 27303 + }, + { + "epoch": 0.82, + "learning_rate": 4.017109459254426e-07, + "loss": 1.1384, + "step": 27304 + }, + { + "epoch": 0.82, + "learning_rate": 4.0157835013268556e-07, + "loss": 0.9412, + "step": 27305 + }, + { + "epoch": 0.82, + "learning_rate": 4.0144577431589253e-07, + "loss": 1.0892, + "step": 27306 + }, + { + "epoch": 0.82, + "learning_rate": 4.0131321847632465e-07, + "loss": 1.1617, + "step": 27307 + }, + { + "epoch": 0.82, + "learning_rate": 4.0118068261524395e-07, + "loss": 1.0657, + "step": 27308 + }, + { + "epoch": 0.82, + "learning_rate": 4.010481667339125e-07, + "loss": 1.072, + "step": 27309 + }, + { + "epoch": 0.82, + "learning_rate": 4.009156708335915e-07, + "loss": 1.0613, + "step": 27310 + }, + { + "epoch": 0.82, + "learning_rate": 4.00783194915543e-07, + "loss": 1.1091, + "step": 27311 + }, + { + "epoch": 0.82, + "learning_rate": 4.0065073898102684e-07, + "loss": 1.121, + "step": 27312 + }, + { + "epoch": 0.82, + "learning_rate": 4.005183030313045e-07, + "loss": 1.0141, + "step": 27313 + }, + { + "epoch": 0.82, + "learning_rate": 4.003858870676369e-07, + "loss": 1.1611, + "step": 27314 + }, + { + "epoch": 0.82, + "learning_rate": 4.00253491091285e-07, + "loss": 1.1146, + "step": 27315 + }, + { + "epoch": 0.82, + "learning_rate": 4.0012111510350783e-07, + "loss": 1.0588, + "step": 27316 + }, + { + "epoch": 0.82, + "learning_rate": 3.999887591055665e-07, + "loss": 1.1449, + "step": 27317 + }, + { + "epoch": 0.82, + "learning_rate": 3.998564230987209e-07, + "loss": 1.1291, + "step": 27318 + }, + { + "epoch": 0.82, + "learning_rate": 3.9972410708423113e-07, + "loss": 1.2653, + "step": 27319 + }, + { + "epoch": 0.82, + "learning_rate": 3.9959181106335563e-07, + "loss": 1.0017, + "step": 27320 + }, + { + "epoch": 0.82, + "learning_rate": 3.9945953503735454e-07, + "loss": 1.0864, + "step": 27321 + }, + { + "epoch": 0.82, + "learning_rate": 3.993272790074873e-07, + "loss": 1.0697, + "step": 27322 + }, + { + "epoch": 0.82, + "learning_rate": 3.991950429750124e-07, + "loss": 0.999, + "step": 27323 + }, + { + "epoch": 0.82, + "learning_rate": 3.9906282694118893e-07, + "loss": 1.1578, + "step": 27324 + }, + { + "epoch": 0.82, + "learning_rate": 3.9893063090727546e-07, + "loss": 1.091, + "step": 27325 + }, + { + "epoch": 0.82, + "learning_rate": 3.987984548745305e-07, + "loss": 1.0379, + "step": 27326 + }, + { + "epoch": 0.82, + "learning_rate": 3.986662988442122e-07, + "loss": 1.0959, + "step": 27327 + }, + { + "epoch": 0.82, + "learning_rate": 3.9853416281757957e-07, + "loss": 0.989, + "step": 27328 + }, + { + "epoch": 0.82, + "learning_rate": 3.984020467958888e-07, + "loss": 1.0709, + "step": 27329 + }, + { + "epoch": 0.82, + "learning_rate": 3.982699507803983e-07, + "loss": 1.256, + "step": 27330 + }, + { + "epoch": 0.82, + "learning_rate": 3.981378747723658e-07, + "loss": 1.0571, + "step": 27331 + }, + { + "epoch": 0.82, + "learning_rate": 3.98005818773049e-07, + "loss": 0.9492, + "step": 27332 + }, + { + "epoch": 0.82, + "learning_rate": 3.9787378278370396e-07, + "loss": 1.0472, + "step": 27333 + }, + { + "epoch": 0.82, + "learning_rate": 3.97741766805588e-07, + "loss": 1.0968, + "step": 27334 + }, + { + "epoch": 0.82, + "learning_rate": 3.976097708399579e-07, + "loss": 1.0493, + "step": 27335 + }, + { + "epoch": 0.82, + "learning_rate": 3.974777948880701e-07, + "loss": 1.2698, + "step": 27336 + }, + { + "epoch": 0.82, + "learning_rate": 3.9734583895118193e-07, + "loss": 1.2038, + "step": 27337 + }, + { + "epoch": 0.82, + "learning_rate": 3.97213903030548e-07, + "loss": 1.0269, + "step": 27338 + }, + { + "epoch": 0.82, + "learning_rate": 3.9708198712742506e-07, + "loss": 1.0926, + "step": 27339 + }, + { + "epoch": 0.82, + "learning_rate": 3.969500912430688e-07, + "loss": 1.1036, + "step": 27340 + }, + { + "epoch": 0.82, + "learning_rate": 3.9681821537873534e-07, + "loss": 0.9789, + "step": 27341 + }, + { + "epoch": 0.82, + "learning_rate": 3.9668635953567874e-07, + "loss": 1.1027, + "step": 27342 + }, + { + "epoch": 0.82, + "learning_rate": 3.9655452371515525e-07, + "loss": 1.0975, + "step": 27343 + }, + { + "epoch": 0.82, + "learning_rate": 3.9642270791841964e-07, + "loss": 1.1046, + "step": 27344 + }, + { + "epoch": 0.82, + "learning_rate": 3.962909121467273e-07, + "loss": 0.9952, + "step": 27345 + }, + { + "epoch": 0.82, + "learning_rate": 3.9615913640133174e-07, + "loss": 1.0372, + "step": 27346 + }, + { + "epoch": 0.82, + "learning_rate": 3.960273806834877e-07, + "loss": 1.1703, + "step": 27347 + }, + { + "epoch": 0.82, + "learning_rate": 3.958956449944501e-07, + "loss": 1.1908, + "step": 27348 + }, + { + "epoch": 0.82, + "learning_rate": 3.957639293354723e-07, + "loss": 1.0561, + "step": 27349 + }, + { + "epoch": 0.82, + "learning_rate": 3.9563223370780863e-07, + "loss": 1.0046, + "step": 27350 + }, + { + "epoch": 0.82, + "learning_rate": 3.955005581127125e-07, + "loss": 1.0824, + "step": 27351 + }, + { + "epoch": 0.82, + "learning_rate": 3.9536890255143736e-07, + "loss": 1.1229, + "step": 27352 + }, + { + "epoch": 0.82, + "learning_rate": 3.952372670252369e-07, + "loss": 0.9752, + "step": 27353 + }, + { + "epoch": 0.82, + "learning_rate": 3.9510565153536436e-07, + "loss": 1.0977, + "step": 27354 + }, + { + "epoch": 0.82, + "learning_rate": 3.949740560830717e-07, + "loss": 1.0938, + "step": 27355 + }, + { + "epoch": 0.82, + "learning_rate": 3.948424806696124e-07, + "loss": 1.0573, + "step": 27356 + }, + { + "epoch": 0.82, + "learning_rate": 3.947109252962386e-07, + "loss": 1.1699, + "step": 27357 + }, + { + "epoch": 0.82, + "learning_rate": 3.9457938996420337e-07, + "loss": 1.1321, + "step": 27358 + }, + { + "epoch": 0.82, + "learning_rate": 3.9444787467475794e-07, + "loss": 1.1254, + "step": 27359 + }, + { + "epoch": 0.82, + "learning_rate": 3.9431637942915464e-07, + "loss": 0.9703, + "step": 27360 + }, + { + "epoch": 0.82, + "learning_rate": 3.9418490422864527e-07, + "loss": 1.0964, + "step": 27361 + }, + { + "epoch": 0.82, + "learning_rate": 3.9405344907448154e-07, + "loss": 1.1815, + "step": 27362 + }, + { + "epoch": 0.82, + "learning_rate": 3.9392201396791505e-07, + "loss": 1.132, + "step": 27363 + }, + { + "epoch": 0.82, + "learning_rate": 3.937905989101962e-07, + "loss": 1.1163, + "step": 27364 + }, + { + "epoch": 0.82, + "learning_rate": 3.936592039025766e-07, + "loss": 0.9436, + "step": 27365 + }, + { + "epoch": 0.82, + "learning_rate": 3.935278289463068e-07, + "loss": 1.0494, + "step": 27366 + }, + { + "epoch": 0.82, + "learning_rate": 3.93396474042638e-07, + "loss": 1.1963, + "step": 27367 + }, + { + "epoch": 0.82, + "learning_rate": 3.9326513919281966e-07, + "loss": 1.1931, + "step": 27368 + }, + { + "epoch": 0.82, + "learning_rate": 3.931338243981028e-07, + "loss": 1.1001, + "step": 27369 + }, + { + "epoch": 0.82, + "learning_rate": 3.93002529659737e-07, + "loss": 1.1544, + "step": 27370 + }, + { + "epoch": 0.82, + "learning_rate": 3.9287125497897314e-07, + "loss": 1.0791, + "step": 27371 + }, + { + "epoch": 0.82, + "learning_rate": 3.927400003570592e-07, + "loss": 1.053, + "step": 27372 + }, + { + "epoch": 0.82, + "learning_rate": 3.92608765795246e-07, + "loss": 1.0807, + "step": 27373 + }, + { + "epoch": 0.82, + "learning_rate": 3.9247755129478207e-07, + "loss": 1.1683, + "step": 27374 + }, + { + "epoch": 0.82, + "learning_rate": 3.9234635685691693e-07, + "loss": 1.0304, + "step": 27375 + }, + { + "epoch": 0.82, + "learning_rate": 3.922151824828993e-07, + "loss": 0.9793, + "step": 27376 + }, + { + "epoch": 0.82, + "learning_rate": 3.92084028173978e-07, + "loss": 1.109, + "step": 27377 + }, + { + "epoch": 0.82, + "learning_rate": 3.919528939314016e-07, + "loss": 1.0374, + "step": 27378 + }, + { + "epoch": 0.82, + "learning_rate": 3.918217797564192e-07, + "loss": 1.1514, + "step": 27379 + }, + { + "epoch": 0.82, + "learning_rate": 3.9169068565027723e-07, + "loss": 1.1039, + "step": 27380 + }, + { + "epoch": 0.82, + "learning_rate": 3.915596116142245e-07, + "loss": 1.057, + "step": 27381 + }, + { + "epoch": 0.82, + "learning_rate": 3.914285576495089e-07, + "loss": 1.1159, + "step": 27382 + }, + { + "epoch": 0.82, + "learning_rate": 3.9129752375737793e-07, + "loss": 1.1324, + "step": 27383 + }, + { + "epoch": 0.82, + "learning_rate": 3.911665099390796e-07, + "loss": 1.0893, + "step": 27384 + }, + { + "epoch": 0.82, + "learning_rate": 3.910355161958598e-07, + "loss": 1.0991, + "step": 27385 + }, + { + "epoch": 0.83, + "learning_rate": 3.909045425289662e-07, + "loss": 1.1379, + "step": 27386 + }, + { + "epoch": 0.83, + "learning_rate": 3.907735889396455e-07, + "loss": 1.0778, + "step": 27387 + }, + { + "epoch": 0.83, + "learning_rate": 3.9064265542914454e-07, + "loss": 1.1401, + "step": 27388 + }, + { + "epoch": 0.83, + "learning_rate": 3.9051174199871006e-07, + "loss": 1.0768, + "step": 27389 + }, + { + "epoch": 0.83, + "learning_rate": 3.903808486495872e-07, + "loss": 0.9953, + "step": 27390 + }, + { + "epoch": 0.83, + "learning_rate": 3.9024997538302275e-07, + "loss": 1.1602, + "step": 27391 + }, + { + "epoch": 0.83, + "learning_rate": 3.901191222002623e-07, + "loss": 1.1457, + "step": 27392 + }, + { + "epoch": 0.83, + "learning_rate": 3.899882891025525e-07, + "loss": 1.069, + "step": 27393 + }, + { + "epoch": 0.83, + "learning_rate": 3.898574760911372e-07, + "loss": 1.0951, + "step": 27394 + }, + { + "epoch": 0.83, + "learning_rate": 3.8972668316726245e-07, + "loss": 1.0914, + "step": 27395 + }, + { + "epoch": 0.83, + "learning_rate": 3.895959103321734e-07, + "loss": 1.0143, + "step": 27396 + }, + { + "epoch": 0.83, + "learning_rate": 3.894651575871153e-07, + "loss": 1.1062, + "step": 27397 + }, + { + "epoch": 0.83, + "learning_rate": 3.8933442493333196e-07, + "loss": 1.1695, + "step": 27398 + }, + { + "epoch": 0.83, + "learning_rate": 3.892037123720685e-07, + "loss": 1.1725, + "step": 27399 + }, + { + "epoch": 0.83, + "learning_rate": 3.890730199045689e-07, + "loss": 1.0029, + "step": 27400 + }, + { + "epoch": 0.83, + "learning_rate": 3.8894234753207807e-07, + "loss": 1.0616, + "step": 27401 + }, + { + "epoch": 0.83, + "learning_rate": 3.8881169525583906e-07, + "loss": 1.1318, + "step": 27402 + }, + { + "epoch": 0.83, + "learning_rate": 3.8868106307709567e-07, + "loss": 1.071, + "step": 27403 + }, + { + "epoch": 0.83, + "learning_rate": 3.885504509970917e-07, + "loss": 1.1041, + "step": 27404 + }, + { + "epoch": 0.83, + "learning_rate": 3.884198590170707e-07, + "loss": 1.0677, + "step": 27405 + }, + { + "epoch": 0.83, + "learning_rate": 3.8828928713827543e-07, + "loss": 1.2255, + "step": 27406 + }, + { + "epoch": 0.83, + "learning_rate": 3.8815873536194927e-07, + "loss": 1.0226, + "step": 27407 + }, + { + "epoch": 0.83, + "learning_rate": 3.8802820368933485e-07, + "loss": 1.1488, + "step": 27408 + }, + { + "epoch": 0.83, + "learning_rate": 3.878976921216748e-07, + "loss": 1.0491, + "step": 27409 + }, + { + "epoch": 0.83, + "learning_rate": 3.8776720066021204e-07, + "loss": 1.1945, + "step": 27410 + }, + { + "epoch": 0.83, + "learning_rate": 3.876367293061878e-07, + "loss": 1.0848, + "step": 27411 + }, + { + "epoch": 0.83, + "learning_rate": 3.8750627806084434e-07, + "loss": 1.1913, + "step": 27412 + }, + { + "epoch": 0.83, + "learning_rate": 3.8737584692542377e-07, + "loss": 1.1313, + "step": 27413 + }, + { + "epoch": 0.83, + "learning_rate": 3.872454359011682e-07, + "loss": 1.0964, + "step": 27414 + }, + { + "epoch": 0.83, + "learning_rate": 3.87115044989318e-07, + "loss": 1.0021, + "step": 27415 + }, + { + "epoch": 0.83, + "learning_rate": 3.8698467419111515e-07, + "loss": 1.0329, + "step": 27416 + }, + { + "epoch": 0.83, + "learning_rate": 3.868543235078004e-07, + "loss": 1.1376, + "step": 27417 + }, + { + "epoch": 0.83, + "learning_rate": 3.8672399294061467e-07, + "loss": 1.1931, + "step": 27418 + }, + { + "epoch": 0.83, + "learning_rate": 3.8659368249079925e-07, + "loss": 0.9695, + "step": 27419 + }, + { + "epoch": 0.83, + "learning_rate": 3.8646339215959366e-07, + "loss": 1.0198, + "step": 27420 + }, + { + "epoch": 0.83, + "learning_rate": 3.8633312194823886e-07, + "loss": 1.0307, + "step": 27421 + }, + { + "epoch": 0.83, + "learning_rate": 3.862028718579744e-07, + "loss": 1.0692, + "step": 27422 + }, + { + "epoch": 0.83, + "learning_rate": 3.8607264189004154e-07, + "loss": 1.0655, + "step": 27423 + }, + { + "epoch": 0.83, + "learning_rate": 3.859424320456781e-07, + "loss": 1.0598, + "step": 27424 + }, + { + "epoch": 0.83, + "learning_rate": 3.858122423261246e-07, + "loss": 1.084, + "step": 27425 + }, + { + "epoch": 0.83, + "learning_rate": 3.856820727326205e-07, + "loss": 1.0926, + "step": 27426 + }, + { + "epoch": 0.83, + "learning_rate": 3.855519232664051e-07, + "loss": 1.1, + "step": 27427 + }, + { + "epoch": 0.83, + "learning_rate": 3.8542179392871663e-07, + "loss": 1.0935, + "step": 27428 + }, + { + "epoch": 0.83, + "learning_rate": 3.852916847207944e-07, + "loss": 1.1529, + "step": 27429 + }, + { + "epoch": 0.83, + "learning_rate": 3.851615956438767e-07, + "loss": 1.056, + "step": 27430 + }, + { + "epoch": 0.83, + "learning_rate": 3.850315266992019e-07, + "loss": 1.1932, + "step": 27431 + }, + { + "epoch": 0.83, + "learning_rate": 3.849014778880086e-07, + "loss": 1.069, + "step": 27432 + }, + { + "epoch": 0.83, + "learning_rate": 3.8477144921153455e-07, + "loss": 1.1639, + "step": 27433 + }, + { + "epoch": 0.83, + "learning_rate": 3.846414406710175e-07, + "loss": 0.9882, + "step": 27434 + }, + { + "epoch": 0.83, + "learning_rate": 3.8451145226769515e-07, + "loss": 1.0605, + "step": 27435 + }, + { + "epoch": 0.83, + "learning_rate": 3.843814840028054e-07, + "loss": 1.0812, + "step": 27436 + }, + { + "epoch": 0.83, + "learning_rate": 3.8425153587758445e-07, + "loss": 1.0087, + "step": 27437 + }, + { + "epoch": 0.83, + "learning_rate": 3.8412160789327023e-07, + "loss": 1.0624, + "step": 27438 + }, + { + "epoch": 0.83, + "learning_rate": 3.8399170005109897e-07, + "loss": 0.9762, + "step": 27439 + }, + { + "epoch": 0.83, + "learning_rate": 3.8386181235230827e-07, + "loss": 1.0531, + "step": 27440 + }, + { + "epoch": 0.83, + "learning_rate": 3.837319447981333e-07, + "loss": 0.9894, + "step": 27441 + }, + { + "epoch": 0.83, + "learning_rate": 3.836020973898111e-07, + "loss": 1.1172, + "step": 27442 + }, + { + "epoch": 0.83, + "learning_rate": 3.834722701285776e-07, + "loss": 1.0142, + "step": 27443 + }, + { + "epoch": 0.83, + "learning_rate": 3.8334246301566845e-07, + "loss": 1.0043, + "step": 27444 + }, + { + "epoch": 0.83, + "learning_rate": 3.8321267605232056e-07, + "loss": 1.0606, + "step": 27445 + }, + { + "epoch": 0.83, + "learning_rate": 3.830829092397678e-07, + "loss": 1.0513, + "step": 27446 + }, + { + "epoch": 0.83, + "learning_rate": 3.8295316257924624e-07, + "loss": 1.1812, + "step": 27447 + }, + { + "epoch": 0.83, + "learning_rate": 3.82823436071991e-07, + "loss": 1.1742, + "step": 27448 + }, + { + "epoch": 0.83, + "learning_rate": 3.826937297192376e-07, + "loss": 1.1572, + "step": 27449 + }, + { + "epoch": 0.83, + "learning_rate": 3.8256404352221943e-07, + "loss": 1.0312, + "step": 27450 + }, + { + "epoch": 0.83, + "learning_rate": 3.8243437748217204e-07, + "loss": 1.0516, + "step": 27451 + }, + { + "epoch": 0.83, + "learning_rate": 3.8230473160032924e-07, + "loss": 1.0876, + "step": 27452 + }, + { + "epoch": 0.83, + "learning_rate": 3.8217510587792607e-07, + "loss": 1.0442, + "step": 27453 + }, + { + "epoch": 0.83, + "learning_rate": 3.820455003161955e-07, + "loss": 1.121, + "step": 27454 + }, + { + "epoch": 0.83, + "learning_rate": 3.819159149163718e-07, + "loss": 1.1812, + "step": 27455 + }, + { + "epoch": 0.83, + "learning_rate": 3.8178634967968806e-07, + "loss": 1.2131, + "step": 27456 + }, + { + "epoch": 0.83, + "learning_rate": 3.8165680460737847e-07, + "loss": 1.1483, + "step": 27457 + }, + { + "epoch": 0.83, + "learning_rate": 3.815272797006758e-07, + "loss": 1.0958, + "step": 27458 + }, + { + "epoch": 0.83, + "learning_rate": 3.81397774960813e-07, + "loss": 1.0175, + "step": 27459 + }, + { + "epoch": 0.83, + "learning_rate": 3.812682903890233e-07, + "loss": 1.1742, + "step": 27460 + }, + { + "epoch": 0.83, + "learning_rate": 3.811388259865395e-07, + "loss": 1.1319, + "step": 27461 + }, + { + "epoch": 0.83, + "learning_rate": 3.810093817545929e-07, + "loss": 1.1051, + "step": 27462 + }, + { + "epoch": 0.83, + "learning_rate": 3.808799576944167e-07, + "loss": 0.9418, + "step": 27463 + }, + { + "epoch": 0.83, + "learning_rate": 3.807505538072426e-07, + "loss": 1.1407, + "step": 27464 + }, + { + "epoch": 0.83, + "learning_rate": 3.8062117009430244e-07, + "loss": 1.1158, + "step": 27465 + }, + { + "epoch": 0.83, + "learning_rate": 3.804918065568286e-07, + "loss": 1.1055, + "step": 27466 + }, + { + "epoch": 0.83, + "learning_rate": 3.803624631960515e-07, + "loss": 1.0046, + "step": 27467 + }, + { + "epoch": 0.83, + "learning_rate": 3.8023314001320283e-07, + "loss": 1.0786, + "step": 27468 + }, + { + "epoch": 0.83, + "learning_rate": 3.8010383700951363e-07, + "loss": 0.9332, + "step": 27469 + }, + { + "epoch": 0.83, + "learning_rate": 3.7997455418621515e-07, + "loss": 1.0818, + "step": 27470 + }, + { + "epoch": 0.83, + "learning_rate": 3.798452915445383e-07, + "loss": 0.9999, + "step": 27471 + }, + { + "epoch": 0.83, + "learning_rate": 3.7971604908571267e-07, + "loss": 1.1689, + "step": 27472 + }, + { + "epoch": 0.83, + "learning_rate": 3.7958682681096925e-07, + "loss": 1.0395, + "step": 27473 + }, + { + "epoch": 0.83, + "learning_rate": 3.7945762472153786e-07, + "loss": 1.1279, + "step": 27474 + }, + { + "epoch": 0.83, + "learning_rate": 3.7932844281864915e-07, + "loss": 1.0469, + "step": 27475 + }, + { + "epoch": 0.83, + "learning_rate": 3.7919928110353167e-07, + "loss": 1.1664, + "step": 27476 + }, + { + "epoch": 0.83, + "learning_rate": 3.7907013957741574e-07, + "loss": 1.1243, + "step": 27477 + }, + { + "epoch": 0.83, + "learning_rate": 3.789410182415304e-07, + "loss": 1.0619, + "step": 27478 + }, + { + "epoch": 0.83, + "learning_rate": 3.7881191709710577e-07, + "loss": 1.0303, + "step": 27479 + }, + { + "epoch": 0.83, + "learning_rate": 3.7868283614536956e-07, + "loss": 1.1453, + "step": 27480 + }, + { + "epoch": 0.83, + "learning_rate": 3.7855377538755124e-07, + "loss": 1.2092, + "step": 27481 + }, + { + "epoch": 0.83, + "learning_rate": 3.78424734824879e-07, + "loss": 1.03, + "step": 27482 + }, + { + "epoch": 0.83, + "learning_rate": 3.7829571445858137e-07, + "loss": 1.1383, + "step": 27483 + }, + { + "epoch": 0.83, + "learning_rate": 3.781667142898876e-07, + "loss": 1.087, + "step": 27484 + }, + { + "epoch": 0.83, + "learning_rate": 3.780377343200239e-07, + "loss": 1.1016, + "step": 27485 + }, + { + "epoch": 0.83, + "learning_rate": 3.779087745502194e-07, + "loss": 1.1528, + "step": 27486 + }, + { + "epoch": 0.83, + "learning_rate": 3.7777983498170104e-07, + "loss": 1.1555, + "step": 27487 + }, + { + "epoch": 0.83, + "learning_rate": 3.7765091561569653e-07, + "loss": 1.1382, + "step": 27488 + }, + { + "epoch": 0.83, + "learning_rate": 3.775220164534332e-07, + "loss": 1.1442, + "step": 27489 + }, + { + "epoch": 0.83, + "learning_rate": 3.7739313749613813e-07, + "loss": 1.0607, + "step": 27490 + }, + { + "epoch": 0.83, + "learning_rate": 3.7726427874503815e-07, + "loss": 1.0793, + "step": 27491 + }, + { + "epoch": 0.83, + "learning_rate": 3.7713544020136025e-07, + "loss": 1.0649, + "step": 27492 + }, + { + "epoch": 0.83, + "learning_rate": 3.7700662186633014e-07, + "loss": 1.129, + "step": 27493 + }, + { + "epoch": 0.83, + "learning_rate": 3.7687782374117465e-07, + "loss": 1.0748, + "step": 27494 + }, + { + "epoch": 0.83, + "learning_rate": 3.767490458271195e-07, + "loss": 1.2014, + "step": 27495 + }, + { + "epoch": 0.83, + "learning_rate": 3.766202881253908e-07, + "loss": 0.9747, + "step": 27496 + }, + { + "epoch": 0.83, + "learning_rate": 3.764915506372152e-07, + "loss": 1.0609, + "step": 27497 + }, + { + "epoch": 0.83, + "learning_rate": 3.763628333638164e-07, + "loss": 1.114, + "step": 27498 + }, + { + "epoch": 0.83, + "learning_rate": 3.7623413630642094e-07, + "loss": 1.0335, + "step": 27499 + }, + { + "epoch": 0.83, + "learning_rate": 3.761054594662533e-07, + "loss": 1.0054, + "step": 27500 + }, + { + "epoch": 0.83, + "learning_rate": 3.7597680284453987e-07, + "loss": 1.1264, + "step": 27501 + }, + { + "epoch": 0.83, + "learning_rate": 3.7584816644250344e-07, + "loss": 1.1147, + "step": 27502 + }, + { + "epoch": 0.83, + "learning_rate": 3.757195502613692e-07, + "loss": 0.9855, + "step": 27503 + }, + { + "epoch": 0.83, + "learning_rate": 3.7559095430236224e-07, + "loss": 1.1613, + "step": 27504 + }, + { + "epoch": 0.83, + "learning_rate": 3.754623785667064e-07, + "loss": 1.1788, + "step": 27505 + }, + { + "epoch": 0.83, + "learning_rate": 3.7533382305562525e-07, + "loss": 1.1071, + "step": 27506 + }, + { + "epoch": 0.83, + "learning_rate": 3.7520528777034273e-07, + "loss": 1.1696, + "step": 27507 + }, + { + "epoch": 0.83, + "learning_rate": 3.750767727120824e-07, + "loss": 1.111, + "step": 27508 + }, + { + "epoch": 0.83, + "learning_rate": 3.7494827788206787e-07, + "loss": 1.0086, + "step": 27509 + }, + { + "epoch": 0.83, + "learning_rate": 3.748198032815228e-07, + "loss": 1.1404, + "step": 27510 + }, + { + "epoch": 0.83, + "learning_rate": 3.7469134891166934e-07, + "loss": 1.1038, + "step": 27511 + }, + { + "epoch": 0.83, + "learning_rate": 3.7456291477373037e-07, + "loss": 1.2053, + "step": 27512 + }, + { + "epoch": 0.83, + "learning_rate": 3.7443450086892903e-07, + "loss": 1.028, + "step": 27513 + }, + { + "epoch": 0.83, + "learning_rate": 3.7430610719848744e-07, + "loss": 1.0024, + "step": 27514 + }, + { + "epoch": 0.83, + "learning_rate": 3.741777337636279e-07, + "loss": 1.0785, + "step": 27515 + }, + { + "epoch": 0.83, + "learning_rate": 3.7404938056557233e-07, + "loss": 1.0422, + "step": 27516 + }, + { + "epoch": 0.83, + "learning_rate": 3.73921047605543e-07, + "loss": 1.1804, + "step": 27517 + }, + { + "epoch": 0.83, + "learning_rate": 3.73792734884762e-07, + "loss": 1.0828, + "step": 27518 + }, + { + "epoch": 0.83, + "learning_rate": 3.7366444240444944e-07, + "loss": 1.1715, + "step": 27519 + }, + { + "epoch": 0.83, + "learning_rate": 3.7353617016582716e-07, + "loss": 1.0444, + "step": 27520 + }, + { + "epoch": 0.83, + "learning_rate": 3.734079181701167e-07, + "loss": 1.0839, + "step": 27521 + }, + { + "epoch": 0.83, + "learning_rate": 3.732796864185384e-07, + "loss": 1.078, + "step": 27522 + }, + { + "epoch": 0.83, + "learning_rate": 3.731514749123141e-07, + "loss": 1.1244, + "step": 27523 + }, + { + "epoch": 0.83, + "learning_rate": 3.730232836526626e-07, + "loss": 1.1219, + "step": 27524 + }, + { + "epoch": 0.83, + "learning_rate": 3.7289511264080506e-07, + "loss": 1.0381, + "step": 27525 + }, + { + "epoch": 0.83, + "learning_rate": 3.727669618779617e-07, + "loss": 1.2112, + "step": 27526 + }, + { + "epoch": 0.83, + "learning_rate": 3.726388313653528e-07, + "loss": 1.1651, + "step": 27527 + }, + { + "epoch": 0.83, + "learning_rate": 3.725107211041973e-07, + "loss": 1.0153, + "step": 27528 + }, + { + "epoch": 0.83, + "learning_rate": 3.723826310957149e-07, + "loss": 1.0403, + "step": 27529 + }, + { + "epoch": 0.83, + "learning_rate": 3.722545613411252e-07, + "loss": 1.1567, + "step": 27530 + }, + { + "epoch": 0.83, + "learning_rate": 3.7212651184164813e-07, + "loss": 1.1127, + "step": 27531 + }, + { + "epoch": 0.83, + "learning_rate": 3.71998482598501e-07, + "loss": 1.1257, + "step": 27532 + }, + { + "epoch": 0.83, + "learning_rate": 3.7187047361290365e-07, + "loss": 1.1371, + "step": 27533 + }, + { + "epoch": 0.83, + "learning_rate": 3.71742484886074e-07, + "loss": 0.9801, + "step": 27534 + }, + { + "epoch": 0.83, + "learning_rate": 3.716145164192314e-07, + "loss": 1.1563, + "step": 27535 + }, + { + "epoch": 0.83, + "learning_rate": 3.7148656821359375e-07, + "loss": 1.2405, + "step": 27536 + }, + { + "epoch": 0.83, + "learning_rate": 3.7135864027037837e-07, + "loss": 1.1964, + "step": 27537 + }, + { + "epoch": 0.83, + "learning_rate": 3.7123073259080376e-07, + "loss": 1.0419, + "step": 27538 + }, + { + "epoch": 0.83, + "learning_rate": 3.71102845176087e-07, + "loss": 1.0913, + "step": 27539 + }, + { + "epoch": 0.83, + "learning_rate": 3.7097497802744604e-07, + "loss": 1.0526, + "step": 27540 + }, + { + "epoch": 0.83, + "learning_rate": 3.7084713114609787e-07, + "loss": 1.1398, + "step": 27541 + }, + { + "epoch": 0.83, + "learning_rate": 3.7071930453325964e-07, + "loss": 1.076, + "step": 27542 + }, + { + "epoch": 0.83, + "learning_rate": 3.7059149819014817e-07, + "loss": 1.0639, + "step": 27543 + }, + { + "epoch": 0.83, + "learning_rate": 3.704637121179805e-07, + "loss": 1.0084, + "step": 27544 + }, + { + "epoch": 0.83, + "learning_rate": 3.7033594631797233e-07, + "loss": 1.0365, + "step": 27545 + }, + { + "epoch": 0.83, + "learning_rate": 3.702082007913399e-07, + "loss": 1.0719, + "step": 27546 + }, + { + "epoch": 0.83, + "learning_rate": 3.700804755393e-07, + "loss": 1.2042, + "step": 27547 + }, + { + "epoch": 0.83, + "learning_rate": 3.699527705630679e-07, + "loss": 1.1328, + "step": 27548 + }, + { + "epoch": 0.83, + "learning_rate": 3.6982508586386024e-07, + "loss": 1.103, + "step": 27549 + }, + { + "epoch": 0.83, + "learning_rate": 3.696974214428914e-07, + "loss": 1.0133, + "step": 27550 + }, + { + "epoch": 0.83, + "learning_rate": 3.6956977730137705e-07, + "loss": 1.0815, + "step": 27551 + }, + { + "epoch": 0.83, + "learning_rate": 3.694421534405321e-07, + "loss": 1.0174, + "step": 27552 + }, + { + "epoch": 0.83, + "learning_rate": 3.6931454986157274e-07, + "loss": 1.1066, + "step": 27553 + }, + { + "epoch": 0.83, + "learning_rate": 3.691869665657119e-07, + "loss": 1.1122, + "step": 27554 + }, + { + "epoch": 0.83, + "learning_rate": 3.6905940355416474e-07, + "loss": 1.1871, + "step": 27555 + }, + { + "epoch": 0.83, + "learning_rate": 3.6893186082814616e-07, + "loss": 1.1128, + "step": 27556 + }, + { + "epoch": 0.83, + "learning_rate": 3.688043383888701e-07, + "loss": 0.9984, + "step": 27557 + }, + { + "epoch": 0.83, + "learning_rate": 3.686768362375498e-07, + "loss": 1.0746, + "step": 27558 + }, + { + "epoch": 0.83, + "learning_rate": 3.6854935437539985e-07, + "loss": 1.0496, + "step": 27559 + }, + { + "epoch": 0.83, + "learning_rate": 3.6842189280363314e-07, + "loss": 1.1315, + "step": 27560 + }, + { + "epoch": 0.83, + "learning_rate": 3.6829445152346347e-07, + "loss": 1.1049, + "step": 27561 + }, + { + "epoch": 0.83, + "learning_rate": 3.6816703053610485e-07, + "loss": 1.0498, + "step": 27562 + }, + { + "epoch": 0.83, + "learning_rate": 3.6803962984276854e-07, + "loss": 1.0449, + "step": 27563 + }, + { + "epoch": 0.83, + "learning_rate": 3.6791224944466823e-07, + "loss": 1.0923, + "step": 27564 + }, + { + "epoch": 0.83, + "learning_rate": 3.677848893430164e-07, + "loss": 1.054, + "step": 27565 + }, + { + "epoch": 0.83, + "learning_rate": 3.676575495390261e-07, + "loss": 1.0634, + "step": 27566 + }, + { + "epoch": 0.83, + "learning_rate": 3.675302300339084e-07, + "loss": 1.1696, + "step": 27567 + }, + { + "epoch": 0.83, + "learning_rate": 3.674029308288757e-07, + "loss": 1.1508, + "step": 27568 + }, + { + "epoch": 0.83, + "learning_rate": 3.6727565192514023e-07, + "loss": 1.1071, + "step": 27569 + }, + { + "epoch": 0.83, + "learning_rate": 3.671483933239134e-07, + "loss": 1.0142, + "step": 27570 + }, + { + "epoch": 0.83, + "learning_rate": 3.670211550264066e-07, + "loss": 1.1508, + "step": 27571 + }, + { + "epoch": 0.83, + "learning_rate": 3.668939370338312e-07, + "loss": 1.182, + "step": 27572 + }, + { + "epoch": 0.83, + "learning_rate": 3.667667393473981e-07, + "loss": 1.269, + "step": 27573 + }, + { + "epoch": 0.83, + "learning_rate": 3.66639561968318e-07, + "loss": 1.2289, + "step": 27574 + }, + { + "epoch": 0.83, + "learning_rate": 3.665124048978028e-07, + "loss": 1.1172, + "step": 27575 + }, + { + "epoch": 0.83, + "learning_rate": 3.663852681370611e-07, + "loss": 1.0842, + "step": 27576 + }, + { + "epoch": 0.83, + "learning_rate": 3.6625815168730425e-07, + "loss": 1.114, + "step": 27577 + }, + { + "epoch": 0.83, + "learning_rate": 3.6613105554974214e-07, + "loss": 1.085, + "step": 27578 + }, + { + "epoch": 0.83, + "learning_rate": 3.6600397972558515e-07, + "loss": 1.0635, + "step": 27579 + }, + { + "epoch": 0.83, + "learning_rate": 3.6587692421604206e-07, + "loss": 1.0394, + "step": 27580 + }, + { + "epoch": 0.83, + "learning_rate": 3.657498890223227e-07, + "loss": 1.1406, + "step": 27581 + }, + { + "epoch": 0.83, + "learning_rate": 3.6562287414563663e-07, + "loss": 1.0965, + "step": 27582 + }, + { + "epoch": 0.83, + "learning_rate": 3.654958795871932e-07, + "loss": 1.0507, + "step": 27583 + }, + { + "epoch": 0.83, + "learning_rate": 3.653689053482007e-07, + "loss": 1.1315, + "step": 27584 + }, + { + "epoch": 0.83, + "learning_rate": 3.65241951429868e-07, + "loss": 1.068, + "step": 27585 + }, + { + "epoch": 0.83, + "learning_rate": 3.651150178334037e-07, + "loss": 1.035, + "step": 27586 + }, + { + "epoch": 0.83, + "learning_rate": 3.6498810456001704e-07, + "loss": 1.1601, + "step": 27587 + }, + { + "epoch": 0.83, + "learning_rate": 3.6486121161091457e-07, + "loss": 1.157, + "step": 27588 + }, + { + "epoch": 0.83, + "learning_rate": 3.6473433898730507e-07, + "loss": 1.0951, + "step": 27589 + }, + { + "epoch": 0.83, + "learning_rate": 3.6460748669039646e-07, + "loss": 1.0934, + "step": 27590 + }, + { + "epoch": 0.83, + "learning_rate": 3.644806547213958e-07, + "loss": 1.1466, + "step": 27591 + }, + { + "epoch": 0.83, + "learning_rate": 3.643538430815116e-07, + "loss": 1.1773, + "step": 27592 + }, + { + "epoch": 0.83, + "learning_rate": 3.6422705177194985e-07, + "loss": 1.1052, + "step": 27593 + }, + { + "epoch": 0.83, + "learning_rate": 3.6410028079391784e-07, + "loss": 1.1328, + "step": 27594 + }, + { + "epoch": 0.83, + "learning_rate": 3.639735301486222e-07, + "loss": 1.1397, + "step": 27595 + }, + { + "epoch": 0.83, + "learning_rate": 3.638467998372702e-07, + "loss": 0.9839, + "step": 27596 + }, + { + "epoch": 0.83, + "learning_rate": 3.637200898610677e-07, + "loss": 1.0938, + "step": 27597 + }, + { + "epoch": 0.83, + "learning_rate": 3.63593400221221e-07, + "loss": 1.1569, + "step": 27598 + }, + { + "epoch": 0.83, + "learning_rate": 3.6346673091893605e-07, + "loss": 1.0601, + "step": 27599 + }, + { + "epoch": 0.83, + "learning_rate": 3.6334008195541976e-07, + "loss": 1.0954, + "step": 27600 + }, + { + "epoch": 0.83, + "learning_rate": 3.6321345333187594e-07, + "loss": 0.9999, + "step": 27601 + }, + { + "epoch": 0.83, + "learning_rate": 3.630868450495112e-07, + "loss": 1.142, + "step": 27602 + }, + { + "epoch": 0.83, + "learning_rate": 3.629602571095303e-07, + "loss": 1.0048, + "step": 27603 + }, + { + "epoch": 0.83, + "learning_rate": 3.6283368951313877e-07, + "loss": 1.2035, + "step": 27604 + }, + { + "epoch": 0.83, + "learning_rate": 3.6270714226154165e-07, + "loss": 1.0302, + "step": 27605 + }, + { + "epoch": 0.83, + "learning_rate": 3.6258061535594274e-07, + "loss": 1.0896, + "step": 27606 + }, + { + "epoch": 0.83, + "learning_rate": 3.624541087975467e-07, + "loss": 1.0491, + "step": 27607 + }, + { + "epoch": 0.83, + "learning_rate": 3.6232762258755827e-07, + "loss": 1.1362, + "step": 27608 + }, + { + "epoch": 0.83, + "learning_rate": 3.6220115672718187e-07, + "loss": 1.0273, + "step": 27609 + }, + { + "epoch": 0.83, + "learning_rate": 3.6207471121762013e-07, + "loss": 1.0781, + "step": 27610 + }, + { + "epoch": 0.83, + "learning_rate": 3.6194828606007757e-07, + "loss": 1.1224, + "step": 27611 + }, + { + "epoch": 0.83, + "learning_rate": 3.618218812557578e-07, + "loss": 1.1182, + "step": 27612 + }, + { + "epoch": 0.83, + "learning_rate": 3.6169549680586416e-07, + "loss": 1.1451, + "step": 27613 + }, + { + "epoch": 0.83, + "learning_rate": 3.615691327115994e-07, + "loss": 1.156, + "step": 27614 + }, + { + "epoch": 0.83, + "learning_rate": 3.614427889741662e-07, + "loss": 1.0848, + "step": 27615 + }, + { + "epoch": 0.83, + "learning_rate": 3.613164655947679e-07, + "loss": 1.0098, + "step": 27616 + }, + { + "epoch": 0.83, + "learning_rate": 3.611901625746067e-07, + "loss": 1.1785, + "step": 27617 + }, + { + "epoch": 0.83, + "learning_rate": 3.6106387991488576e-07, + "loss": 1.127, + "step": 27618 + }, + { + "epoch": 0.83, + "learning_rate": 3.6093761761680583e-07, + "loss": 1.0461, + "step": 27619 + }, + { + "epoch": 0.83, + "learning_rate": 3.608113756815698e-07, + "loss": 1.0198, + "step": 27620 + }, + { + "epoch": 0.83, + "learning_rate": 3.6068515411037896e-07, + "loss": 1.0352, + "step": 27621 + }, + { + "epoch": 0.83, + "learning_rate": 3.6055895290443537e-07, + "loss": 1.0859, + "step": 27622 + }, + { + "epoch": 0.83, + "learning_rate": 3.6043277206494006e-07, + "loss": 1.11, + "step": 27623 + }, + { + "epoch": 0.83, + "learning_rate": 3.6030661159309423e-07, + "loss": 1.0654, + "step": 27624 + }, + { + "epoch": 0.83, + "learning_rate": 3.601804714900989e-07, + "loss": 1.2301, + "step": 27625 + }, + { + "epoch": 0.83, + "learning_rate": 3.600543517571556e-07, + "loss": 1.1696, + "step": 27626 + }, + { + "epoch": 0.83, + "learning_rate": 3.599282523954636e-07, + "loss": 1.0473, + "step": 27627 + }, + { + "epoch": 0.83, + "learning_rate": 3.59802173406224e-07, + "loss": 1.1361, + "step": 27628 + }, + { + "epoch": 0.83, + "learning_rate": 3.596761147906369e-07, + "loss": 1.1396, + "step": 27629 + }, + { + "epoch": 0.83, + "learning_rate": 3.5955007654990244e-07, + "loss": 1.1722, + "step": 27630 + }, + { + "epoch": 0.83, + "learning_rate": 3.594240586852207e-07, + "loss": 1.0685, + "step": 27631 + }, + { + "epoch": 0.83, + "learning_rate": 3.592980611977906e-07, + "loss": 1.2556, + "step": 27632 + }, + { + "epoch": 0.83, + "learning_rate": 3.5917208408881214e-07, + "loss": 1.1249, + "step": 27633 + }, + { + "epoch": 0.83, + "learning_rate": 3.590461273594842e-07, + "loss": 1.0536, + "step": 27634 + }, + { + "epoch": 0.83, + "learning_rate": 3.5892019101100655e-07, + "loss": 1.1321, + "step": 27635 + }, + { + "epoch": 0.83, + "learning_rate": 3.587942750445769e-07, + "loss": 1.1521, + "step": 27636 + }, + { + "epoch": 0.83, + "learning_rate": 3.586683794613946e-07, + "loss": 1.1011, + "step": 27637 + }, + { + "epoch": 0.83, + "learning_rate": 3.585425042626581e-07, + "loss": 1.0349, + "step": 27638 + }, + { + "epoch": 0.83, + "learning_rate": 3.584166494495661e-07, + "loss": 1.0675, + "step": 27639 + }, + { + "epoch": 0.83, + "learning_rate": 3.5829081502331554e-07, + "loss": 1.1006, + "step": 27640 + }, + { + "epoch": 0.83, + "learning_rate": 3.5816500098510483e-07, + "loss": 1.0369, + "step": 27641 + }, + { + "epoch": 0.83, + "learning_rate": 3.580392073361322e-07, + "loss": 1.0822, + "step": 27642 + }, + { + "epoch": 0.83, + "learning_rate": 3.5791343407759417e-07, + "loss": 1.2359, + "step": 27643 + }, + { + "epoch": 0.83, + "learning_rate": 3.5778768121068953e-07, + "loss": 1.1511, + "step": 27644 + }, + { + "epoch": 0.83, + "learning_rate": 3.576619487366137e-07, + "loss": 1.1182, + "step": 27645 + }, + { + "epoch": 0.83, + "learning_rate": 3.575362366565643e-07, + "loss": 1.1125, + "step": 27646 + }, + { + "epoch": 0.83, + "learning_rate": 3.5741054497173826e-07, + "loss": 1.0973, + "step": 27647 + }, + { + "epoch": 0.83, + "learning_rate": 3.572848736833326e-07, + "loss": 1.1161, + "step": 27648 + }, + { + "epoch": 0.83, + "learning_rate": 3.571592227925422e-07, + "loss": 1.1511, + "step": 27649 + }, + { + "epoch": 0.83, + "learning_rate": 3.5703359230056384e-07, + "loss": 1.0878, + "step": 27650 + }, + { + "epoch": 0.83, + "learning_rate": 3.5690798220859385e-07, + "loss": 1.1016, + "step": 27651 + }, + { + "epoch": 0.83, + "learning_rate": 3.567823925178274e-07, + "loss": 1.1032, + "step": 27652 + }, + { + "epoch": 0.83, + "learning_rate": 3.566568232294607e-07, + "loss": 0.9921, + "step": 27653 + }, + { + "epoch": 0.83, + "learning_rate": 3.565312743446886e-07, + "loss": 1.0814, + "step": 27654 + }, + { + "epoch": 0.83, + "learning_rate": 3.5640574586470663e-07, + "loss": 1.2007, + "step": 27655 + }, + { + "epoch": 0.83, + "learning_rate": 3.562802377907093e-07, + "loss": 1.032, + "step": 27656 + }, + { + "epoch": 0.83, + "learning_rate": 3.561547501238924e-07, + "loss": 1.0862, + "step": 27657 + }, + { + "epoch": 0.83, + "learning_rate": 3.5602928286544907e-07, + "loss": 1.1989, + "step": 27658 + }, + { + "epoch": 0.83, + "learning_rate": 3.559038360165745e-07, + "loss": 1.108, + "step": 27659 + }, + { + "epoch": 0.83, + "learning_rate": 3.5577840957846275e-07, + "loss": 1.1422, + "step": 27660 + }, + { + "epoch": 0.83, + "learning_rate": 3.5565300355230844e-07, + "loss": 1.1675, + "step": 27661 + }, + { + "epoch": 0.83, + "learning_rate": 3.555276179393041e-07, + "loss": 1.2226, + "step": 27662 + }, + { + "epoch": 0.83, + "learning_rate": 3.554022527406442e-07, + "loss": 1.1162, + "step": 27663 + }, + { + "epoch": 0.83, + "learning_rate": 3.552769079575219e-07, + "loss": 1.0687, + "step": 27664 + }, + { + "epoch": 0.83, + "learning_rate": 3.551515835911309e-07, + "loss": 1.1178, + "step": 27665 + }, + { + "epoch": 0.83, + "learning_rate": 3.5502627964266346e-07, + "loss": 1.1406, + "step": 27666 + }, + { + "epoch": 0.83, + "learning_rate": 3.549009961133129e-07, + "loss": 1.0988, + "step": 27667 + }, + { + "epoch": 0.83, + "learning_rate": 3.547757330042714e-07, + "loss": 1.2415, + "step": 27668 + }, + { + "epoch": 0.83, + "learning_rate": 3.546504903167322e-07, + "loss": 1.0657, + "step": 27669 + }, + { + "epoch": 0.83, + "learning_rate": 3.5452526805188736e-07, + "loss": 1.0689, + "step": 27670 + }, + { + "epoch": 0.83, + "learning_rate": 3.5440006621092817e-07, + "loss": 1.0928, + "step": 27671 + }, + { + "epoch": 0.83, + "learning_rate": 3.54274884795047e-07, + "loss": 1.0305, + "step": 27672 + }, + { + "epoch": 0.83, + "learning_rate": 3.5414972380543535e-07, + "loss": 1.0945, + "step": 27673 + }, + { + "epoch": 0.83, + "learning_rate": 3.5402458324328564e-07, + "loss": 1.1926, + "step": 27674 + }, + { + "epoch": 0.83, + "learning_rate": 3.538994631097875e-07, + "loss": 1.2086, + "step": 27675 + }, + { + "epoch": 0.83, + "learning_rate": 3.537743634061333e-07, + "loss": 1.1443, + "step": 27676 + }, + { + "epoch": 0.83, + "learning_rate": 3.536492841335132e-07, + "loss": 1.0367, + "step": 27677 + }, + { + "epoch": 0.83, + "learning_rate": 3.5352422529311817e-07, + "loss": 0.9786, + "step": 27678 + }, + { + "epoch": 0.83, + "learning_rate": 3.533991868861389e-07, + "loss": 1.072, + "step": 27679 + }, + { + "epoch": 0.83, + "learning_rate": 3.532741689137656e-07, + "loss": 1.105, + "step": 27680 + }, + { + "epoch": 0.83, + "learning_rate": 3.5314917137718813e-07, + "loss": 1.1746, + "step": 27681 + }, + { + "epoch": 0.83, + "learning_rate": 3.5302419427759667e-07, + "loss": 1.0423, + "step": 27682 + }, + { + "epoch": 0.83, + "learning_rate": 3.5289923761618135e-07, + "loss": 1.0715, + "step": 27683 + }, + { + "epoch": 0.83, + "learning_rate": 3.5277430139413066e-07, + "loss": 1.0169, + "step": 27684 + }, + { + "epoch": 0.83, + "learning_rate": 3.526493856126345e-07, + "loss": 1.1634, + "step": 27685 + }, + { + "epoch": 0.83, + "learning_rate": 3.5252449027288195e-07, + "loss": 1.0442, + "step": 27686 + }, + { + "epoch": 0.83, + "learning_rate": 3.523996153760628e-07, + "loss": 1.0397, + "step": 27687 + }, + { + "epoch": 0.83, + "learning_rate": 3.5227476092336425e-07, + "loss": 1.1497, + "step": 27688 + }, + { + "epoch": 0.83, + "learning_rate": 3.521499269159756e-07, + "loss": 1.061, + "step": 27689 + }, + { + "epoch": 0.83, + "learning_rate": 3.5202511335508507e-07, + "loss": 1.1376, + "step": 27690 + }, + { + "epoch": 0.83, + "learning_rate": 3.5190032024188166e-07, + "loss": 1.0604, + "step": 27691 + }, + { + "epoch": 0.83, + "learning_rate": 3.517755475775522e-07, + "loss": 1.0908, + "step": 27692 + }, + { + "epoch": 0.83, + "learning_rate": 3.5165079536328473e-07, + "loss": 0.986, + "step": 27693 + }, + { + "epoch": 0.83, + "learning_rate": 3.515260636002671e-07, + "loss": 1.1179, + "step": 27694 + }, + { + "epoch": 0.83, + "learning_rate": 3.514013522896864e-07, + "loss": 1.0794, + "step": 27695 + }, + { + "epoch": 0.83, + "learning_rate": 3.5127666143273094e-07, + "loss": 1.1234, + "step": 27696 + }, + { + "epoch": 0.83, + "learning_rate": 3.511519910305861e-07, + "loss": 1.1511, + "step": 27697 + }, + { + "epoch": 0.83, + "learning_rate": 3.510273410844392e-07, + "loss": 1.1923, + "step": 27698 + }, + { + "epoch": 0.83, + "learning_rate": 3.5090271159547717e-07, + "loss": 1.1744, + "step": 27699 + }, + { + "epoch": 0.83, + "learning_rate": 3.507781025648868e-07, + "loss": 1.1301, + "step": 27700 + }, + { + "epoch": 0.83, + "learning_rate": 3.5065351399385326e-07, + "loss": 1.1721, + "step": 27701 + }, + { + "epoch": 0.83, + "learning_rate": 3.5052894588356314e-07, + "loss": 1.1497, + "step": 27702 + }, + { + "epoch": 0.83, + "learning_rate": 3.504043982352021e-07, + "loss": 1.0233, + "step": 27703 + }, + { + "epoch": 0.83, + "learning_rate": 3.502798710499561e-07, + "loss": 1.04, + "step": 27704 + }, + { + "epoch": 0.83, + "learning_rate": 3.501553643290104e-07, + "loss": 1.1709, + "step": 27705 + }, + { + "epoch": 0.83, + "learning_rate": 3.5003087807355007e-07, + "loss": 1.1793, + "step": 27706 + }, + { + "epoch": 0.83, + "learning_rate": 3.4990641228476035e-07, + "loss": 1.0991, + "step": 27707 + }, + { + "epoch": 0.83, + "learning_rate": 3.4978196696382665e-07, + "loss": 0.9733, + "step": 27708 + }, + { + "epoch": 0.83, + "learning_rate": 3.496575421119325e-07, + "loss": 1.0484, + "step": 27709 + }, + { + "epoch": 0.83, + "learning_rate": 3.49533137730263e-07, + "loss": 1.1482, + "step": 27710 + }, + { + "epoch": 0.83, + "learning_rate": 3.494087538200022e-07, + "loss": 1.021, + "step": 27711 + }, + { + "epoch": 0.83, + "learning_rate": 3.4928439038233427e-07, + "loss": 1.2548, + "step": 27712 + }, + { + "epoch": 0.83, + "learning_rate": 3.491600474184437e-07, + "loss": 1.0128, + "step": 27713 + }, + { + "epoch": 0.83, + "learning_rate": 3.4903572492951316e-07, + "loss": 1.1584, + "step": 27714 + }, + { + "epoch": 0.83, + "learning_rate": 3.489114229167265e-07, + "loss": 1.0459, + "step": 27715 + }, + { + "epoch": 0.83, + "learning_rate": 3.487871413812671e-07, + "loss": 1.0554, + "step": 27716 + }, + { + "epoch": 0.83, + "learning_rate": 3.486628803243186e-07, + "loss": 1.0875, + "step": 27717 + }, + { + "epoch": 0.84, + "learning_rate": 3.4853863974706274e-07, + "loss": 1.246, + "step": 27718 + }, + { + "epoch": 0.84, + "learning_rate": 3.4841441965068306e-07, + "loss": 1.1842, + "step": 27719 + }, + { + "epoch": 0.84, + "learning_rate": 3.4829022003636165e-07, + "loss": 1.174, + "step": 27720 + }, + { + "epoch": 0.84, + "learning_rate": 3.481660409052812e-07, + "loss": 1.0848, + "step": 27721 + }, + { + "epoch": 0.84, + "learning_rate": 3.48041882258624e-07, + "loss": 0.975, + "step": 27722 + }, + { + "epoch": 0.84, + "learning_rate": 3.4791774409757145e-07, + "loss": 1.0842, + "step": 27723 + }, + { + "epoch": 0.84, + "learning_rate": 3.4779362642330534e-07, + "loss": 1.241, + "step": 27724 + }, + { + "epoch": 0.84, + "learning_rate": 3.476695292370072e-07, + "loss": 1.1599, + "step": 27725 + }, + { + "epoch": 0.84, + "learning_rate": 3.4754545253985944e-07, + "loss": 1.0612, + "step": 27726 + }, + { + "epoch": 0.84, + "learning_rate": 3.474213963330414e-07, + "loss": 0.9987, + "step": 27727 + }, + { + "epoch": 0.84, + "learning_rate": 3.4729736061773514e-07, + "loss": 1.0041, + "step": 27728 + }, + { + "epoch": 0.84, + "learning_rate": 3.471733453951212e-07, + "loss": 1.1842, + "step": 27729 + }, + { + "epoch": 0.84, + "learning_rate": 3.470493506663808e-07, + "loss": 1.1536, + "step": 27730 + }, + { + "epoch": 0.84, + "learning_rate": 3.4692537643269297e-07, + "loss": 1.2058, + "step": 27731 + }, + { + "epoch": 0.84, + "learning_rate": 3.4680142269523875e-07, + "loss": 0.9529, + "step": 27732 + }, + { + "epoch": 0.84, + "learning_rate": 3.46677489455198e-07, + "loss": 1.1302, + "step": 27733 + }, + { + "epoch": 0.84, + "learning_rate": 3.465535767137504e-07, + "loss": 1.0698, + "step": 27734 + }, + { + "epoch": 0.84, + "learning_rate": 3.464296844720755e-07, + "loss": 1.1058, + "step": 27735 + }, + { + "epoch": 0.84, + "learning_rate": 3.463058127313529e-07, + "loss": 1.1447, + "step": 27736 + }, + { + "epoch": 0.84, + "learning_rate": 3.461819614927617e-07, + "loss": 1.157, + "step": 27737 + }, + { + "epoch": 0.84, + "learning_rate": 3.4605813075748093e-07, + "loss": 1.0743, + "step": 27738 + }, + { + "epoch": 0.84, + "learning_rate": 3.459343205266899e-07, + "loss": 1.0846, + "step": 27739 + }, + { + "epoch": 0.84, + "learning_rate": 3.4581053080156635e-07, + "loss": 0.9811, + "step": 27740 + }, + { + "epoch": 0.84, + "learning_rate": 3.456867615832887e-07, + "loss": 1.075, + "step": 27741 + }, + { + "epoch": 0.84, + "learning_rate": 3.4556301287303585e-07, + "loss": 1.0593, + "step": 27742 + }, + { + "epoch": 0.84, + "learning_rate": 3.454392846719859e-07, + "loss": 1.1198, + "step": 27743 + }, + { + "epoch": 0.84, + "learning_rate": 3.4531557698131574e-07, + "loss": 1.11, + "step": 27744 + }, + { + "epoch": 0.84, + "learning_rate": 3.451918898022036e-07, + "loss": 1.057, + "step": 27745 + }, + { + "epoch": 0.84, + "learning_rate": 3.4506822313582683e-07, + "loss": 0.9813, + "step": 27746 + }, + { + "epoch": 0.84, + "learning_rate": 3.4494457698336284e-07, + "loss": 1.1547, + "step": 27747 + }, + { + "epoch": 0.84, + "learning_rate": 3.448209513459891e-07, + "loss": 1.181, + "step": 27748 + }, + { + "epoch": 0.84, + "learning_rate": 3.4469734622488123e-07, + "loss": 1.1035, + "step": 27749 + }, + { + "epoch": 0.84, + "learning_rate": 3.445737616212166e-07, + "loss": 1.1123, + "step": 27750 + }, + { + "epoch": 0.84, + "learning_rate": 3.444501975361719e-07, + "loss": 1.0784, + "step": 27751 + }, + { + "epoch": 0.84, + "learning_rate": 3.4432665397092337e-07, + "loss": 0.9749, + "step": 27752 + }, + { + "epoch": 0.84, + "learning_rate": 3.4420313092664663e-07, + "loss": 1.0455, + "step": 27753 + }, + { + "epoch": 0.84, + "learning_rate": 3.440796284045178e-07, + "loss": 1.1337, + "step": 27754 + }, + { + "epoch": 0.84, + "learning_rate": 3.4395614640571254e-07, + "loss": 1.1089, + "step": 27755 + }, + { + "epoch": 0.84, + "learning_rate": 3.4383268493140693e-07, + "loss": 1.1356, + "step": 27756 + }, + { + "epoch": 0.84, + "learning_rate": 3.4370924398277496e-07, + "loss": 1.0447, + "step": 27757 + }, + { + "epoch": 0.84, + "learning_rate": 3.4358582356099263e-07, + "loss": 1.1302, + "step": 27758 + }, + { + "epoch": 0.84, + "learning_rate": 3.434624236672349e-07, + "loss": 1.1585, + "step": 27759 + }, + { + "epoch": 0.84, + "learning_rate": 3.4333904430267603e-07, + "loss": 0.9686, + "step": 27760 + }, + { + "epoch": 0.84, + "learning_rate": 3.4321568546849063e-07, + "loss": 1.184, + "step": 27761 + }, + { + "epoch": 0.84, + "learning_rate": 3.430923471658534e-07, + "loss": 1.0906, + "step": 27762 + }, + { + "epoch": 0.84, + "learning_rate": 3.429690293959381e-07, + "loss": 1.06, + "step": 27763 + }, + { + "epoch": 0.84, + "learning_rate": 3.428457321599191e-07, + "loss": 1.1834, + "step": 27764 + }, + { + "epoch": 0.84, + "learning_rate": 3.4272245545897004e-07, + "loss": 1.0263, + "step": 27765 + }, + { + "epoch": 0.84, + "learning_rate": 3.425991992942637e-07, + "loss": 1.0282, + "step": 27766 + }, + { + "epoch": 0.84, + "learning_rate": 3.424759636669742e-07, + "loss": 1.1958, + "step": 27767 + }, + { + "epoch": 0.84, + "learning_rate": 3.4235274857827406e-07, + "loss": 1.1205, + "step": 27768 + }, + { + "epoch": 0.84, + "learning_rate": 3.4222955402933745e-07, + "loss": 1.1821, + "step": 27769 + }, + { + "epoch": 0.84, + "learning_rate": 3.421063800213353e-07, + "loss": 1.0934, + "step": 27770 + }, + { + "epoch": 0.84, + "learning_rate": 3.4198322655544154e-07, + "loss": 1.1522, + "step": 27771 + }, + { + "epoch": 0.84, + "learning_rate": 3.4186009363282815e-07, + "loss": 1.0111, + "step": 27772 + }, + { + "epoch": 0.84, + "learning_rate": 3.4173698125466754e-07, + "loss": 1.1982, + "step": 27773 + }, + { + "epoch": 0.84, + "learning_rate": 3.41613889422131e-07, + "loss": 1.2665, + "step": 27774 + }, + { + "epoch": 0.84, + "learning_rate": 3.4149081813639075e-07, + "loss": 1.0811, + "step": 27775 + }, + { + "epoch": 0.84, + "learning_rate": 3.413677673986182e-07, + "loss": 1.0826, + "step": 27776 + }, + { + "epoch": 0.84, + "learning_rate": 3.41244737209985e-07, + "loss": 1.1696, + "step": 27777 + }, + { + "epoch": 0.84, + "learning_rate": 3.4112172757166274e-07, + "loss": 1.2258, + "step": 27778 + }, + { + "epoch": 0.84, + "learning_rate": 3.4099873848482125e-07, + "loss": 1.2277, + "step": 27779 + }, + { + "epoch": 0.84, + "learning_rate": 3.408757699506321e-07, + "loss": 1.1533, + "step": 27780 + }, + { + "epoch": 0.84, + "learning_rate": 3.4075282197026575e-07, + "loss": 1.189, + "step": 27781 + }, + { + "epoch": 0.84, + "learning_rate": 3.40629894544893e-07, + "loss": 1.1239, + "step": 27782 + }, + { + "epoch": 0.84, + "learning_rate": 3.4050698767568337e-07, + "loss": 1.1805, + "step": 27783 + }, + { + "epoch": 0.84, + "learning_rate": 3.403841013638068e-07, + "loss": 1.0838, + "step": 27784 + }, + { + "epoch": 0.84, + "learning_rate": 3.402612356104337e-07, + "loss": 1.1426, + "step": 27785 + }, + { + "epoch": 0.84, + "learning_rate": 3.401383904167335e-07, + "loss": 1.089, + "step": 27786 + }, + { + "epoch": 0.84, + "learning_rate": 3.400155657838755e-07, + "loss": 1.0806, + "step": 27787 + }, + { + "epoch": 0.84, + "learning_rate": 3.39892761713029e-07, + "loss": 0.9907, + "step": 27788 + }, + { + "epoch": 0.84, + "learning_rate": 3.397699782053632e-07, + "loss": 1.1749, + "step": 27789 + }, + { + "epoch": 0.84, + "learning_rate": 3.396472152620467e-07, + "loss": 1.0522, + "step": 27790 + }, + { + "epoch": 0.84, + "learning_rate": 3.3952447288424896e-07, + "loss": 1.2151, + "step": 27791 + }, + { + "epoch": 0.84, + "learning_rate": 3.3940175107313704e-07, + "loss": 1.1173, + "step": 27792 + }, + { + "epoch": 0.84, + "learning_rate": 3.392790498298798e-07, + "loss": 1.074, + "step": 27793 + }, + { + "epoch": 0.84, + "learning_rate": 3.3915636915564573e-07, + "loss": 1.1384, + "step": 27794 + }, + { + "epoch": 0.84, + "learning_rate": 3.3903370905160246e-07, + "loss": 1.072, + "step": 27795 + }, + { + "epoch": 0.84, + "learning_rate": 3.3891106951891713e-07, + "loss": 1.1412, + "step": 27796 + }, + { + "epoch": 0.84, + "learning_rate": 3.387884505587577e-07, + "loss": 1.0065, + "step": 27797 + }, + { + "epoch": 0.84, + "learning_rate": 3.3866585217229104e-07, + "loss": 1.0108, + "step": 27798 + }, + { + "epoch": 0.84, + "learning_rate": 3.3854327436068535e-07, + "loss": 1.0399, + "step": 27799 + }, + { + "epoch": 0.84, + "learning_rate": 3.384207171251061e-07, + "loss": 1.1353, + "step": 27800 + }, + { + "epoch": 0.84, + "learning_rate": 3.382981804667204e-07, + "loss": 1.1016, + "step": 27801 + }, + { + "epoch": 0.84, + "learning_rate": 3.3817566438669513e-07, + "loss": 1.0093, + "step": 27802 + }, + { + "epoch": 0.84, + "learning_rate": 3.3805316888619625e-07, + "loss": 1.0211, + "step": 27803 + }, + { + "epoch": 0.84, + "learning_rate": 3.3793069396639067e-07, + "loss": 1.1308, + "step": 27804 + }, + { + "epoch": 0.84, + "learning_rate": 3.3780823962844296e-07, + "loss": 1.0653, + "step": 27805 + }, + { + "epoch": 0.84, + "learning_rate": 3.376858058735194e-07, + "loss": 1.0998, + "step": 27806 + }, + { + "epoch": 0.84, + "learning_rate": 3.375633927027855e-07, + "loss": 1.0699, + "step": 27807 + }, + { + "epoch": 0.84, + "learning_rate": 3.374410001174072e-07, + "loss": 1.0677, + "step": 27808 + }, + { + "epoch": 0.84, + "learning_rate": 3.3731862811854867e-07, + "loss": 1.0175, + "step": 27809 + }, + { + "epoch": 0.84, + "learning_rate": 3.3719627670737523e-07, + "loss": 1.1518, + "step": 27810 + }, + { + "epoch": 0.84, + "learning_rate": 3.370739458850514e-07, + "loss": 1.0659, + "step": 27811 + }, + { + "epoch": 0.84, + "learning_rate": 3.369516356527419e-07, + "loss": 1.083, + "step": 27812 + }, + { + "epoch": 0.84, + "learning_rate": 3.3682934601161175e-07, + "loss": 1.0094, + "step": 27813 + }, + { + "epoch": 0.84, + "learning_rate": 3.367070769628239e-07, + "loss": 1.2205, + "step": 27814 + }, + { + "epoch": 0.84, + "learning_rate": 3.365848285075427e-07, + "loss": 1.0499, + "step": 27815 + }, + { + "epoch": 0.84, + "learning_rate": 3.364626006469321e-07, + "loss": 0.9858, + "step": 27816 + }, + { + "epoch": 0.84, + "learning_rate": 3.363403933821555e-07, + "loss": 1.1303, + "step": 27817 + }, + { + "epoch": 0.84, + "learning_rate": 3.362182067143763e-07, + "loss": 1.0743, + "step": 27818 + }, + { + "epoch": 0.84, + "learning_rate": 3.360960406447575e-07, + "loss": 1.0211, + "step": 27819 + }, + { + "epoch": 0.84, + "learning_rate": 3.359738951744623e-07, + "loss": 1.1185, + "step": 27820 + }, + { + "epoch": 0.84, + "learning_rate": 3.3585177030465403e-07, + "loss": 1.0624, + "step": 27821 + }, + { + "epoch": 0.84, + "learning_rate": 3.357296660364942e-07, + "loss": 1.1002, + "step": 27822 + }, + { + "epoch": 0.84, + "learning_rate": 3.356075823711452e-07, + "loss": 1.1184, + "step": 27823 + }, + { + "epoch": 0.84, + "learning_rate": 3.3548551930977e-07, + "loss": 1.2523, + "step": 27824 + }, + { + "epoch": 0.84, + "learning_rate": 3.353634768535305e-07, + "loss": 1.0523, + "step": 27825 + }, + { + "epoch": 0.84, + "learning_rate": 3.352414550035876e-07, + "loss": 1.0657, + "step": 27826 + }, + { + "epoch": 0.84, + "learning_rate": 3.351194537611038e-07, + "loss": 0.9739, + "step": 27827 + }, + { + "epoch": 0.84, + "learning_rate": 3.349974731272398e-07, + "loss": 1.1296, + "step": 27828 + }, + { + "epoch": 0.84, + "learning_rate": 3.3487551310315725e-07, + "loss": 1.0595, + "step": 27829 + }, + { + "epoch": 0.84, + "learning_rate": 3.347535736900176e-07, + "loss": 1.0803, + "step": 27830 + }, + { + "epoch": 0.84, + "learning_rate": 3.346316548889808e-07, + "loss": 1.024, + "step": 27831 + }, + { + "epoch": 0.84, + "learning_rate": 3.345097567012076e-07, + "loss": 1.0786, + "step": 27832 + }, + { + "epoch": 0.84, + "learning_rate": 3.3438787912785846e-07, + "loss": 1.0499, + "step": 27833 + }, + { + "epoch": 0.84, + "learning_rate": 3.342660221700944e-07, + "loss": 1.0018, + "step": 27834 + }, + { + "epoch": 0.84, + "learning_rate": 3.3414418582907393e-07, + "loss": 1.1658, + "step": 27835 + }, + { + "epoch": 0.84, + "learning_rate": 3.3402237010595804e-07, + "loss": 0.9757, + "step": 27836 + }, + { + "epoch": 0.84, + "learning_rate": 3.339005750019059e-07, + "loss": 1.0463, + "step": 27837 + }, + { + "epoch": 0.84, + "learning_rate": 3.3377880051807754e-07, + "loss": 1.0521, + "step": 27838 + }, + { + "epoch": 0.84, + "learning_rate": 3.336570466556313e-07, + "loss": 1.0168, + "step": 27839 + }, + { + "epoch": 0.84, + "learning_rate": 3.335353134157265e-07, + "loss": 1.0563, + "step": 27840 + }, + { + "epoch": 0.84, + "learning_rate": 3.334136007995223e-07, + "loss": 1.1352, + "step": 27841 + }, + { + "epoch": 0.84, + "learning_rate": 3.332919088081771e-07, + "loss": 1.1008, + "step": 27842 + }, + { + "epoch": 0.84, + "learning_rate": 3.331702374428492e-07, + "loss": 1.2423, + "step": 27843 + }, + { + "epoch": 0.84, + "learning_rate": 3.330485867046973e-07, + "loss": 1.0189, + "step": 27844 + }, + { + "epoch": 0.84, + "learning_rate": 3.3292695659487894e-07, + "loss": 1.0581, + "step": 27845 + }, + { + "epoch": 0.84, + "learning_rate": 3.328053471145526e-07, + "loss": 1.1301, + "step": 27846 + }, + { + "epoch": 0.84, + "learning_rate": 3.326837582648759e-07, + "loss": 0.9937, + "step": 27847 + }, + { + "epoch": 0.84, + "learning_rate": 3.325621900470055e-07, + "loss": 1.2081, + "step": 27848 + }, + { + "epoch": 0.84, + "learning_rate": 3.3244064246209907e-07, + "loss": 1.1569, + "step": 27849 + }, + { + "epoch": 0.84, + "learning_rate": 3.3231911551131395e-07, + "loss": 1.0775, + "step": 27850 + }, + { + "epoch": 0.84, + "learning_rate": 3.3219760919580737e-07, + "loss": 1.0235, + "step": 27851 + }, + { + "epoch": 0.84, + "learning_rate": 3.3207612351673495e-07, + "loss": 1.1177, + "step": 27852 + }, + { + "epoch": 0.84, + "learning_rate": 3.3195465847525395e-07, + "loss": 1.1844, + "step": 27853 + }, + { + "epoch": 0.84, + "learning_rate": 3.3183321407252e-07, + "loss": 1.0485, + "step": 27854 + }, + { + "epoch": 0.84, + "learning_rate": 3.3171179030969005e-07, + "loss": 1.199, + "step": 27855 + }, + { + "epoch": 0.84, + "learning_rate": 3.3159038718791976e-07, + "loss": 1.0787, + "step": 27856 + }, + { + "epoch": 0.84, + "learning_rate": 3.3146900470836437e-07, + "loss": 1.0734, + "step": 27857 + }, + { + "epoch": 0.84, + "learning_rate": 3.313476428721796e-07, + "loss": 1.148, + "step": 27858 + }, + { + "epoch": 0.84, + "learning_rate": 3.3122630168052063e-07, + "loss": 0.986, + "step": 27859 + }, + { + "epoch": 0.84, + "learning_rate": 3.3110498113454346e-07, + "loss": 1.1003, + "step": 27860 + }, + { + "epoch": 0.84, + "learning_rate": 3.309836812354017e-07, + "loss": 1.0901, + "step": 27861 + }, + { + "epoch": 0.84, + "learning_rate": 3.308624019842507e-07, + "loss": 1.1388, + "step": 27862 + }, + { + "epoch": 0.84, + "learning_rate": 3.307411433822449e-07, + "loss": 1.1013, + "step": 27863 + }, + { + "epoch": 0.84, + "learning_rate": 3.3061990543053923e-07, + "loss": 1.0138, + "step": 27864 + }, + { + "epoch": 0.84, + "learning_rate": 3.304986881302866e-07, + "loss": 1.0796, + "step": 27865 + }, + { + "epoch": 0.84, + "learning_rate": 3.303774914826419e-07, + "loss": 1.0906, + "step": 27866 + }, + { + "epoch": 0.84, + "learning_rate": 3.302563154887581e-07, + "loss": 1.0986, + "step": 27867 + }, + { + "epoch": 0.84, + "learning_rate": 3.3013516014978955e-07, + "loss": 1.1227, + "step": 27868 + }, + { + "epoch": 0.84, + "learning_rate": 3.30014025466889e-07, + "loss": 1.2007, + "step": 27869 + }, + { + "epoch": 0.84, + "learning_rate": 3.2989291144121e-07, + "loss": 1.0938, + "step": 27870 + }, + { + "epoch": 0.84, + "learning_rate": 3.297718180739054e-07, + "loss": 1.0159, + "step": 27871 + }, + { + "epoch": 0.84, + "learning_rate": 3.2965074536612766e-07, + "loss": 1.1542, + "step": 27872 + }, + { + "epoch": 0.84, + "learning_rate": 3.2952969331903005e-07, + "loss": 0.9967, + "step": 27873 + }, + { + "epoch": 0.84, + "learning_rate": 3.2940866193376414e-07, + "loss": 1.1578, + "step": 27874 + }, + { + "epoch": 0.84, + "learning_rate": 3.292876512114823e-07, + "loss": 1.1638, + "step": 27875 + }, + { + "epoch": 0.84, + "learning_rate": 3.2916666115333646e-07, + "loss": 1.1032, + "step": 27876 + }, + { + "epoch": 0.84, + "learning_rate": 3.29045691760479e-07, + "loss": 1.028, + "step": 27877 + }, + { + "epoch": 0.84, + "learning_rate": 3.289247430340606e-07, + "loss": 0.9977, + "step": 27878 + }, + { + "epoch": 0.84, + "learning_rate": 3.288038149752329e-07, + "loss": 1.118, + "step": 27879 + }, + { + "epoch": 0.84, + "learning_rate": 3.286829075851472e-07, + "loss": 1.0949, + "step": 27880 + }, + { + "epoch": 0.84, + "learning_rate": 3.285620208649545e-07, + "loss": 1.0939, + "step": 27881 + }, + { + "epoch": 0.84, + "learning_rate": 3.284411548158062e-07, + "loss": 1.0103, + "step": 27882 + }, + { + "epoch": 0.84, + "learning_rate": 3.2832030943885177e-07, + "loss": 1.1193, + "step": 27883 + }, + { + "epoch": 0.84, + "learning_rate": 3.281994847352418e-07, + "loss": 1.0767, + "step": 27884 + }, + { + "epoch": 0.84, + "learning_rate": 3.2807868070612704e-07, + "loss": 1.0308, + "step": 27885 + }, + { + "epoch": 0.84, + "learning_rate": 3.279578973526576e-07, + "loss": 1.1294, + "step": 27886 + }, + { + "epoch": 0.84, + "learning_rate": 3.278371346759823e-07, + "loss": 1.1571, + "step": 27887 + }, + { + "epoch": 0.84, + "learning_rate": 3.277163926772514e-07, + "loss": 1.0747, + "step": 27888 + }, + { + "epoch": 0.84, + "learning_rate": 3.275956713576142e-07, + "loss": 1.1056, + "step": 27889 + }, + { + "epoch": 0.84, + "learning_rate": 3.274749707182204e-07, + "loss": 1.1757, + "step": 27890 + }, + { + "epoch": 0.84, + "learning_rate": 3.2735429076021813e-07, + "loss": 1.1392, + "step": 27891 + }, + { + "epoch": 0.84, + "learning_rate": 3.272336314847566e-07, + "loss": 1.0668, + "step": 27892 + }, + { + "epoch": 0.84, + "learning_rate": 3.271129928929845e-07, + "loss": 1.1082, + "step": 27893 + }, + { + "epoch": 0.84, + "learning_rate": 3.2699237498605014e-07, + "loss": 1.0096, + "step": 27894 + }, + { + "epoch": 0.84, + "learning_rate": 3.268717777651026e-07, + "loss": 1.1647, + "step": 27895 + }, + { + "epoch": 0.84, + "learning_rate": 3.2675120123128817e-07, + "loss": 1.0109, + "step": 27896 + }, + { + "epoch": 0.84, + "learning_rate": 3.26630645385756e-07, + "loss": 1.0129, + "step": 27897 + }, + { + "epoch": 0.84, + "learning_rate": 3.265101102296531e-07, + "loss": 1.0847, + "step": 27898 + }, + { + "epoch": 0.84, + "learning_rate": 3.2638959576412723e-07, + "loss": 1.1334, + "step": 27899 + }, + { + "epoch": 0.84, + "learning_rate": 3.262691019903255e-07, + "loss": 1.0257, + "step": 27900 + }, + { + "epoch": 0.84, + "learning_rate": 3.2614862890939516e-07, + "loss": 1.0452, + "step": 27901 + }, + { + "epoch": 0.84, + "learning_rate": 3.260281765224829e-07, + "loss": 1.0524, + "step": 27902 + }, + { + "epoch": 0.84, + "learning_rate": 3.25907744830736e-07, + "loss": 1.0766, + "step": 27903 + }, + { + "epoch": 0.84, + "learning_rate": 3.257873338352996e-07, + "loss": 1.1868, + "step": 27904 + }, + { + "epoch": 0.84, + "learning_rate": 3.2566694353732054e-07, + "loss": 1.1581, + "step": 27905 + }, + { + "epoch": 0.84, + "learning_rate": 3.2554657393794516e-07, + "loss": 1.0547, + "step": 27906 + }, + { + "epoch": 0.84, + "learning_rate": 3.254262250383192e-07, + "loss": 1.0855, + "step": 27907 + }, + { + "epoch": 0.84, + "learning_rate": 3.253058968395886e-07, + "loss": 1.0632, + "step": 27908 + }, + { + "epoch": 0.84, + "learning_rate": 3.2518558934289816e-07, + "loss": 0.9814, + "step": 27909 + }, + { + "epoch": 0.84, + "learning_rate": 3.250653025493933e-07, + "loss": 1.0945, + "step": 27910 + }, + { + "epoch": 0.84, + "learning_rate": 3.249450364602194e-07, + "loss": 1.2513, + "step": 27911 + }, + { + "epoch": 0.84, + "learning_rate": 3.248247910765218e-07, + "loss": 1.1272, + "step": 27912 + }, + { + "epoch": 0.84, + "learning_rate": 3.247045663994439e-07, + "loss": 1.063, + "step": 27913 + }, + { + "epoch": 0.84, + "learning_rate": 3.245843624301309e-07, + "loss": 1.053, + "step": 27914 + }, + { + "epoch": 0.84, + "learning_rate": 3.24464179169727e-07, + "loss": 1.1428, + "step": 27915 + }, + { + "epoch": 0.84, + "learning_rate": 3.2434401661937703e-07, + "loss": 1.0334, + "step": 27916 + }, + { + "epoch": 0.84, + "learning_rate": 3.2422387478022343e-07, + "loss": 1.1378, + "step": 27917 + }, + { + "epoch": 0.84, + "learning_rate": 3.2410375365341086e-07, + "loss": 1.1412, + "step": 27918 + }, + { + "epoch": 0.84, + "learning_rate": 3.239836532400825e-07, + "loss": 1.0353, + "step": 27919 + }, + { + "epoch": 0.84, + "learning_rate": 3.23863573541382e-07, + "loss": 1.158, + "step": 27920 + }, + { + "epoch": 0.84, + "learning_rate": 3.237435145584525e-07, + "loss": 1.1462, + "step": 27921 + }, + { + "epoch": 0.84, + "learning_rate": 3.2362347629243616e-07, + "loss": 1.1285, + "step": 27922 + }, + { + "epoch": 0.84, + "learning_rate": 3.2350345874447605e-07, + "loss": 0.9736, + "step": 27923 + }, + { + "epoch": 0.84, + "learning_rate": 3.2338346191571476e-07, + "loss": 1.2018, + "step": 27924 + }, + { + "epoch": 0.84, + "learning_rate": 3.232634858072947e-07, + "loss": 1.1505, + "step": 27925 + }, + { + "epoch": 0.84, + "learning_rate": 3.231435304203581e-07, + "loss": 1.1451, + "step": 27926 + }, + { + "epoch": 0.84, + "learning_rate": 3.2302359575604626e-07, + "loss": 1.0567, + "step": 27927 + }, + { + "epoch": 0.84, + "learning_rate": 3.229036818155018e-07, + "loss": 1.2516, + "step": 27928 + }, + { + "epoch": 0.84, + "learning_rate": 3.2278378859986583e-07, + "loss": 1.1739, + "step": 27929 + }, + { + "epoch": 0.84, + "learning_rate": 3.226639161102793e-07, + "loss": 1.1461, + "step": 27930 + }, + { + "epoch": 0.84, + "learning_rate": 3.225440643478836e-07, + "loss": 1.16, + "step": 27931 + }, + { + "epoch": 0.84, + "learning_rate": 3.2242423331382e-07, + "loss": 1.0499, + "step": 27932 + }, + { + "epoch": 0.84, + "learning_rate": 3.223044230092287e-07, + "loss": 1.0629, + "step": 27933 + }, + { + "epoch": 0.84, + "learning_rate": 3.22184633435251e-07, + "loss": 1.0526, + "step": 27934 + }, + { + "epoch": 0.84, + "learning_rate": 3.2206486459302606e-07, + "loss": 1.1321, + "step": 27935 + }, + { + "epoch": 0.84, + "learning_rate": 3.219451164836948e-07, + "loss": 1.0377, + "step": 27936 + }, + { + "epoch": 0.84, + "learning_rate": 3.218253891083972e-07, + "loss": 1.145, + "step": 27937 + }, + { + "epoch": 0.84, + "learning_rate": 3.217056824682732e-07, + "loss": 1.0885, + "step": 27938 + }, + { + "epoch": 0.84, + "learning_rate": 3.215859965644613e-07, + "loss": 1.1053, + "step": 27939 + }, + { + "epoch": 0.84, + "learning_rate": 3.21466331398102e-07, + "loss": 1.0855, + "step": 27940 + }, + { + "epoch": 0.84, + "learning_rate": 3.2134668697033357e-07, + "loss": 1.1257, + "step": 27941 + }, + { + "epoch": 0.84, + "learning_rate": 3.2122706328229613e-07, + "loss": 1.0328, + "step": 27942 + }, + { + "epoch": 0.84, + "learning_rate": 3.211074603351272e-07, + "loss": 1.0823, + "step": 27943 + }, + { + "epoch": 0.84, + "learning_rate": 3.209878781299661e-07, + "loss": 1.0764, + "step": 27944 + }, + { + "epoch": 0.84, + "learning_rate": 3.208683166679505e-07, + "loss": 1.0526, + "step": 27945 + }, + { + "epoch": 0.84, + "learning_rate": 3.2074877595021926e-07, + "loss": 1.026, + "step": 27946 + }, + { + "epoch": 0.84, + "learning_rate": 3.2062925597791063e-07, + "loss": 1.2189, + "step": 27947 + }, + { + "epoch": 0.84, + "learning_rate": 3.205097567521612e-07, + "loss": 1.045, + "step": 27948 + }, + { + "epoch": 0.84, + "learning_rate": 3.2039027827410947e-07, + "loss": 1.0847, + "step": 27949 + }, + { + "epoch": 0.84, + "learning_rate": 3.2027082054489233e-07, + "loss": 1.1205, + "step": 27950 + }, + { + "epoch": 0.84, + "learning_rate": 3.2015138356564723e-07, + "loss": 1.0579, + "step": 27951 + }, + { + "epoch": 0.84, + "learning_rate": 3.20031967337511e-07, + "loss": 1.0905, + "step": 27952 + }, + { + "epoch": 0.84, + "learning_rate": 3.1991257186162083e-07, + "loss": 1.0328, + "step": 27953 + }, + { + "epoch": 0.84, + "learning_rate": 3.197931971391127e-07, + "loss": 1.1481, + "step": 27954 + }, + { + "epoch": 0.84, + "learning_rate": 3.196738431711241e-07, + "loss": 1.0691, + "step": 27955 + }, + { + "epoch": 0.84, + "learning_rate": 3.195545099587896e-07, + "loss": 1.1142, + "step": 27956 + }, + { + "epoch": 0.84, + "learning_rate": 3.1943519750324615e-07, + "loss": 1.1149, + "step": 27957 + }, + { + "epoch": 0.84, + "learning_rate": 3.193159058056297e-07, + "loss": 1.2041, + "step": 27958 + }, + { + "epoch": 0.84, + "learning_rate": 3.1919663486707583e-07, + "loss": 1.0966, + "step": 27959 + }, + { + "epoch": 0.84, + "learning_rate": 3.1907738468871906e-07, + "loss": 1.1276, + "step": 27960 + }, + { + "epoch": 0.84, + "learning_rate": 3.1895815527169553e-07, + "loss": 1.0773, + "step": 27961 + }, + { + "epoch": 0.84, + "learning_rate": 3.188389466171396e-07, + "loss": 1.2846, + "step": 27962 + }, + { + "epoch": 0.84, + "learning_rate": 3.187197587261867e-07, + "loss": 1.0845, + "step": 27963 + }, + { + "epoch": 0.84, + "learning_rate": 3.186005915999715e-07, + "loss": 1.1092, + "step": 27964 + }, + { + "epoch": 0.84, + "learning_rate": 3.184814452396276e-07, + "loss": 1.1783, + "step": 27965 + }, + { + "epoch": 0.84, + "learning_rate": 3.1836231964628984e-07, + "loss": 1.1275, + "step": 27966 + }, + { + "epoch": 0.84, + "learning_rate": 3.1824321482109175e-07, + "loss": 1.0885, + "step": 27967 + }, + { + "epoch": 0.84, + "learning_rate": 3.1812413076516837e-07, + "loss": 1.0565, + "step": 27968 + }, + { + "epoch": 0.84, + "learning_rate": 3.180050674796517e-07, + "loss": 1.0718, + "step": 27969 + }, + { + "epoch": 0.84, + "learning_rate": 3.178860249656759e-07, + "loss": 1.1122, + "step": 27970 + }, + { + "epoch": 0.84, + "learning_rate": 3.177670032243743e-07, + "loss": 1.0318, + "step": 27971 + }, + { + "epoch": 0.84, + "learning_rate": 3.1764800225688036e-07, + "loss": 1.1411, + "step": 27972 + }, + { + "epoch": 0.84, + "learning_rate": 3.1752902206432565e-07, + "loss": 1.1377, + "step": 27973 + }, + { + "epoch": 0.84, + "learning_rate": 3.174100626478438e-07, + "loss": 1.1377, + "step": 27974 + }, + { + "epoch": 0.84, + "learning_rate": 3.172911240085669e-07, + "loss": 1.1857, + "step": 27975 + }, + { + "epoch": 0.84, + "learning_rate": 3.171722061476271e-07, + "loss": 1.0386, + "step": 27976 + }, + { + "epoch": 0.84, + "learning_rate": 3.1705330906615733e-07, + "loss": 1.1161, + "step": 27977 + }, + { + "epoch": 0.84, + "learning_rate": 3.169344327652882e-07, + "loss": 1.0695, + "step": 27978 + }, + { + "epoch": 0.84, + "learning_rate": 3.1681557724615174e-07, + "loss": 1.1572, + "step": 27979 + }, + { + "epoch": 0.84, + "learning_rate": 3.1669674250987965e-07, + "loss": 1.1265, + "step": 27980 + }, + { + "epoch": 0.84, + "learning_rate": 3.165779285576029e-07, + "loss": 0.9874, + "step": 27981 + }, + { + "epoch": 0.84, + "learning_rate": 3.164591353904528e-07, + "loss": 1.0591, + "step": 27982 + }, + { + "epoch": 0.84, + "learning_rate": 3.163403630095602e-07, + "loss": 1.1415, + "step": 27983 + }, + { + "epoch": 0.84, + "learning_rate": 3.1622161141605547e-07, + "loss": 1.0549, + "step": 27984 + }, + { + "epoch": 0.84, + "learning_rate": 3.1610288061107e-07, + "loss": 1.1494, + "step": 27985 + }, + { + "epoch": 0.84, + "learning_rate": 3.1598417059573255e-07, + "loss": 1.1346, + "step": 27986 + }, + { + "epoch": 0.84, + "learning_rate": 3.1586548137117397e-07, + "loss": 1.1801, + "step": 27987 + }, + { + "epoch": 0.84, + "learning_rate": 3.157468129385241e-07, + "loss": 1.0693, + "step": 27988 + }, + { + "epoch": 0.84, + "learning_rate": 3.156281652989127e-07, + "loss": 1.0728, + "step": 27989 + }, + { + "epoch": 0.84, + "learning_rate": 3.1550953845346953e-07, + "loss": 1.1296, + "step": 27990 + }, + { + "epoch": 0.84, + "learning_rate": 3.15390932403323e-07, + "loss": 1.0467, + "step": 27991 + }, + { + "epoch": 0.84, + "learning_rate": 3.1527234714960273e-07, + "loss": 1.062, + "step": 27992 + }, + { + "epoch": 0.84, + "learning_rate": 3.1515378269343757e-07, + "loss": 1.1355, + "step": 27993 + }, + { + "epoch": 0.84, + "learning_rate": 3.1503523903595653e-07, + "loss": 1.1642, + "step": 27994 + }, + { + "epoch": 0.84, + "learning_rate": 3.149167161782873e-07, + "loss": 1.0737, + "step": 27995 + }, + { + "epoch": 0.84, + "learning_rate": 3.147982141215583e-07, + "loss": 1.11, + "step": 27996 + }, + { + "epoch": 0.84, + "learning_rate": 3.14679732866898e-07, + "loss": 1.0153, + "step": 27997 + }, + { + "epoch": 0.84, + "learning_rate": 3.145612724154348e-07, + "loss": 1.0585, + "step": 27998 + }, + { + "epoch": 0.84, + "learning_rate": 3.1444283276829526e-07, + "loss": 1.1321, + "step": 27999 + }, + { + "epoch": 0.84, + "learning_rate": 3.143244139266072e-07, + "loss": 1.1143, + "step": 28000 + }, + { + "epoch": 0.84, + "learning_rate": 3.1420601589149805e-07, + "loss": 1.1266, + "step": 28001 + }, + { + "epoch": 0.84, + "learning_rate": 3.1408763866409483e-07, + "loss": 1.2385, + "step": 28002 + }, + { + "epoch": 0.84, + "learning_rate": 3.1396928224552535e-07, + "loss": 1.0533, + "step": 28003 + }, + { + "epoch": 0.84, + "learning_rate": 3.138509466369147e-07, + "loss": 1.0089, + "step": 28004 + }, + { + "epoch": 0.84, + "learning_rate": 3.137326318393902e-07, + "loss": 1.1998, + "step": 28005 + }, + { + "epoch": 0.84, + "learning_rate": 3.1361433785407817e-07, + "loss": 1.2055, + "step": 28006 + }, + { + "epoch": 0.84, + "learning_rate": 3.1349606468210447e-07, + "loss": 1.098, + "step": 28007 + }, + { + "epoch": 0.84, + "learning_rate": 3.1337781232459533e-07, + "loss": 0.9962, + "step": 28008 + }, + { + "epoch": 0.84, + "learning_rate": 3.1325958078267634e-07, + "loss": 1.0497, + "step": 28009 + }, + { + "epoch": 0.84, + "learning_rate": 3.131413700574729e-07, + "loss": 1.0627, + "step": 28010 + }, + { + "epoch": 0.84, + "learning_rate": 3.1302318015011073e-07, + "loss": 1.1279, + "step": 28011 + }, + { + "epoch": 0.84, + "learning_rate": 3.129050110617143e-07, + "loss": 1.0939, + "step": 28012 + }, + { + "epoch": 0.84, + "learning_rate": 3.1278686279340886e-07, + "loss": 1.0846, + "step": 28013 + }, + { + "epoch": 0.84, + "learning_rate": 3.1266873534631897e-07, + "loss": 1.1572, + "step": 28014 + }, + { + "epoch": 0.84, + "learning_rate": 3.1255062872156935e-07, + "loss": 1.0245, + "step": 28015 + }, + { + "epoch": 0.84, + "learning_rate": 3.1243254292028484e-07, + "loss": 1.0068, + "step": 28016 + }, + { + "epoch": 0.84, + "learning_rate": 3.1231447794358825e-07, + "loss": 1.1128, + "step": 28017 + }, + { + "epoch": 0.84, + "learning_rate": 3.1219643379260423e-07, + "loss": 1.1712, + "step": 28018 + }, + { + "epoch": 0.84, + "learning_rate": 3.120784104684565e-07, + "loss": 1.1489, + "step": 28019 + }, + { + "epoch": 0.84, + "learning_rate": 3.119604079722691e-07, + "loss": 1.1462, + "step": 28020 + }, + { + "epoch": 0.84, + "learning_rate": 3.118424263051642e-07, + "loss": 1.2778, + "step": 28021 + }, + { + "epoch": 0.84, + "learning_rate": 3.117244654682658e-07, + "loss": 1.0411, + "step": 28022 + }, + { + "epoch": 0.84, + "learning_rate": 3.1160652546269626e-07, + "loss": 1.1298, + "step": 28023 + }, + { + "epoch": 0.84, + "learning_rate": 3.1148860628957946e-07, + "loss": 1.0364, + "step": 28024 + }, + { + "epoch": 0.84, + "learning_rate": 3.113707079500364e-07, + "loss": 1.2631, + "step": 28025 + }, + { + "epoch": 0.84, + "learning_rate": 3.1125283044519007e-07, + "loss": 1.1685, + "step": 28026 + }, + { + "epoch": 0.84, + "learning_rate": 3.111349737761629e-07, + "loss": 1.0352, + "step": 28027 + }, + { + "epoch": 0.84, + "learning_rate": 3.110171379440763e-07, + "loss": 1.0295, + "step": 28028 + }, + { + "epoch": 0.84, + "learning_rate": 3.108993229500529e-07, + "loss": 1.1377, + "step": 28029 + }, + { + "epoch": 0.84, + "learning_rate": 3.107815287952132e-07, + "loss": 1.0836, + "step": 28030 + }, + { + "epoch": 0.84, + "learning_rate": 3.1066375548067904e-07, + "loss": 1.2242, + "step": 28031 + }, + { + "epoch": 0.84, + "learning_rate": 3.105460030075713e-07, + "loss": 1.0745, + "step": 28032 + }, + { + "epoch": 0.84, + "learning_rate": 3.104282713770113e-07, + "loss": 1.1165, + "step": 28033 + }, + { + "epoch": 0.84, + "learning_rate": 3.1031056059011965e-07, + "loss": 1.0506, + "step": 28034 + }, + { + "epoch": 0.84, + "learning_rate": 3.101928706480167e-07, + "loss": 1.1257, + "step": 28035 + }, + { + "epoch": 0.84, + "learning_rate": 3.1007520155182295e-07, + "loss": 1.1542, + "step": 28036 + }, + { + "epoch": 0.84, + "learning_rate": 3.099575533026594e-07, + "loss": 1.0015, + "step": 28037 + }, + { + "epoch": 0.84, + "learning_rate": 3.0983992590164436e-07, + "loss": 1.2073, + "step": 28038 + }, + { + "epoch": 0.84, + "learning_rate": 3.0972231934989856e-07, + "loss": 1.1226, + "step": 28039 + }, + { + "epoch": 0.84, + "learning_rate": 3.096047336485414e-07, + "loss": 0.9817, + "step": 28040 + }, + { + "epoch": 0.84, + "learning_rate": 3.0948716879869225e-07, + "loss": 1.1327, + "step": 28041 + }, + { + "epoch": 0.84, + "learning_rate": 3.0936962480147076e-07, + "loss": 1.1753, + "step": 28042 + }, + { + "epoch": 0.84, + "learning_rate": 3.09252101657995e-07, + "loss": 1.1091, + "step": 28043 + }, + { + "epoch": 0.84, + "learning_rate": 3.0913459936938394e-07, + "loss": 1.1404, + "step": 28044 + }, + { + "epoch": 0.84, + "learning_rate": 3.0901711793675626e-07, + "loss": 1.0771, + "step": 28045 + }, + { + "epoch": 0.84, + "learning_rate": 3.08899657361231e-07, + "loss": 1.0786, + "step": 28046 + }, + { + "epoch": 0.84, + "learning_rate": 3.0878221764392534e-07, + "loss": 1.0963, + "step": 28047 + }, + { + "epoch": 0.84, + "learning_rate": 3.086647987859576e-07, + "loss": 1.0471, + "step": 28048 + }, + { + "epoch": 0.84, + "learning_rate": 3.085474007884456e-07, + "loss": 1.0833, + "step": 28049 + }, + { + "epoch": 0.85, + "learning_rate": 3.0843002365250727e-07, + "loss": 1.1519, + "step": 28050 + }, + { + "epoch": 0.85, + "learning_rate": 3.083126673792594e-07, + "loss": 1.148, + "step": 28051 + }, + { + "epoch": 0.85, + "learning_rate": 3.0819533196981913e-07, + "loss": 1.0729, + "step": 28052 + }, + { + "epoch": 0.85, + "learning_rate": 3.080780174253037e-07, + "loss": 1.0291, + "step": 28053 + }, + { + "epoch": 0.85, + "learning_rate": 3.0796072374683016e-07, + "loss": 1.0524, + "step": 28054 + }, + { + "epoch": 0.85, + "learning_rate": 3.078434509355149e-07, + "loss": 1.1837, + "step": 28055 + }, + { + "epoch": 0.85, + "learning_rate": 3.07726198992474e-07, + "loss": 1.0975, + "step": 28056 + }, + { + "epoch": 0.85, + "learning_rate": 3.0760896791882375e-07, + "loss": 1.1211, + "step": 28057 + }, + { + "epoch": 0.85, + "learning_rate": 3.0749175771568024e-07, + "loss": 1.1235, + "step": 28058 + }, + { + "epoch": 0.85, + "learning_rate": 3.0737456838415976e-07, + "loss": 1.1372, + "step": 28059 + }, + { + "epoch": 0.85, + "learning_rate": 3.0725739992537693e-07, + "loss": 1.0845, + "step": 28060 + }, + { + "epoch": 0.85, + "learning_rate": 3.0714025234044737e-07, + "loss": 1.0264, + "step": 28061 + }, + { + "epoch": 0.85, + "learning_rate": 3.0702312563048676e-07, + "loss": 1.1651, + "step": 28062 + }, + { + "epoch": 0.85, + "learning_rate": 3.0690601979660976e-07, + "loss": 1.0203, + "step": 28063 + }, + { + "epoch": 0.85, + "learning_rate": 3.067889348399311e-07, + "loss": 1.0773, + "step": 28064 + }, + { + "epoch": 0.85, + "learning_rate": 3.0667187076156567e-07, + "loss": 1.0975, + "step": 28065 + }, + { + "epoch": 0.85, + "learning_rate": 3.0655482756262733e-07, + "loss": 1.0532, + "step": 28066 + }, + { + "epoch": 0.85, + "learning_rate": 3.06437805244231e-07, + "loss": 1.1826, + "step": 28067 + }, + { + "epoch": 0.85, + "learning_rate": 3.063208038074908e-07, + "loss": 1.0073, + "step": 28068 + }, + { + "epoch": 0.85, + "learning_rate": 3.062038232535194e-07, + "loss": 1.0081, + "step": 28069 + }, + { + "epoch": 0.85, + "learning_rate": 3.06086863583431e-07, + "loss": 1.088, + "step": 28070 + }, + { + "epoch": 0.85, + "learning_rate": 3.0596992479833916e-07, + "loss": 1.191, + "step": 28071 + }, + { + "epoch": 0.85, + "learning_rate": 3.058530068993573e-07, + "loss": 0.9952, + "step": 28072 + }, + { + "epoch": 0.85, + "learning_rate": 3.0573610988759773e-07, + "loss": 1.1183, + "step": 28073 + }, + { + "epoch": 0.85, + "learning_rate": 3.056192337641736e-07, + "loss": 1.1865, + "step": 28074 + }, + { + "epoch": 0.85, + "learning_rate": 3.055023785301975e-07, + "loss": 1.1688, + "step": 28075 + }, + { + "epoch": 0.85, + "learning_rate": 3.053855441867823e-07, + "loss": 1.1147, + "step": 28076 + }, + { + "epoch": 0.85, + "learning_rate": 3.052687307350391e-07, + "loss": 0.9668, + "step": 28077 + }, + { + "epoch": 0.85, + "learning_rate": 3.051519381760809e-07, + "loss": 1.2476, + "step": 28078 + }, + { + "epoch": 0.85, + "learning_rate": 3.0503516651101876e-07, + "loss": 1.0544, + "step": 28079 + }, + { + "epoch": 0.85, + "learning_rate": 3.0491841574096513e-07, + "loss": 1.1953, + "step": 28080 + }, + { + "epoch": 0.85, + "learning_rate": 3.0480168586703134e-07, + "loss": 1.119, + "step": 28081 + }, + { + "epoch": 0.85, + "learning_rate": 3.046849768903276e-07, + "loss": 1.1643, + "step": 28082 + }, + { + "epoch": 0.85, + "learning_rate": 3.045682888119658e-07, + "loss": 1.0573, + "step": 28083 + }, + { + "epoch": 0.85, + "learning_rate": 3.044516216330565e-07, + "loss": 1.1902, + "step": 28084 + }, + { + "epoch": 0.85, + "learning_rate": 3.0433497535471063e-07, + "loss": 1.0936, + "step": 28085 + }, + { + "epoch": 0.85, + "learning_rate": 3.04218349978038e-07, + "loss": 1.1861, + "step": 28086 + }, + { + "epoch": 0.85, + "learning_rate": 3.041017455041492e-07, + "loss": 1.116, + "step": 28087 + }, + { + "epoch": 0.85, + "learning_rate": 3.0398516193415413e-07, + "loss": 1.0013, + "step": 28088 + }, + { + "epoch": 0.85, + "learning_rate": 3.038685992691626e-07, + "loss": 1.1285, + "step": 28089 + }, + { + "epoch": 0.85, + "learning_rate": 3.037520575102845e-07, + "loss": 1.0474, + "step": 28090 + }, + { + "epoch": 0.85, + "learning_rate": 3.0363553665862883e-07, + "loss": 1.0347, + "step": 28091 + }, + { + "epoch": 0.85, + "learning_rate": 3.035190367153054e-07, + "loss": 1.1811, + "step": 28092 + }, + { + "epoch": 0.85, + "learning_rate": 3.034025576814226e-07, + "loss": 1.1254, + "step": 28093 + }, + { + "epoch": 0.85, + "learning_rate": 3.0328609955808994e-07, + "loss": 1.1018, + "step": 28094 + }, + { + "epoch": 0.85, + "learning_rate": 3.031696623464153e-07, + "loss": 1.1348, + "step": 28095 + }, + { + "epoch": 0.85, + "learning_rate": 3.0305324604750746e-07, + "loss": 1.064, + "step": 28096 + }, + { + "epoch": 0.85, + "learning_rate": 3.029368506624747e-07, + "loss": 1.1095, + "step": 28097 + }, + { + "epoch": 0.85, + "learning_rate": 3.028204761924253e-07, + "loss": 1.1265, + "step": 28098 + }, + { + "epoch": 0.85, + "learning_rate": 3.027041226384664e-07, + "loss": 1.152, + "step": 28099 + }, + { + "epoch": 0.85, + "learning_rate": 3.02587790001706e-07, + "loss": 1.1545, + "step": 28100 + }, + { + "epoch": 0.85, + "learning_rate": 3.0247147828325136e-07, + "loss": 1.0806, + "step": 28101 + }, + { + "epoch": 0.85, + "learning_rate": 3.0235518748421065e-07, + "loss": 0.9888, + "step": 28102 + }, + { + "epoch": 0.85, + "learning_rate": 3.0223891760568946e-07, + "loss": 1.0217, + "step": 28103 + }, + { + "epoch": 0.85, + "learning_rate": 3.0212266864879547e-07, + "loss": 1.1685, + "step": 28104 + }, + { + "epoch": 0.85, + "learning_rate": 3.0200644061463473e-07, + "loss": 1.015, + "step": 28105 + }, + { + "epoch": 0.85, + "learning_rate": 3.018902335043145e-07, + "loss": 1.1129, + "step": 28106 + }, + { + "epoch": 0.85, + "learning_rate": 3.0177404731894094e-07, + "loss": 1.046, + "step": 28107 + }, + { + "epoch": 0.85, + "learning_rate": 3.0165788205961916e-07, + "loss": 1.1242, + "step": 28108 + }, + { + "epoch": 0.85, + "learning_rate": 3.015417377274557e-07, + "loss": 1.2508, + "step": 28109 + }, + { + "epoch": 0.85, + "learning_rate": 3.014256143235561e-07, + "loss": 1.1237, + "step": 28110 + }, + { + "epoch": 0.85, + "learning_rate": 3.013095118490264e-07, + "loss": 1.0407, + "step": 28111 + }, + { + "epoch": 0.85, + "learning_rate": 3.0119343030497047e-07, + "loss": 1.2417, + "step": 28112 + }, + { + "epoch": 0.85, + "learning_rate": 3.010773696924943e-07, + "loss": 0.9946, + "step": 28113 + }, + { + "epoch": 0.85, + "learning_rate": 3.0096133001270234e-07, + "loss": 1.1058, + "step": 28114 + }, + { + "epoch": 0.85, + "learning_rate": 3.0084531126669953e-07, + "loss": 1.0358, + "step": 28115 + }, + { + "epoch": 0.85, + "learning_rate": 3.0072931345559024e-07, + "loss": 1.0236, + "step": 28116 + }, + { + "epoch": 0.85, + "learning_rate": 3.0061333658047863e-07, + "loss": 1.0366, + "step": 28117 + }, + { + "epoch": 0.85, + "learning_rate": 3.004973806424688e-07, + "loss": 1.1317, + "step": 28118 + }, + { + "epoch": 0.85, + "learning_rate": 3.003814456426646e-07, + "loss": 1.1576, + "step": 28119 + }, + { + "epoch": 0.85, + "learning_rate": 3.002655315821701e-07, + "loss": 1.139, + "step": 28120 + }, + { + "epoch": 0.85, + "learning_rate": 3.0014963846208777e-07, + "loss": 1.0001, + "step": 28121 + }, + { + "epoch": 0.85, + "learning_rate": 3.000337662835215e-07, + "loss": 1.1055, + "step": 28122 + }, + { + "epoch": 0.85, + "learning_rate": 2.9991791504757425e-07, + "loss": 1.0667, + "step": 28123 + }, + { + "epoch": 0.85, + "learning_rate": 2.9980208475534953e-07, + "loss": 1.0682, + "step": 28124 + }, + { + "epoch": 0.85, + "learning_rate": 2.9968627540794853e-07, + "loss": 1.1515, + "step": 28125 + }, + { + "epoch": 0.85, + "learning_rate": 2.9957048700647445e-07, + "loss": 1.0497, + "step": 28126 + }, + { + "epoch": 0.85, + "learning_rate": 2.9945471955202976e-07, + "loss": 1.0543, + "step": 28127 + }, + { + "epoch": 0.85, + "learning_rate": 2.993389730457169e-07, + "loss": 1.1615, + "step": 28128 + }, + { + "epoch": 0.85, + "learning_rate": 2.992232474886364e-07, + "loss": 1.1188, + "step": 28129 + }, + { + "epoch": 0.85, + "learning_rate": 2.991075428818907e-07, + "loss": 0.9384, + "step": 28130 + }, + { + "epoch": 0.85, + "learning_rate": 2.9899185922658113e-07, + "loss": 1.104, + "step": 28131 + }, + { + "epoch": 0.85, + "learning_rate": 2.9887619652380936e-07, + "loss": 1.1022, + "step": 28132 + }, + { + "epoch": 0.85, + "learning_rate": 2.987605547746764e-07, + "loss": 1.0716, + "step": 28133 + }, + { + "epoch": 0.85, + "learning_rate": 2.9864493398028217e-07, + "loss": 1.1304, + "step": 28134 + }, + { + "epoch": 0.85, + "learning_rate": 2.985293341417281e-07, + "loss": 1.2184, + "step": 28135 + }, + { + "epoch": 0.85, + "learning_rate": 2.9841375526011434e-07, + "loss": 1.2015, + "step": 28136 + }, + { + "epoch": 0.85, + "learning_rate": 2.98298197336542e-07, + "loss": 1.0731, + "step": 28137 + }, + { + "epoch": 0.85, + "learning_rate": 2.9818266037211e-07, + "loss": 1.0999, + "step": 28138 + }, + { + "epoch": 0.85, + "learning_rate": 2.980671443679184e-07, + "loss": 1.0555, + "step": 28139 + }, + { + "epoch": 0.85, + "learning_rate": 2.9795164932506725e-07, + "loss": 1.0602, + "step": 28140 + }, + { + "epoch": 0.85, + "learning_rate": 2.9783617524465596e-07, + "loss": 1.0909, + "step": 28141 + }, + { + "epoch": 0.85, + "learning_rate": 2.977207221277839e-07, + "loss": 1.2069, + "step": 28142 + }, + { + "epoch": 0.85, + "learning_rate": 2.9760528997554964e-07, + "loss": 1.1588, + "step": 28143 + }, + { + "epoch": 0.85, + "learning_rate": 2.9748987878905236e-07, + "loss": 1.1381, + "step": 28144 + }, + { + "epoch": 0.85, + "learning_rate": 2.9737448856939047e-07, + "loss": 1.0516, + "step": 28145 + }, + { + "epoch": 0.85, + "learning_rate": 2.972591193176627e-07, + "loss": 1.1454, + "step": 28146 + }, + { + "epoch": 0.85, + "learning_rate": 2.9714377103496726e-07, + "loss": 1.1255, + "step": 28147 + }, + { + "epoch": 0.85, + "learning_rate": 2.970284437224022e-07, + "loss": 1.0588, + "step": 28148 + }, + { + "epoch": 0.85, + "learning_rate": 2.969131373810652e-07, + "loss": 1.1084, + "step": 28149 + }, + { + "epoch": 0.85, + "learning_rate": 2.9679785201205487e-07, + "loss": 1.0369, + "step": 28150 + }, + { + "epoch": 0.85, + "learning_rate": 2.9668258761646724e-07, + "loss": 1.1824, + "step": 28151 + }, + { + "epoch": 0.85, + "learning_rate": 2.9656734419540035e-07, + "loss": 1.0947, + "step": 28152 + }, + { + "epoch": 0.85, + "learning_rate": 2.964521217499508e-07, + "loss": 1.0737, + "step": 28153 + }, + { + "epoch": 0.85, + "learning_rate": 2.9633692028121665e-07, + "loss": 1.1717, + "step": 28154 + }, + { + "epoch": 0.85, + "learning_rate": 2.9622173979029307e-07, + "loss": 1.2395, + "step": 28155 + }, + { + "epoch": 0.85, + "learning_rate": 2.96106580278277e-07, + "loss": 1.0382, + "step": 28156 + }, + { + "epoch": 0.85, + "learning_rate": 2.95991441746265e-07, + "loss": 1.1346, + "step": 28157 + }, + { + "epoch": 0.85, + "learning_rate": 2.9587632419535357e-07, + "loss": 1.2074, + "step": 28158 + }, + { + "epoch": 0.85, + "learning_rate": 2.957612276266375e-07, + "loss": 1.0839, + "step": 28159 + }, + { + "epoch": 0.85, + "learning_rate": 2.9564615204121265e-07, + "loss": 1.1218, + "step": 28160 + }, + { + "epoch": 0.85, + "learning_rate": 2.9553109744017513e-07, + "loss": 1.1387, + "step": 28161 + }, + { + "epoch": 0.85, + "learning_rate": 2.954160638246195e-07, + "loss": 1.0483, + "step": 28162 + }, + { + "epoch": 0.85, + "learning_rate": 2.9530105119564196e-07, + "loss": 0.9904, + "step": 28163 + }, + { + "epoch": 0.85, + "learning_rate": 2.95186059554336e-07, + "loss": 1.1125, + "step": 28164 + }, + { + "epoch": 0.85, + "learning_rate": 2.9507108890179684e-07, + "loss": 1.0452, + "step": 28165 + }, + { + "epoch": 0.85, + "learning_rate": 2.94956139239119e-07, + "loss": 1.1174, + "step": 28166 + }, + { + "epoch": 0.85, + "learning_rate": 2.948412105673973e-07, + "loss": 1.0324, + "step": 28167 + }, + { + "epoch": 0.85, + "learning_rate": 2.947263028877248e-07, + "loss": 1.2671, + "step": 28168 + }, + { + "epoch": 0.85, + "learning_rate": 2.9461141620119565e-07, + "loss": 0.9808, + "step": 28169 + }, + { + "epoch": 0.85, + "learning_rate": 2.9449655050890367e-07, + "loss": 1.1611, + "step": 28170 + }, + { + "epoch": 0.85, + "learning_rate": 2.943817058119425e-07, + "loss": 1.0605, + "step": 28171 + }, + { + "epoch": 0.85, + "learning_rate": 2.94266882111405e-07, + "loss": 1.1025, + "step": 28172 + }, + { + "epoch": 0.85, + "learning_rate": 2.9415207940838465e-07, + "loss": 1.1418, + "step": 28173 + }, + { + "epoch": 0.85, + "learning_rate": 2.940372977039738e-07, + "loss": 1.1409, + "step": 28174 + }, + { + "epoch": 0.85, + "learning_rate": 2.939225369992657e-07, + "loss": 1.0959, + "step": 28175 + }, + { + "epoch": 0.85, + "learning_rate": 2.938077972953532e-07, + "loss": 1.0675, + "step": 28176 + }, + { + "epoch": 0.85, + "learning_rate": 2.936930785933273e-07, + "loss": 1.0073, + "step": 28177 + }, + { + "epoch": 0.85, + "learning_rate": 2.9357838089428046e-07, + "loss": 1.0732, + "step": 28178 + }, + { + "epoch": 0.85, + "learning_rate": 2.934637041993052e-07, + "loss": 1.1065, + "step": 28179 + }, + { + "epoch": 0.85, + "learning_rate": 2.933490485094931e-07, + "loss": 1.2239, + "step": 28180 + }, + { + "epoch": 0.85, + "learning_rate": 2.9323441382593463e-07, + "loss": 1.1542, + "step": 28181 + }, + { + "epoch": 0.85, + "learning_rate": 2.931198001497218e-07, + "loss": 1.0036, + "step": 28182 + }, + { + "epoch": 0.85, + "learning_rate": 2.930052074819459e-07, + "loss": 1.0504, + "step": 28183 + }, + { + "epoch": 0.85, + "learning_rate": 2.928906358236977e-07, + "loss": 1.0989, + "step": 28184 + }, + { + "epoch": 0.85, + "learning_rate": 2.927760851760672e-07, + "loss": 1.0188, + "step": 28185 + }, + { + "epoch": 0.85, + "learning_rate": 2.9266155554014545e-07, + "loss": 0.9976, + "step": 28186 + }, + { + "epoch": 0.85, + "learning_rate": 2.9254704691702247e-07, + "loss": 1.1287, + "step": 28187 + }, + { + "epoch": 0.85, + "learning_rate": 2.924325593077884e-07, + "loss": 1.0016, + "step": 28188 + }, + { + "epoch": 0.85, + "learning_rate": 2.9231809271353386e-07, + "loss": 1.1458, + "step": 28189 + }, + { + "epoch": 0.85, + "learning_rate": 2.922036471353473e-07, + "loss": 1.0774, + "step": 28190 + }, + { + "epoch": 0.85, + "learning_rate": 2.9208922257431857e-07, + "loss": 1.0683, + "step": 28191 + }, + { + "epoch": 0.85, + "learning_rate": 2.919748190315372e-07, + "loss": 1.0134, + "step": 28192 + }, + { + "epoch": 0.85, + "learning_rate": 2.918604365080927e-07, + "loss": 1.1623, + "step": 28193 + }, + { + "epoch": 0.85, + "learning_rate": 2.9174607500507267e-07, + "loss": 1.1942, + "step": 28194 + }, + { + "epoch": 0.85, + "learning_rate": 2.9163173452356643e-07, + "loss": 1.1013, + "step": 28195 + }, + { + "epoch": 0.85, + "learning_rate": 2.915174150646627e-07, + "loss": 1.1118, + "step": 28196 + }, + { + "epoch": 0.85, + "learning_rate": 2.9140311662944924e-07, + "loss": 1.1407, + "step": 28197 + }, + { + "epoch": 0.85, + "learning_rate": 2.912888392190147e-07, + "loss": 1.0782, + "step": 28198 + }, + { + "epoch": 0.85, + "learning_rate": 2.911745828344467e-07, + "loss": 1.1509, + "step": 28199 + }, + { + "epoch": 0.85, + "learning_rate": 2.9106034747683254e-07, + "loss": 1.2404, + "step": 28200 + }, + { + "epoch": 0.85, + "learning_rate": 2.9094613314726043e-07, + "loss": 1.0649, + "step": 28201 + }, + { + "epoch": 0.85, + "learning_rate": 2.9083193984681733e-07, + "loss": 1.0929, + "step": 28202 + }, + { + "epoch": 0.85, + "learning_rate": 2.907177675765899e-07, + "loss": 1.1238, + "step": 28203 + }, + { + "epoch": 0.85, + "learning_rate": 2.906036163376652e-07, + "loss": 1.027, + "step": 28204 + }, + { + "epoch": 0.85, + "learning_rate": 2.9048948613113027e-07, + "loss": 1.1071, + "step": 28205 + }, + { + "epoch": 0.85, + "learning_rate": 2.903753769580714e-07, + "loss": 1.1077, + "step": 28206 + }, + { + "epoch": 0.85, + "learning_rate": 2.902612888195744e-07, + "loss": 1.0928, + "step": 28207 + }, + { + "epoch": 0.85, + "learning_rate": 2.901472217167259e-07, + "loss": 1.0523, + "step": 28208 + }, + { + "epoch": 0.85, + "learning_rate": 2.9003317565061113e-07, + "loss": 1.0087, + "step": 28209 + }, + { + "epoch": 0.85, + "learning_rate": 2.89919150622317e-07, + "loss": 1.1761, + "step": 28210 + }, + { + "epoch": 0.85, + "learning_rate": 2.898051466329274e-07, + "loss": 1.1418, + "step": 28211 + }, + { + "epoch": 0.85, + "learning_rate": 2.896911636835287e-07, + "loss": 0.9873, + "step": 28212 + }, + { + "epoch": 0.85, + "learning_rate": 2.8957720177520523e-07, + "loss": 1.0245, + "step": 28213 + }, + { + "epoch": 0.85, + "learning_rate": 2.8946326090904255e-07, + "loss": 1.2134, + "step": 28214 + }, + { + "epoch": 0.85, + "learning_rate": 2.8934934108612533e-07, + "loss": 1.0551, + "step": 28215 + }, + { + "epoch": 0.85, + "learning_rate": 2.892354423075369e-07, + "loss": 1.0933, + "step": 28216 + }, + { + "epoch": 0.85, + "learning_rate": 2.891215645743628e-07, + "loss": 1.2004, + "step": 28217 + }, + { + "epoch": 0.85, + "learning_rate": 2.890077078876863e-07, + "loss": 1.2139, + "step": 28218 + }, + { + "epoch": 0.85, + "learning_rate": 2.888938722485923e-07, + "loss": 1.0839, + "step": 28219 + }, + { + "epoch": 0.85, + "learning_rate": 2.8878005765816315e-07, + "loss": 1.1042, + "step": 28220 + }, + { + "epoch": 0.85, + "learning_rate": 2.8866626411748284e-07, + "loss": 1.1448, + "step": 28221 + }, + { + "epoch": 0.85, + "learning_rate": 2.885524916276347e-07, + "loss": 1.025, + "step": 28222 + }, + { + "epoch": 0.85, + "learning_rate": 2.884387401897018e-07, + "loss": 1.0132, + "step": 28223 + }, + { + "epoch": 0.85, + "learning_rate": 2.883250098047674e-07, + "loss": 1.1605, + "step": 28224 + }, + { + "epoch": 0.85, + "learning_rate": 2.8821130047391315e-07, + "loss": 1.0558, + "step": 28225 + }, + { + "epoch": 0.85, + "learning_rate": 2.8809761219822234e-07, + "loss": 1.1545, + "step": 28226 + }, + { + "epoch": 0.85, + "learning_rate": 2.879839449787766e-07, + "loss": 1.0895, + "step": 28227 + }, + { + "epoch": 0.85, + "learning_rate": 2.8787029881665873e-07, + "loss": 1.1053, + "step": 28228 + }, + { + "epoch": 0.85, + "learning_rate": 2.8775667371295e-07, + "loss": 1.1146, + "step": 28229 + }, + { + "epoch": 0.85, + "learning_rate": 2.876430696687324e-07, + "loss": 1.1732, + "step": 28230 + }, + { + "epoch": 0.85, + "learning_rate": 2.8752948668508726e-07, + "loss": 1.0701, + "step": 28231 + }, + { + "epoch": 0.85, + "learning_rate": 2.8741592476309616e-07, + "loss": 1.0735, + "step": 28232 + }, + { + "epoch": 0.85, + "learning_rate": 2.873023839038397e-07, + "loss": 1.0452, + "step": 28233 + }, + { + "epoch": 0.85, + "learning_rate": 2.8718886410839865e-07, + "loss": 1.053, + "step": 28234 + }, + { + "epoch": 0.85, + "learning_rate": 2.870753653778538e-07, + "loss": 1.1575, + "step": 28235 + }, + { + "epoch": 0.85, + "learning_rate": 2.8696188771328627e-07, + "loss": 1.162, + "step": 28236 + }, + { + "epoch": 0.85, + "learning_rate": 2.868484311157754e-07, + "loss": 1.1573, + "step": 28237 + }, + { + "epoch": 0.85, + "learning_rate": 2.8673499558640127e-07, + "loss": 1.0412, + "step": 28238 + }, + { + "epoch": 0.85, + "learning_rate": 2.866215811262443e-07, + "loss": 1.0794, + "step": 28239 + }, + { + "epoch": 0.85, + "learning_rate": 2.8650818773638374e-07, + "loss": 1.1053, + "step": 28240 + }, + { + "epoch": 0.85, + "learning_rate": 2.863948154178997e-07, + "loss": 1.1133, + "step": 28241 + }, + { + "epoch": 0.85, + "learning_rate": 2.8628146417187057e-07, + "loss": 1.2199, + "step": 28242 + }, + { + "epoch": 0.85, + "learning_rate": 2.861681339993755e-07, + "loss": 1.0455, + "step": 28243 + }, + { + "epoch": 0.85, + "learning_rate": 2.8605482490149354e-07, + "loss": 1.0856, + "step": 28244 + }, + { + "epoch": 0.85, + "learning_rate": 2.859415368793042e-07, + "loss": 0.9975, + "step": 28245 + }, + { + "epoch": 0.85, + "learning_rate": 2.8582826993388435e-07, + "loss": 1.0355, + "step": 28246 + }, + { + "epoch": 0.85, + "learning_rate": 2.8571502406631315e-07, + "loss": 1.0546, + "step": 28247 + }, + { + "epoch": 0.85, + "learning_rate": 2.856017992776683e-07, + "loss": 1.1739, + "step": 28248 + }, + { + "epoch": 0.85, + "learning_rate": 2.854885955690284e-07, + "loss": 1.1338, + "step": 28249 + }, + { + "epoch": 0.85, + "learning_rate": 2.853754129414699e-07, + "loss": 1.0829, + "step": 28250 + }, + { + "epoch": 0.85, + "learning_rate": 2.852622513960709e-07, + "loss": 1.0977, + "step": 28251 + }, + { + "epoch": 0.85, + "learning_rate": 2.8514911093390886e-07, + "loss": 1.0366, + "step": 28252 + }, + { + "epoch": 0.85, + "learning_rate": 2.850359915560605e-07, + "loss": 0.9763, + "step": 28253 + }, + { + "epoch": 0.85, + "learning_rate": 2.8492289326360253e-07, + "loss": 1.0554, + "step": 28254 + }, + { + "epoch": 0.85, + "learning_rate": 2.848098160576121e-07, + "loss": 1.1567, + "step": 28255 + }, + { + "epoch": 0.85, + "learning_rate": 2.846967599391651e-07, + "loss": 1.0314, + "step": 28256 + }, + { + "epoch": 0.85, + "learning_rate": 2.845837249093381e-07, + "loss": 1.0826, + "step": 28257 + }, + { + "epoch": 0.85, + "learning_rate": 2.844707109692077e-07, + "loss": 1.1068, + "step": 28258 + }, + { + "epoch": 0.85, + "learning_rate": 2.843577181198484e-07, + "loss": 1.0549, + "step": 28259 + }, + { + "epoch": 0.85, + "learning_rate": 2.842447463623366e-07, + "loss": 1.1876, + "step": 28260 + }, + { + "epoch": 0.85, + "learning_rate": 2.8413179569774767e-07, + "loss": 1.2665, + "step": 28261 + }, + { + "epoch": 0.85, + "learning_rate": 2.840188661271573e-07, + "loss": 1.2118, + "step": 28262 + }, + { + "epoch": 0.85, + "learning_rate": 2.8390595765163955e-07, + "loss": 1.1055, + "step": 28263 + }, + { + "epoch": 0.85, + "learning_rate": 2.8379307027226995e-07, + "loss": 1.1274, + "step": 28264 + }, + { + "epoch": 0.85, + "learning_rate": 2.8368020399012265e-07, + "loss": 1.1735, + "step": 28265 + }, + { + "epoch": 0.85, + "learning_rate": 2.835673588062726e-07, + "loss": 1.1011, + "step": 28266 + }, + { + "epoch": 0.85, + "learning_rate": 2.834545347217943e-07, + "loss": 1.1335, + "step": 28267 + }, + { + "epoch": 0.85, + "learning_rate": 2.8334173173776096e-07, + "loss": 1.0361, + "step": 28268 + }, + { + "epoch": 0.85, + "learning_rate": 2.832289498552465e-07, + "loss": 1.0476, + "step": 28269 + }, + { + "epoch": 0.85, + "learning_rate": 2.831161890753248e-07, + "loss": 1.1401, + "step": 28270 + }, + { + "epoch": 0.85, + "learning_rate": 2.8300344939906994e-07, + "loss": 1.096, + "step": 28271 + }, + { + "epoch": 0.85, + "learning_rate": 2.828907308275541e-07, + "loss": 1.0413, + "step": 28272 + }, + { + "epoch": 0.85, + "learning_rate": 2.8277803336185047e-07, + "loss": 1.1895, + "step": 28273 + }, + { + "epoch": 0.85, + "learning_rate": 2.8266535700303213e-07, + "loss": 1.0902, + "step": 28274 + }, + { + "epoch": 0.85, + "learning_rate": 2.825527017521723e-07, + "loss": 1.1017, + "step": 28275 + }, + { + "epoch": 0.85, + "learning_rate": 2.8244006761034225e-07, + "loss": 1.0261, + "step": 28276 + }, + { + "epoch": 0.85, + "learning_rate": 2.8232745457861476e-07, + "loss": 1.074, + "step": 28277 + }, + { + "epoch": 0.85, + "learning_rate": 2.82214862658062e-07, + "loss": 1.1012, + "step": 28278 + }, + { + "epoch": 0.85, + "learning_rate": 2.821022918497554e-07, + "loss": 1.0415, + "step": 28279 + }, + { + "epoch": 0.85, + "learning_rate": 2.819897421547668e-07, + "loss": 1.0534, + "step": 28280 + }, + { + "epoch": 0.85, + "learning_rate": 2.818772135741676e-07, + "loss": 1.185, + "step": 28281 + }, + { + "epoch": 0.85, + "learning_rate": 2.817647061090292e-07, + "loss": 1.1118, + "step": 28282 + }, + { + "epoch": 0.85, + "learning_rate": 2.816522197604224e-07, + "loss": 1.051, + "step": 28283 + }, + { + "epoch": 0.85, + "learning_rate": 2.815397545294185e-07, + "loss": 1.0241, + "step": 28284 + }, + { + "epoch": 0.85, + "learning_rate": 2.8142731041708726e-07, + "loss": 1.0942, + "step": 28285 + }, + { + "epoch": 0.85, + "learning_rate": 2.8131488742449947e-07, + "loss": 1.1871, + "step": 28286 + }, + { + "epoch": 0.85, + "learning_rate": 2.812024855527254e-07, + "loss": 1.1389, + "step": 28287 + }, + { + "epoch": 0.85, + "learning_rate": 2.810901048028358e-07, + "loss": 1.0977, + "step": 28288 + }, + { + "epoch": 0.85, + "learning_rate": 2.809777451758988e-07, + "loss": 1.0775, + "step": 28289 + }, + { + "epoch": 0.85, + "learning_rate": 2.808654066729855e-07, + "loss": 1.108, + "step": 28290 + }, + { + "epoch": 0.85, + "learning_rate": 2.807530892951643e-07, + "loss": 1.1036, + "step": 28291 + }, + { + "epoch": 0.85, + "learning_rate": 2.8064079304350485e-07, + "loss": 1.0631, + "step": 28292 + }, + { + "epoch": 0.85, + "learning_rate": 2.8052851791907697e-07, + "loss": 0.9991, + "step": 28293 + }, + { + "epoch": 0.85, + "learning_rate": 2.8041626392294797e-07, + "loss": 1.0722, + "step": 28294 + }, + { + "epoch": 0.85, + "learning_rate": 2.803040310561872e-07, + "loss": 1.1161, + "step": 28295 + }, + { + "epoch": 0.85, + "learning_rate": 2.80191819319863e-07, + "loss": 1.0817, + "step": 28296 + }, + { + "epoch": 0.85, + "learning_rate": 2.8007962871504423e-07, + "loss": 1.0039, + "step": 28297 + }, + { + "epoch": 0.85, + "learning_rate": 2.799674592427976e-07, + "loss": 1.1117, + "step": 28298 + }, + { + "epoch": 0.85, + "learning_rate": 2.798553109041915e-07, + "loss": 1.136, + "step": 28299 + }, + { + "epoch": 0.85, + "learning_rate": 2.797431837002937e-07, + "loss": 1.0126, + "step": 28300 + }, + { + "epoch": 0.85, + "learning_rate": 2.796310776321717e-07, + "loss": 1.1445, + "step": 28301 + }, + { + "epoch": 0.85, + "learning_rate": 2.7951899270089234e-07, + "loss": 1.1525, + "step": 28302 + }, + { + "epoch": 0.85, + "learning_rate": 2.794069289075224e-07, + "loss": 1.066, + "step": 28303 + }, + { + "epoch": 0.85, + "learning_rate": 2.7929488625312944e-07, + "loss": 1.1451, + "step": 28304 + }, + { + "epoch": 0.85, + "learning_rate": 2.791828647387793e-07, + "loss": 1.2478, + "step": 28305 + }, + { + "epoch": 0.85, + "learning_rate": 2.790708643655393e-07, + "loss": 1.1725, + "step": 28306 + }, + { + "epoch": 0.85, + "learning_rate": 2.789588851344746e-07, + "loss": 1.0969, + "step": 28307 + }, + { + "epoch": 0.85, + "learning_rate": 2.788469270466515e-07, + "loss": 1.1281, + "step": 28308 + }, + { + "epoch": 0.85, + "learning_rate": 2.787349901031361e-07, + "loss": 1.1357, + "step": 28309 + }, + { + "epoch": 0.85, + "learning_rate": 2.786230743049936e-07, + "loss": 1.1242, + "step": 28310 + }, + { + "epoch": 0.85, + "learning_rate": 2.785111796532897e-07, + "loss": 1.2654, + "step": 28311 + }, + { + "epoch": 0.85, + "learning_rate": 2.783993061490894e-07, + "loss": 1.1215, + "step": 28312 + }, + { + "epoch": 0.85, + "learning_rate": 2.7828745379345797e-07, + "loss": 1.0851, + "step": 28313 + }, + { + "epoch": 0.85, + "learning_rate": 2.7817562258746014e-07, + "loss": 1.261, + "step": 28314 + }, + { + "epoch": 0.85, + "learning_rate": 2.7806381253216e-07, + "loss": 1.0957, + "step": 28315 + }, + { + "epoch": 0.85, + "learning_rate": 2.7795202362862233e-07, + "loss": 1.1107, + "step": 28316 + }, + { + "epoch": 0.85, + "learning_rate": 2.778402558779109e-07, + "loss": 1.084, + "step": 28317 + }, + { + "epoch": 0.85, + "learning_rate": 2.7772850928109024e-07, + "loss": 1.0944, + "step": 28318 + }, + { + "epoch": 0.85, + "learning_rate": 2.7761678383922436e-07, + "loss": 0.9783, + "step": 28319 + }, + { + "epoch": 0.85, + "learning_rate": 2.77505079553376e-07, + "loss": 1.1199, + "step": 28320 + }, + { + "epoch": 0.85, + "learning_rate": 2.773933964246087e-07, + "loss": 1.1178, + "step": 28321 + }, + { + "epoch": 0.85, + "learning_rate": 2.772817344539858e-07, + "loss": 1.0913, + "step": 28322 + }, + { + "epoch": 0.85, + "learning_rate": 2.7717009364257085e-07, + "loss": 1.2252, + "step": 28323 + }, + { + "epoch": 0.85, + "learning_rate": 2.770584739914256e-07, + "loss": 1.1898, + "step": 28324 + }, + { + "epoch": 0.85, + "learning_rate": 2.76946875501613e-07, + "loss": 1.1826, + "step": 28325 + }, + { + "epoch": 0.85, + "learning_rate": 2.7683529817419537e-07, + "loss": 1.0711, + "step": 28326 + }, + { + "epoch": 0.85, + "learning_rate": 2.767237420102356e-07, + "loss": 1.1523, + "step": 28327 + }, + { + "epoch": 0.85, + "learning_rate": 2.766122070107946e-07, + "loss": 1.1443, + "step": 28328 + }, + { + "epoch": 0.85, + "learning_rate": 2.765006931769346e-07, + "loss": 1.1931, + "step": 28329 + }, + { + "epoch": 0.85, + "learning_rate": 2.763892005097171e-07, + "loss": 1.0569, + "step": 28330 + }, + { + "epoch": 0.85, + "learning_rate": 2.7627772901020394e-07, + "loss": 1.0515, + "step": 28331 + }, + { + "epoch": 0.85, + "learning_rate": 2.761662786794553e-07, + "loss": 1.1401, + "step": 28332 + }, + { + "epoch": 0.85, + "learning_rate": 2.7605484951853277e-07, + "loss": 1.0821, + "step": 28333 + }, + { + "epoch": 0.85, + "learning_rate": 2.7594344152849674e-07, + "loss": 1.0034, + "step": 28334 + }, + { + "epoch": 0.85, + "learning_rate": 2.758320547104082e-07, + "loss": 1.0344, + "step": 28335 + }, + { + "epoch": 0.85, + "learning_rate": 2.757206890653272e-07, + "loss": 1.1744, + "step": 28336 + }, + { + "epoch": 0.85, + "learning_rate": 2.7560934459431423e-07, + "loss": 1.0428, + "step": 28337 + }, + { + "epoch": 0.85, + "learning_rate": 2.7549802129842873e-07, + "loss": 1.135, + "step": 28338 + }, + { + "epoch": 0.85, + "learning_rate": 2.753867191787307e-07, + "loss": 1.0084, + "step": 28339 + }, + { + "epoch": 0.85, + "learning_rate": 2.7527543823628046e-07, + "loss": 1.1442, + "step": 28340 + }, + { + "epoch": 0.85, + "learning_rate": 2.7516417847213595e-07, + "loss": 1.0473, + "step": 28341 + }, + { + "epoch": 0.85, + "learning_rate": 2.7505293988735694e-07, + "loss": 1.079, + "step": 28342 + }, + { + "epoch": 0.85, + "learning_rate": 2.7494172248300227e-07, + "loss": 1.1132, + "step": 28343 + }, + { + "epoch": 0.85, + "learning_rate": 2.748305262601314e-07, + "loss": 1.0717, + "step": 28344 + }, + { + "epoch": 0.85, + "learning_rate": 2.7471935121980155e-07, + "loss": 1.1098, + "step": 28345 + }, + { + "epoch": 0.85, + "learning_rate": 2.746081973630718e-07, + "loss": 1.1589, + "step": 28346 + }, + { + "epoch": 0.85, + "learning_rate": 2.744970646910003e-07, + "loss": 1.0566, + "step": 28347 + }, + { + "epoch": 0.85, + "learning_rate": 2.74385953204645e-07, + "loss": 1.0986, + "step": 28348 + }, + { + "epoch": 0.85, + "learning_rate": 2.74274862905064e-07, + "loss": 1.0492, + "step": 28349 + }, + { + "epoch": 0.85, + "learning_rate": 2.7416379379331365e-07, + "loss": 1.0141, + "step": 28350 + }, + { + "epoch": 0.85, + "learning_rate": 2.740527458704523e-07, + "loss": 1.1201, + "step": 28351 + }, + { + "epoch": 0.85, + "learning_rate": 2.739417191375365e-07, + "loss": 1.1504, + "step": 28352 + }, + { + "epoch": 0.85, + "learning_rate": 2.738307135956242e-07, + "loss": 1.0784, + "step": 28353 + }, + { + "epoch": 0.85, + "learning_rate": 2.737197292457705e-07, + "loss": 1.0444, + "step": 28354 + }, + { + "epoch": 0.85, + "learning_rate": 2.7360876608903295e-07, + "loss": 1.1512, + "step": 28355 + }, + { + "epoch": 0.85, + "learning_rate": 2.734978241264677e-07, + "loss": 1.045, + "step": 28356 + }, + { + "epoch": 0.85, + "learning_rate": 2.733869033591313e-07, + "loss": 1.0175, + "step": 28357 + }, + { + "epoch": 0.85, + "learning_rate": 2.7327600378807885e-07, + "loss": 1.192, + "step": 28358 + }, + { + "epoch": 0.85, + "learning_rate": 2.731651254143661e-07, + "loss": 1.069, + "step": 28359 + }, + { + "epoch": 0.85, + "learning_rate": 2.730542682390491e-07, + "loss": 1.0858, + "step": 28360 + }, + { + "epoch": 0.85, + "learning_rate": 2.72943432263183e-07, + "loss": 1.1276, + "step": 28361 + }, + { + "epoch": 0.85, + "learning_rate": 2.7283261748782264e-07, + "loss": 1.067, + "step": 28362 + }, + { + "epoch": 0.85, + "learning_rate": 2.7272182391402305e-07, + "loss": 1.1323, + "step": 28363 + }, + { + "epoch": 0.85, + "learning_rate": 2.726110515428393e-07, + "loss": 1.0769, + "step": 28364 + }, + { + "epoch": 0.85, + "learning_rate": 2.7250030037532545e-07, + "loss": 1.0825, + "step": 28365 + }, + { + "epoch": 0.85, + "learning_rate": 2.723895704125365e-07, + "loss": 1.0468, + "step": 28366 + }, + { + "epoch": 0.85, + "learning_rate": 2.7227886165552525e-07, + "loss": 1.1868, + "step": 28367 + }, + { + "epoch": 0.85, + "learning_rate": 2.721681741053467e-07, + "loss": 1.0109, + "step": 28368 + }, + { + "epoch": 0.85, + "learning_rate": 2.7205750776305384e-07, + "loss": 1.13, + "step": 28369 + }, + { + "epoch": 0.85, + "learning_rate": 2.719468626297012e-07, + "loss": 1.1919, + "step": 28370 + }, + { + "epoch": 0.85, + "learning_rate": 2.7183623870634087e-07, + "loss": 1.0938, + "step": 28371 + }, + { + "epoch": 0.85, + "learning_rate": 2.7172563599402626e-07, + "loss": 1.1022, + "step": 28372 + }, + { + "epoch": 0.85, + "learning_rate": 2.716150544938106e-07, + "loss": 1.0262, + "step": 28373 + }, + { + "epoch": 0.85, + "learning_rate": 2.715044942067463e-07, + "loss": 1.1057, + "step": 28374 + }, + { + "epoch": 0.85, + "learning_rate": 2.713939551338865e-07, + "loss": 1.0918, + "step": 28375 + }, + { + "epoch": 0.85, + "learning_rate": 2.712834372762821e-07, + "loss": 1.1102, + "step": 28376 + }, + { + "epoch": 0.85, + "learning_rate": 2.711729406349864e-07, + "loss": 1.0894, + "step": 28377 + }, + { + "epoch": 0.85, + "learning_rate": 2.710624652110508e-07, + "loss": 1.039, + "step": 28378 + }, + { + "epoch": 0.85, + "learning_rate": 2.709520110055272e-07, + "loss": 1.0624, + "step": 28379 + }, + { + "epoch": 0.85, + "learning_rate": 2.7084157801946674e-07, + "loss": 1.0626, + "step": 28380 + }, + { + "epoch": 0.85, + "learning_rate": 2.707311662539208e-07, + "loss": 1.1609, + "step": 28381 + }, + { + "epoch": 0.86, + "learning_rate": 2.706207757099405e-07, + "loss": 1.1234, + "step": 28382 + }, + { + "epoch": 0.86, + "learning_rate": 2.7051040638857715e-07, + "loss": 1.1, + "step": 28383 + }, + { + "epoch": 0.86, + "learning_rate": 2.704000582908806e-07, + "loss": 1.1439, + "step": 28384 + }, + { + "epoch": 0.86, + "learning_rate": 2.702897314179015e-07, + "loss": 1.2351, + "step": 28385 + }, + { + "epoch": 0.86, + "learning_rate": 2.701794257706905e-07, + "loss": 1.1774, + "step": 28386 + }, + { + "epoch": 0.86, + "learning_rate": 2.7006914135029735e-07, + "loss": 1.1166, + "step": 28387 + }, + { + "epoch": 0.86, + "learning_rate": 2.6995887815777193e-07, + "loss": 1.112, + "step": 28388 + }, + { + "epoch": 0.86, + "learning_rate": 2.6984863619416433e-07, + "loss": 1.1216, + "step": 28389 + }, + { + "epoch": 0.86, + "learning_rate": 2.6973841546052345e-07, + "loss": 1.2246, + "step": 28390 + }, + { + "epoch": 0.86, + "learning_rate": 2.696282159578986e-07, + "loss": 1.1037, + "step": 28391 + }, + { + "epoch": 0.86, + "learning_rate": 2.695180376873391e-07, + "loss": 1.1114, + "step": 28392 + }, + { + "epoch": 0.86, + "learning_rate": 2.694078806498934e-07, + "loss": 1.1157, + "step": 28393 + }, + { + "epoch": 0.86, + "learning_rate": 2.692977448466105e-07, + "loss": 1.0534, + "step": 28394 + }, + { + "epoch": 0.86, + "learning_rate": 2.691876302785387e-07, + "loss": 1.0154, + "step": 28395 + }, + { + "epoch": 0.86, + "learning_rate": 2.690775369467266e-07, + "loss": 1.1304, + "step": 28396 + }, + { + "epoch": 0.86, + "learning_rate": 2.689674648522217e-07, + "loss": 1.0597, + "step": 28397 + }, + { + "epoch": 0.86, + "learning_rate": 2.68857413996072e-07, + "loss": 1.0219, + "step": 28398 + }, + { + "epoch": 0.86, + "learning_rate": 2.687473843793251e-07, + "loss": 1.1352, + "step": 28399 + }, + { + "epoch": 0.86, + "learning_rate": 2.6863737600302837e-07, + "loss": 1.075, + "step": 28400 + }, + { + "epoch": 0.86, + "learning_rate": 2.6852738886822967e-07, + "loss": 0.9876, + "step": 28401 + }, + { + "epoch": 0.86, + "learning_rate": 2.6841742297597506e-07, + "loss": 1.0868, + "step": 28402 + }, + { + "epoch": 0.86, + "learning_rate": 2.683074783273118e-07, + "loss": 1.0755, + "step": 28403 + }, + { + "epoch": 0.86, + "learning_rate": 2.681975549232865e-07, + "loss": 1.137, + "step": 28404 + }, + { + "epoch": 0.86, + "learning_rate": 2.680876527649465e-07, + "loss": 1.1743, + "step": 28405 + }, + { + "epoch": 0.86, + "learning_rate": 2.6797777185333605e-07, + "loss": 1.0547, + "step": 28406 + }, + { + "epoch": 0.86, + "learning_rate": 2.678679121895025e-07, + "loss": 1.1589, + "step": 28407 + }, + { + "epoch": 0.86, + "learning_rate": 2.677580737744914e-07, + "loss": 1.212, + "step": 28408 + }, + { + "epoch": 0.86, + "learning_rate": 2.6764825660934885e-07, + "loss": 1.0698, + "step": 28409 + }, + { + "epoch": 0.86, + "learning_rate": 2.6753846069511923e-07, + "loss": 1.0972, + "step": 28410 + }, + { + "epoch": 0.86, + "learning_rate": 2.674286860328484e-07, + "loss": 1.2137, + "step": 28411 + }, + { + "epoch": 0.86, + "learning_rate": 2.673189326235812e-07, + "loss": 1.1067, + "step": 28412 + }, + { + "epoch": 0.86, + "learning_rate": 2.6720920046836213e-07, + "loss": 1.213, + "step": 28413 + }, + { + "epoch": 0.86, + "learning_rate": 2.6709948956823687e-07, + "loss": 1.0931, + "step": 28414 + }, + { + "epoch": 0.86, + "learning_rate": 2.669897999242488e-07, + "loss": 1.1169, + "step": 28415 + }, + { + "epoch": 0.86, + "learning_rate": 2.6688013153744195e-07, + "loss": 1.1487, + "step": 28416 + }, + { + "epoch": 0.86, + "learning_rate": 2.667704844088609e-07, + "loss": 1.0715, + "step": 28417 + }, + { + "epoch": 0.86, + "learning_rate": 2.666608585395494e-07, + "loss": 1.1854, + "step": 28418 + }, + { + "epoch": 0.86, + "learning_rate": 2.6655125393055093e-07, + "loss": 1.0474, + "step": 28419 + }, + { + "epoch": 0.86, + "learning_rate": 2.664416705829087e-07, + "loss": 1.1061, + "step": 28420 + }, + { + "epoch": 0.86, + "learning_rate": 2.663321084976661e-07, + "loss": 1.0587, + "step": 28421 + }, + { + "epoch": 0.86, + "learning_rate": 2.6622256767586644e-07, + "loss": 1.0261, + "step": 28422 + }, + { + "epoch": 0.86, + "learning_rate": 2.66113048118552e-07, + "loss": 1.1084, + "step": 28423 + }, + { + "epoch": 0.86, + "learning_rate": 2.660035498267652e-07, + "loss": 1.0898, + "step": 28424 + }, + { + "epoch": 0.86, + "learning_rate": 2.6589407280154856e-07, + "loss": 1.1225, + "step": 28425 + }, + { + "epoch": 0.86, + "learning_rate": 2.657846170439446e-07, + "loss": 1.1242, + "step": 28426 + }, + { + "epoch": 0.86, + "learning_rate": 2.6567518255499523e-07, + "loss": 1.0891, + "step": 28427 + }, + { + "epoch": 0.86, + "learning_rate": 2.655657693357419e-07, + "loss": 1.1036, + "step": 28428 + }, + { + "epoch": 0.86, + "learning_rate": 2.6545637738722596e-07, + "loss": 1.1605, + "step": 28429 + }, + { + "epoch": 0.86, + "learning_rate": 2.6534700671048935e-07, + "loss": 1.1243, + "step": 28430 + }, + { + "epoch": 0.86, + "learning_rate": 2.6523765730657345e-07, + "loss": 1.1282, + "step": 28431 + }, + { + "epoch": 0.86, + "learning_rate": 2.651283291765183e-07, + "loss": 1.1268, + "step": 28432 + }, + { + "epoch": 0.86, + "learning_rate": 2.65019022321365e-07, + "loss": 1.1452, + "step": 28433 + }, + { + "epoch": 0.86, + "learning_rate": 2.649097367421544e-07, + "loss": 1.0417, + "step": 28434 + }, + { + "epoch": 0.86, + "learning_rate": 2.6480047243992695e-07, + "loss": 0.9905, + "step": 28435 + }, + { + "epoch": 0.86, + "learning_rate": 2.6469122941572195e-07, + "loss": 1.0593, + "step": 28436 + }, + { + "epoch": 0.86, + "learning_rate": 2.645820076705799e-07, + "loss": 1.2992, + "step": 28437 + }, + { + "epoch": 0.86, + "learning_rate": 2.644728072055408e-07, + "loss": 1.0358, + "step": 28438 + }, + { + "epoch": 0.86, + "learning_rate": 2.6436362802164354e-07, + "loss": 1.075, + "step": 28439 + }, + { + "epoch": 0.86, + "learning_rate": 2.6425447011992845e-07, + "loss": 1.1323, + "step": 28440 + }, + { + "epoch": 0.86, + "learning_rate": 2.6414533350143377e-07, + "loss": 1.0972, + "step": 28441 + }, + { + "epoch": 0.86, + "learning_rate": 2.640362181671985e-07, + "loss": 1.1071, + "step": 28442 + }, + { + "epoch": 0.86, + "learning_rate": 2.639271241182614e-07, + "loss": 1.0605, + "step": 28443 + }, + { + "epoch": 0.86, + "learning_rate": 2.6381805135566126e-07, + "loss": 1.0877, + "step": 28444 + }, + { + "epoch": 0.86, + "learning_rate": 2.6370899988043653e-07, + "loss": 1.1071, + "step": 28445 + }, + { + "epoch": 0.86, + "learning_rate": 2.635999696936248e-07, + "loss": 1.0847, + "step": 28446 + }, + { + "epoch": 0.86, + "learning_rate": 2.6349096079626436e-07, + "loss": 1.1149, + "step": 28447 + }, + { + "epoch": 0.86, + "learning_rate": 2.633819731893933e-07, + "loss": 1.1225, + "step": 28448 + }, + { + "epoch": 0.86, + "learning_rate": 2.6327300687404827e-07, + "loss": 1.1699, + "step": 28449 + }, + { + "epoch": 0.86, + "learning_rate": 2.631640618512668e-07, + "loss": 1.1726, + "step": 28450 + }, + { + "epoch": 0.86, + "learning_rate": 2.6305513812208637e-07, + "loss": 1.1536, + "step": 28451 + }, + { + "epoch": 0.86, + "learning_rate": 2.6294623568754343e-07, + "loss": 1.1075, + "step": 28452 + }, + { + "epoch": 0.86, + "learning_rate": 2.628373545486756e-07, + "loss": 1.1112, + "step": 28453 + }, + { + "epoch": 0.86, + "learning_rate": 2.6272849470651814e-07, + "loss": 1.1683, + "step": 28454 + }, + { + "epoch": 0.86, + "learning_rate": 2.6261965616210805e-07, + "loss": 1.1627, + "step": 28455 + }, + { + "epoch": 0.86, + "learning_rate": 2.62510838916481e-07, + "loss": 1.1482, + "step": 28456 + }, + { + "epoch": 0.86, + "learning_rate": 2.624020429706739e-07, + "loss": 1.0137, + "step": 28457 + }, + { + "epoch": 0.86, + "learning_rate": 2.6229326832572096e-07, + "loss": 1.0238, + "step": 28458 + }, + { + "epoch": 0.86, + "learning_rate": 2.621845149826585e-07, + "loss": 1.1207, + "step": 28459 + }, + { + "epoch": 0.86, + "learning_rate": 2.620757829425216e-07, + "loss": 1.1182, + "step": 28460 + }, + { + "epoch": 0.86, + "learning_rate": 2.619670722063461e-07, + "loss": 1.0438, + "step": 28461 + }, + { + "epoch": 0.86, + "learning_rate": 2.618583827751656e-07, + "loss": 1.1637, + "step": 28462 + }, + { + "epoch": 0.86, + "learning_rate": 2.6174971465001556e-07, + "loss": 1.1274, + "step": 28463 + }, + { + "epoch": 0.86, + "learning_rate": 2.6164106783193004e-07, + "loss": 1.1376, + "step": 28464 + }, + { + "epoch": 0.86, + "learning_rate": 2.615324423219434e-07, + "loss": 1.0325, + "step": 28465 + }, + { + "epoch": 0.86, + "learning_rate": 2.614238381210907e-07, + "loss": 1.0216, + "step": 28466 + }, + { + "epoch": 0.86, + "learning_rate": 2.613152552304041e-07, + "loss": 1.1293, + "step": 28467 + }, + { + "epoch": 0.86, + "learning_rate": 2.612066936509183e-07, + "loss": 1.0905, + "step": 28468 + }, + { + "epoch": 0.86, + "learning_rate": 2.610981533836665e-07, + "loss": 1.104, + "step": 28469 + }, + { + "epoch": 0.86, + "learning_rate": 2.609896344296819e-07, + "loss": 1.1121, + "step": 28470 + }, + { + "epoch": 0.86, + "learning_rate": 2.6088113678999797e-07, + "loss": 1.0836, + "step": 28471 + }, + { + "epoch": 0.86, + "learning_rate": 2.6077266046564714e-07, + "loss": 1.088, + "step": 28472 + }, + { + "epoch": 0.86, + "learning_rate": 2.606642054576619e-07, + "loss": 1.1672, + "step": 28473 + }, + { + "epoch": 0.86, + "learning_rate": 2.605557717670748e-07, + "loss": 1.0335, + "step": 28474 + }, + { + "epoch": 0.86, + "learning_rate": 2.6044735939491835e-07, + "loss": 1.0758, + "step": 28475 + }, + { + "epoch": 0.86, + "learning_rate": 2.603389683422244e-07, + "loss": 1.0436, + "step": 28476 + }, + { + "epoch": 0.86, + "learning_rate": 2.602305986100248e-07, + "loss": 1.0144, + "step": 28477 + }, + { + "epoch": 0.86, + "learning_rate": 2.601222501993514e-07, + "loss": 1.0676, + "step": 28478 + }, + { + "epoch": 0.86, + "learning_rate": 2.600139231112356e-07, + "loss": 1.0577, + "step": 28479 + }, + { + "epoch": 0.86, + "learning_rate": 2.599056173467082e-07, + "loss": 1.1077, + "step": 28480 + }, + { + "epoch": 0.86, + "learning_rate": 2.5979733290680043e-07, + "loss": 1.0814, + "step": 28481 + }, + { + "epoch": 0.86, + "learning_rate": 2.5968906979254303e-07, + "loss": 1.0536, + "step": 28482 + }, + { + "epoch": 0.86, + "learning_rate": 2.595808280049672e-07, + "loss": 1.0604, + "step": 28483 + }, + { + "epoch": 0.86, + "learning_rate": 2.5947260754510235e-07, + "loss": 1.0695, + "step": 28484 + }, + { + "epoch": 0.86, + "learning_rate": 2.593644084139793e-07, + "loss": 0.9882, + "step": 28485 + }, + { + "epoch": 0.86, + "learning_rate": 2.5925623061262784e-07, + "loss": 1.1802, + "step": 28486 + }, + { + "epoch": 0.86, + "learning_rate": 2.591480741420785e-07, + "loss": 1.278, + "step": 28487 + }, + { + "epoch": 0.86, + "learning_rate": 2.590399390033596e-07, + "loss": 1.0438, + "step": 28488 + }, + { + "epoch": 0.86, + "learning_rate": 2.589318251975012e-07, + "loss": 1.115, + "step": 28489 + }, + { + "epoch": 0.86, + "learning_rate": 2.5882373272553276e-07, + "loss": 1.0858, + "step": 28490 + }, + { + "epoch": 0.86, + "learning_rate": 2.587156615884828e-07, + "loss": 1.1956, + "step": 28491 + }, + { + "epoch": 0.86, + "learning_rate": 2.586076117873806e-07, + "loss": 1.1202, + "step": 28492 + }, + { + "epoch": 0.86, + "learning_rate": 2.5849958332325426e-07, + "loss": 1.2181, + "step": 28493 + }, + { + "epoch": 0.86, + "learning_rate": 2.583915761971323e-07, + "loss": 1.0346, + "step": 28494 + }, + { + "epoch": 0.86, + "learning_rate": 2.582835904100428e-07, + "loss": 1.1202, + "step": 28495 + }, + { + "epoch": 0.86, + "learning_rate": 2.5817562596301443e-07, + "loss": 1.1014, + "step": 28496 + }, + { + "epoch": 0.86, + "learning_rate": 2.5806768285707414e-07, + "loss": 1.1692, + "step": 28497 + }, + { + "epoch": 0.86, + "learning_rate": 2.579597610932494e-07, + "loss": 1.0184, + "step": 28498 + }, + { + "epoch": 0.86, + "learning_rate": 2.57851860672568e-07, + "loss": 1.1912, + "step": 28499 + }, + { + "epoch": 0.86, + "learning_rate": 2.577439815960572e-07, + "loss": 1.1561, + "step": 28500 + }, + { + "epoch": 0.86, + "learning_rate": 2.5763612386474376e-07, + "loss": 1.0332, + "step": 28501 + }, + { + "epoch": 0.86, + "learning_rate": 2.5752828747965447e-07, + "loss": 0.9838, + "step": 28502 + }, + { + "epoch": 0.86, + "learning_rate": 2.5742047244181583e-07, + "loss": 1.1113, + "step": 28503 + }, + { + "epoch": 0.86, + "learning_rate": 2.573126787522545e-07, + "loss": 1.062, + "step": 28504 + }, + { + "epoch": 0.86, + "learning_rate": 2.572049064119961e-07, + "loss": 1.1009, + "step": 28505 + }, + { + "epoch": 0.86, + "learning_rate": 2.5709715542206693e-07, + "loss": 1.0659, + "step": 28506 + }, + { + "epoch": 0.86, + "learning_rate": 2.5698942578349235e-07, + "loss": 1.1647, + "step": 28507 + }, + { + "epoch": 0.86, + "learning_rate": 2.5688171749729843e-07, + "loss": 1.052, + "step": 28508 + }, + { + "epoch": 0.86, + "learning_rate": 2.5677403056451056e-07, + "loss": 1.0338, + "step": 28509 + }, + { + "epoch": 0.86, + "learning_rate": 2.566663649861531e-07, + "loss": 1.1433, + "step": 28510 + }, + { + "epoch": 0.86, + "learning_rate": 2.565587207632514e-07, + "loss": 1.0926, + "step": 28511 + }, + { + "epoch": 0.86, + "learning_rate": 2.564510978968301e-07, + "loss": 1.0155, + "step": 28512 + }, + { + "epoch": 0.86, + "learning_rate": 2.563434963879144e-07, + "loss": 1.1016, + "step": 28513 + }, + { + "epoch": 0.86, + "learning_rate": 2.5623591623752745e-07, + "loss": 1.2075, + "step": 28514 + }, + { + "epoch": 0.86, + "learning_rate": 2.5612835744669413e-07, + "loss": 1.1359, + "step": 28515 + }, + { + "epoch": 0.86, + "learning_rate": 2.5602082001643794e-07, + "loss": 1.054, + "step": 28516 + }, + { + "epoch": 0.86, + "learning_rate": 2.559133039477835e-07, + "loss": 1.1387, + "step": 28517 + }, + { + "epoch": 0.86, + "learning_rate": 2.5580580924175316e-07, + "loss": 0.9663, + "step": 28518 + }, + { + "epoch": 0.86, + "learning_rate": 2.5569833589937057e-07, + "loss": 1.0684, + "step": 28519 + }, + { + "epoch": 0.86, + "learning_rate": 2.5559088392165893e-07, + "loss": 1.0626, + "step": 28520 + }, + { + "epoch": 0.86, + "learning_rate": 2.554834533096412e-07, + "loss": 1.0615, + "step": 28521 + }, + { + "epoch": 0.86, + "learning_rate": 2.5537604406434046e-07, + "loss": 1.0689, + "step": 28522 + }, + { + "epoch": 0.86, + "learning_rate": 2.5526865618677815e-07, + "loss": 1.1833, + "step": 28523 + }, + { + "epoch": 0.86, + "learning_rate": 2.5516128967797706e-07, + "loss": 1.0211, + "step": 28524 + }, + { + "epoch": 0.86, + "learning_rate": 2.5505394453895966e-07, + "loss": 1.1827, + "step": 28525 + }, + { + "epoch": 0.86, + "learning_rate": 2.549466207707471e-07, + "loss": 1.019, + "step": 28526 + }, + { + "epoch": 0.86, + "learning_rate": 2.5483931837436165e-07, + "loss": 1.0116, + "step": 28527 + }, + { + "epoch": 0.86, + "learning_rate": 2.5473203735082467e-07, + "loss": 1.0117, + "step": 28528 + }, + { + "epoch": 0.86, + "learning_rate": 2.5462477770115736e-07, + "loss": 1.0578, + "step": 28529 + }, + { + "epoch": 0.86, + "learning_rate": 2.5451753942638103e-07, + "loss": 1.1712, + "step": 28530 + }, + { + "epoch": 0.86, + "learning_rate": 2.5441032252751604e-07, + "loss": 1.1838, + "step": 28531 + }, + { + "epoch": 0.86, + "learning_rate": 2.543031270055829e-07, + "loss": 1.091, + "step": 28532 + }, + { + "epoch": 0.86, + "learning_rate": 2.5419595286160283e-07, + "loss": 1.1573, + "step": 28533 + }, + { + "epoch": 0.86, + "learning_rate": 2.540888000965955e-07, + "loss": 1.1033, + "step": 28534 + }, + { + "epoch": 0.86, + "learning_rate": 2.539816687115815e-07, + "loss": 1.1048, + "step": 28535 + }, + { + "epoch": 0.86, + "learning_rate": 2.5387455870758e-07, + "loss": 1.3295, + "step": 28536 + }, + { + "epoch": 0.86, + "learning_rate": 2.5376747008561074e-07, + "loss": 1.0531, + "step": 28537 + }, + { + "epoch": 0.86, + "learning_rate": 2.5366040284669354e-07, + "loss": 1.1071, + "step": 28538 + }, + { + "epoch": 0.86, + "learning_rate": 2.535533569918477e-07, + "loss": 1.1477, + "step": 28539 + }, + { + "epoch": 0.86, + "learning_rate": 2.5344633252209175e-07, + "loss": 1.0949, + "step": 28540 + }, + { + "epoch": 0.86, + "learning_rate": 2.5333932943844455e-07, + "loss": 1.0258, + "step": 28541 + }, + { + "epoch": 0.86, + "learning_rate": 2.532323477419249e-07, + "loss": 0.964, + "step": 28542 + }, + { + "epoch": 0.86, + "learning_rate": 2.531253874335518e-07, + "loss": 1.2157, + "step": 28543 + }, + { + "epoch": 0.86, + "learning_rate": 2.530184485143422e-07, + "loss": 1.0018, + "step": 28544 + }, + { + "epoch": 0.86, + "learning_rate": 2.52911530985315e-07, + "loss": 1.1417, + "step": 28545 + }, + { + "epoch": 0.86, + "learning_rate": 2.5280463484748777e-07, + "loss": 1.1123, + "step": 28546 + }, + { + "epoch": 0.86, + "learning_rate": 2.5269776010187817e-07, + "loss": 1.0472, + "step": 28547 + }, + { + "epoch": 0.86, + "learning_rate": 2.525909067495039e-07, + "loss": 1.1805, + "step": 28548 + }, + { + "epoch": 0.86, + "learning_rate": 2.524840747913815e-07, + "loss": 0.979, + "step": 28549 + }, + { + "epoch": 0.86, + "learning_rate": 2.5237726422852797e-07, + "loss": 1.117, + "step": 28550 + }, + { + "epoch": 0.86, + "learning_rate": 2.522704750619606e-07, + "loss": 1.091, + "step": 28551 + }, + { + "epoch": 0.86, + "learning_rate": 2.521637072926958e-07, + "loss": 1.0989, + "step": 28552 + }, + { + "epoch": 0.86, + "learning_rate": 2.520569609217502e-07, + "loss": 1.0664, + "step": 28553 + }, + { + "epoch": 0.86, + "learning_rate": 2.519502359501394e-07, + "loss": 1.0099, + "step": 28554 + }, + { + "epoch": 0.86, + "learning_rate": 2.5184353237887954e-07, + "loss": 1.2057, + "step": 28555 + }, + { + "epoch": 0.86, + "learning_rate": 2.5173685020898676e-07, + "loss": 0.9684, + "step": 28556 + }, + { + "epoch": 0.86, + "learning_rate": 2.5163018944147604e-07, + "loss": 1.0322, + "step": 28557 + }, + { + "epoch": 0.86, + "learning_rate": 2.515235500773633e-07, + "loss": 1.0796, + "step": 28558 + }, + { + "epoch": 0.86, + "learning_rate": 2.514169321176632e-07, + "loss": 1.1089, + "step": 28559 + }, + { + "epoch": 0.86, + "learning_rate": 2.5131033556339114e-07, + "loss": 1.0939, + "step": 28560 + }, + { + "epoch": 0.86, + "learning_rate": 2.5120376041556205e-07, + "loss": 1.1055, + "step": 28561 + }, + { + "epoch": 0.86, + "learning_rate": 2.510972066751896e-07, + "loss": 1.0507, + "step": 28562 + }, + { + "epoch": 0.86, + "learning_rate": 2.5099067434328886e-07, + "loss": 0.9825, + "step": 28563 + }, + { + "epoch": 0.86, + "learning_rate": 2.508841634208736e-07, + "loss": 1.1777, + "step": 28564 + }, + { + "epoch": 0.86, + "learning_rate": 2.507776739089582e-07, + "loss": 1.1019, + "step": 28565 + }, + { + "epoch": 0.86, + "learning_rate": 2.506712058085559e-07, + "loss": 1.0215, + "step": 28566 + }, + { + "epoch": 0.86, + "learning_rate": 2.5056475912068027e-07, + "loss": 1.0848, + "step": 28567 + }, + { + "epoch": 0.86, + "learning_rate": 2.504583338463448e-07, + "loss": 1.1058, + "step": 28568 + }, + { + "epoch": 0.86, + "learning_rate": 2.503519299865631e-07, + "loss": 0.9233, + "step": 28569 + }, + { + "epoch": 0.86, + "learning_rate": 2.5024554754234683e-07, + "loss": 1.091, + "step": 28570 + }, + { + "epoch": 0.86, + "learning_rate": 2.501391865147096e-07, + "loss": 1.0139, + "step": 28571 + }, + { + "epoch": 0.86, + "learning_rate": 2.5003284690466393e-07, + "loss": 1.1045, + "step": 28572 + }, + { + "epoch": 0.86, + "learning_rate": 2.499265287132216e-07, + "loss": 1.075, + "step": 28573 + }, + { + "epoch": 0.86, + "learning_rate": 2.498202319413959e-07, + "loss": 1.0502, + "step": 28574 + }, + { + "epoch": 0.86, + "learning_rate": 2.497139565901971e-07, + "loss": 1.0085, + "step": 28575 + }, + { + "epoch": 0.86, + "learning_rate": 2.496077026606378e-07, + "loss": 1.1722, + "step": 28576 + }, + { + "epoch": 0.86, + "learning_rate": 2.4950147015372906e-07, + "loss": 0.9975, + "step": 28577 + }, + { + "epoch": 0.86, + "learning_rate": 2.4939525907048315e-07, + "loss": 1.0551, + "step": 28578 + }, + { + "epoch": 0.86, + "learning_rate": 2.4928906941191015e-07, + "loss": 1.0458, + "step": 28579 + }, + { + "epoch": 0.86, + "learning_rate": 2.491829011790209e-07, + "loss": 1.1236, + "step": 28580 + }, + { + "epoch": 0.86, + "learning_rate": 2.4907675437282646e-07, + "loss": 1.0339, + "step": 28581 + }, + { + "epoch": 0.86, + "learning_rate": 2.4897062899433747e-07, + "loss": 1.0744, + "step": 28582 + }, + { + "epoch": 0.86, + "learning_rate": 2.488645250445637e-07, + "loss": 1.0506, + "step": 28583 + }, + { + "epoch": 0.86, + "learning_rate": 2.487584425245157e-07, + "loss": 1.0345, + "step": 28584 + }, + { + "epoch": 0.86, + "learning_rate": 2.4865238143520294e-07, + "loss": 1.0058, + "step": 28585 + }, + { + "epoch": 0.86, + "learning_rate": 2.4854634177763517e-07, + "loss": 1.0626, + "step": 28586 + }, + { + "epoch": 0.86, + "learning_rate": 2.484403235528224e-07, + "loss": 1.0544, + "step": 28587 + }, + { + "epoch": 0.86, + "learning_rate": 2.48334326761773e-07, + "loss": 1.1374, + "step": 28588 + }, + { + "epoch": 0.86, + "learning_rate": 2.4822835140549616e-07, + "loss": 1.0593, + "step": 28589 + }, + { + "epoch": 0.86, + "learning_rate": 2.481223974850011e-07, + "loss": 1.1105, + "step": 28590 + }, + { + "epoch": 0.86, + "learning_rate": 2.480164650012967e-07, + "loss": 1.057, + "step": 28591 + }, + { + "epoch": 0.86, + "learning_rate": 2.4791055395539053e-07, + "loss": 1.0488, + "step": 28592 + }, + { + "epoch": 0.86, + "learning_rate": 2.478046643482912e-07, + "loss": 1.0478, + "step": 28593 + }, + { + "epoch": 0.86, + "learning_rate": 2.4769879618100676e-07, + "loss": 1.1288, + "step": 28594 + }, + { + "epoch": 0.86, + "learning_rate": 2.4759294945454563e-07, + "loss": 1.1408, + "step": 28595 + }, + { + "epoch": 0.86, + "learning_rate": 2.474871241699142e-07, + "loss": 1.0046, + "step": 28596 + }, + { + "epoch": 0.86, + "learning_rate": 2.4738132032812056e-07, + "loss": 1.1075, + "step": 28597 + }, + { + "epoch": 0.86, + "learning_rate": 2.4727553793017197e-07, + "loss": 1.061, + "step": 28598 + }, + { + "epoch": 0.86, + "learning_rate": 2.4716977697707505e-07, + "loss": 1.122, + "step": 28599 + }, + { + "epoch": 0.86, + "learning_rate": 2.4706403746983745e-07, + "loss": 1.0491, + "step": 28600 + }, + { + "epoch": 0.86, + "learning_rate": 2.4695831940946465e-07, + "loss": 1.0607, + "step": 28601 + }, + { + "epoch": 0.86, + "learning_rate": 2.4685262279696366e-07, + "loss": 1.1356, + "step": 28602 + }, + { + "epoch": 0.86, + "learning_rate": 2.467469476333406e-07, + "loss": 1.0312, + "step": 28603 + }, + { + "epoch": 0.86, + "learning_rate": 2.4664129391960167e-07, + "loss": 1.1051, + "step": 28604 + }, + { + "epoch": 0.86, + "learning_rate": 2.4653566165675183e-07, + "loss": 1.2046, + "step": 28605 + }, + { + "epoch": 0.86, + "learning_rate": 2.464300508457976e-07, + "loss": 1.156, + "step": 28606 + }, + { + "epoch": 0.86, + "learning_rate": 2.463244614877436e-07, + "loss": 1.0684, + "step": 28607 + }, + { + "epoch": 0.86, + "learning_rate": 2.4621889358359516e-07, + "loss": 1.1505, + "step": 28608 + }, + { + "epoch": 0.86, + "learning_rate": 2.461133471343577e-07, + "loss": 0.9995, + "step": 28609 + }, + { + "epoch": 0.86, + "learning_rate": 2.460078221410356e-07, + "loss": 1.1373, + "step": 28610 + }, + { + "epoch": 0.86, + "learning_rate": 2.459023186046336e-07, + "loss": 1.0787, + "step": 28611 + }, + { + "epoch": 0.86, + "learning_rate": 2.4579683652615564e-07, + "loss": 1.1348, + "step": 28612 + }, + { + "epoch": 0.86, + "learning_rate": 2.456913759066068e-07, + "loss": 1.023, + "step": 28613 + }, + { + "epoch": 0.86, + "learning_rate": 2.455859367469898e-07, + "loss": 1.1224, + "step": 28614 + }, + { + "epoch": 0.86, + "learning_rate": 2.4548051904830896e-07, + "loss": 1.0893, + "step": 28615 + }, + { + "epoch": 0.86, + "learning_rate": 2.4537512281156776e-07, + "loss": 1.0522, + "step": 28616 + }, + { + "epoch": 0.86, + "learning_rate": 2.4526974803777e-07, + "loss": 1.1014, + "step": 28617 + }, + { + "epoch": 0.86, + "learning_rate": 2.451643947279178e-07, + "loss": 1.0997, + "step": 28618 + }, + { + "epoch": 0.86, + "learning_rate": 2.450590628830146e-07, + "loss": 1.013, + "step": 28619 + }, + { + "epoch": 0.86, + "learning_rate": 2.4495375250406294e-07, + "loss": 1.0603, + "step": 28620 + }, + { + "epoch": 0.86, + "learning_rate": 2.4484846359206614e-07, + "loss": 1.057, + "step": 28621 + }, + { + "epoch": 0.86, + "learning_rate": 2.4474319614802537e-07, + "loss": 0.9769, + "step": 28622 + }, + { + "epoch": 0.86, + "learning_rate": 2.4463795017294346e-07, + "loss": 1.0634, + "step": 28623 + }, + { + "epoch": 0.86, + "learning_rate": 2.4453272566782176e-07, + "loss": 1.1089, + "step": 28624 + }, + { + "epoch": 0.86, + "learning_rate": 2.444275226336623e-07, + "loss": 1.139, + "step": 28625 + }, + { + "epoch": 0.86, + "learning_rate": 2.443223410714668e-07, + "loss": 1.127, + "step": 28626 + }, + { + "epoch": 0.86, + "learning_rate": 2.4421718098223607e-07, + "loss": 1.1263, + "step": 28627 + }, + { + "epoch": 0.86, + "learning_rate": 2.441120423669713e-07, + "loss": 1.054, + "step": 28628 + }, + { + "epoch": 0.86, + "learning_rate": 2.440069252266733e-07, + "loss": 1.0658, + "step": 28629 + }, + { + "epoch": 0.86, + "learning_rate": 2.4390182956234324e-07, + "loss": 1.2197, + "step": 28630 + }, + { + "epoch": 0.86, + "learning_rate": 2.4379675537498094e-07, + "loss": 1.1722, + "step": 28631 + }, + { + "epoch": 0.86, + "learning_rate": 2.436917026655866e-07, + "loss": 1.0649, + "step": 28632 + }, + { + "epoch": 0.86, + "learning_rate": 2.435866714351609e-07, + "loss": 1.1273, + "step": 28633 + }, + { + "epoch": 0.86, + "learning_rate": 2.4348166168470326e-07, + "loss": 1.0483, + "step": 28634 + }, + { + "epoch": 0.86, + "learning_rate": 2.433766734152132e-07, + "loss": 1.0692, + "step": 28635 + }, + { + "epoch": 0.86, + "learning_rate": 2.43271706627691e-07, + "loss": 1.1028, + "step": 28636 + }, + { + "epoch": 0.86, + "learning_rate": 2.4316676132313505e-07, + "loss": 1.2136, + "step": 28637 + }, + { + "epoch": 0.86, + "learning_rate": 2.430618375025442e-07, + "loss": 1.1417, + "step": 28638 + }, + { + "epoch": 0.86, + "learning_rate": 2.429569351669181e-07, + "loss": 1.0448, + "step": 28639 + }, + { + "epoch": 0.86, + "learning_rate": 2.428520543172547e-07, + "loss": 1.0513, + "step": 28640 + }, + { + "epoch": 0.86, + "learning_rate": 2.427471949545526e-07, + "loss": 1.0771, + "step": 28641 + }, + { + "epoch": 0.86, + "learning_rate": 2.4264235707981e-07, + "loss": 1.1122, + "step": 28642 + }, + { + "epoch": 0.86, + "learning_rate": 2.4253754069402584e-07, + "loss": 1.0972, + "step": 28643 + }, + { + "epoch": 0.86, + "learning_rate": 2.424327457981962e-07, + "loss": 0.9922, + "step": 28644 + }, + { + "epoch": 0.86, + "learning_rate": 2.423279723933197e-07, + "loss": 1.111, + "step": 28645 + }, + { + "epoch": 0.86, + "learning_rate": 2.422232204803937e-07, + "loss": 1.0967, + "step": 28646 + }, + { + "epoch": 0.86, + "learning_rate": 2.4211849006041566e-07, + "loss": 1.1968, + "step": 28647 + }, + { + "epoch": 0.86, + "learning_rate": 2.4201378113438144e-07, + "loss": 1.0682, + "step": 28648 + }, + { + "epoch": 0.86, + "learning_rate": 2.4190909370328893e-07, + "loss": 1.1348, + "step": 28649 + }, + { + "epoch": 0.86, + "learning_rate": 2.418044277681342e-07, + "loss": 1.1682, + "step": 28650 + }, + { + "epoch": 0.86, + "learning_rate": 2.416997833299134e-07, + "loss": 1.087, + "step": 28651 + }, + { + "epoch": 0.86, + "learning_rate": 2.4159516038962384e-07, + "loss": 1.1534, + "step": 28652 + }, + { + "epoch": 0.86, + "learning_rate": 2.4149055894826025e-07, + "loss": 1.0519, + "step": 28653 + }, + { + "epoch": 0.86, + "learning_rate": 2.413859790068185e-07, + "loss": 1.1406, + "step": 28654 + }, + { + "epoch": 0.86, + "learning_rate": 2.4128142056629475e-07, + "loss": 1.1468, + "step": 28655 + }, + { + "epoch": 0.86, + "learning_rate": 2.4117688362768425e-07, + "loss": 1.1378, + "step": 28656 + }, + { + "epoch": 0.86, + "learning_rate": 2.410723681919816e-07, + "loss": 1.1376, + "step": 28657 + }, + { + "epoch": 0.86, + "learning_rate": 2.4096787426018204e-07, + "loss": 1.1607, + "step": 28658 + }, + { + "epoch": 0.86, + "learning_rate": 2.408634018332803e-07, + "loss": 1.0245, + "step": 28659 + }, + { + "epoch": 0.86, + "learning_rate": 2.4075895091227153e-07, + "loss": 1.1516, + "step": 28660 + }, + { + "epoch": 0.86, + "learning_rate": 2.406545214981487e-07, + "loss": 1.2324, + "step": 28661 + }, + { + "epoch": 0.86, + "learning_rate": 2.4055011359190695e-07, + "loss": 0.9018, + "step": 28662 + }, + { + "epoch": 0.86, + "learning_rate": 2.4044572719453983e-07, + "loss": 1.1736, + "step": 28663 + }, + { + "epoch": 0.86, + "learning_rate": 2.4034136230704135e-07, + "loss": 1.0226, + "step": 28664 + }, + { + "epoch": 0.86, + "learning_rate": 2.4023701893040457e-07, + "loss": 1.0149, + "step": 28665 + }, + { + "epoch": 0.86, + "learning_rate": 2.4013269706562315e-07, + "loss": 1.1005, + "step": 28666 + }, + { + "epoch": 0.86, + "learning_rate": 2.4002839671368986e-07, + "loss": 0.9942, + "step": 28667 + }, + { + "epoch": 0.86, + "learning_rate": 2.399241178755982e-07, + "loss": 1.1489, + "step": 28668 + }, + { + "epoch": 0.86, + "learning_rate": 2.398198605523405e-07, + "loss": 0.9997, + "step": 28669 + }, + { + "epoch": 0.86, + "learning_rate": 2.397156247449089e-07, + "loss": 1.2307, + "step": 28670 + }, + { + "epoch": 0.86, + "learning_rate": 2.39611410454296e-07, + "loss": 1.0488, + "step": 28671 + }, + { + "epoch": 0.86, + "learning_rate": 2.395072176814939e-07, + "loss": 1.1363, + "step": 28672 + }, + { + "epoch": 0.86, + "learning_rate": 2.3940304642749464e-07, + "loss": 1.1512, + "step": 28673 + }, + { + "epoch": 0.86, + "learning_rate": 2.3929889669328937e-07, + "loss": 1.1837, + "step": 28674 + }, + { + "epoch": 0.86, + "learning_rate": 2.3919476847986957e-07, + "loss": 1.0544, + "step": 28675 + }, + { + "epoch": 0.86, + "learning_rate": 2.3909066178822686e-07, + "loss": 1.0135, + "step": 28676 + }, + { + "epoch": 0.86, + "learning_rate": 2.389865766193522e-07, + "loss": 1.031, + "step": 28677 + }, + { + "epoch": 0.86, + "learning_rate": 2.38882512974237e-07, + "loss": 1.1035, + "step": 28678 + }, + { + "epoch": 0.86, + "learning_rate": 2.387784708538707e-07, + "loss": 0.9827, + "step": 28679 + }, + { + "epoch": 0.86, + "learning_rate": 2.386744502592442e-07, + "loss": 1.165, + "step": 28680 + }, + { + "epoch": 0.86, + "learning_rate": 2.385704511913478e-07, + "loss": 0.8938, + "step": 28681 + }, + { + "epoch": 0.86, + "learning_rate": 2.3846647365117215e-07, + "loss": 1.0792, + "step": 28682 + }, + { + "epoch": 0.86, + "learning_rate": 2.3836251763970615e-07, + "loss": 1.0455, + "step": 28683 + }, + { + "epoch": 0.86, + "learning_rate": 2.3825858315793955e-07, + "loss": 1.0938, + "step": 28684 + }, + { + "epoch": 0.86, + "learning_rate": 2.3815467020686212e-07, + "loss": 1.0325, + "step": 28685 + }, + { + "epoch": 0.86, + "learning_rate": 2.3805077878746309e-07, + "loss": 1.21, + "step": 28686 + }, + { + "epoch": 0.86, + "learning_rate": 2.379469089007308e-07, + "loss": 1.072, + "step": 28687 + }, + { + "epoch": 0.86, + "learning_rate": 2.3784306054765476e-07, + "loss": 1.2501, + "step": 28688 + }, + { + "epoch": 0.86, + "learning_rate": 2.3773923372922309e-07, + "loss": 1.1495, + "step": 28689 + }, + { + "epoch": 0.86, + "learning_rate": 2.376354284464244e-07, + "loss": 1.1067, + "step": 28690 + }, + { + "epoch": 0.86, + "learning_rate": 2.3753164470024708e-07, + "loss": 1.0325, + "step": 28691 + }, + { + "epoch": 0.86, + "learning_rate": 2.3742788249167843e-07, + "loss": 1.1736, + "step": 28692 + }, + { + "epoch": 0.86, + "learning_rate": 2.3732414182170706e-07, + "loss": 1.1755, + "step": 28693 + }, + { + "epoch": 0.86, + "learning_rate": 2.3722042269131994e-07, + "loss": 1.1508, + "step": 28694 + }, + { + "epoch": 0.86, + "learning_rate": 2.3711672510150496e-07, + "loss": 1.128, + "step": 28695 + }, + { + "epoch": 0.86, + "learning_rate": 2.370130490532485e-07, + "loss": 1.0274, + "step": 28696 + }, + { + "epoch": 0.86, + "learning_rate": 2.3690939454753813e-07, + "loss": 1.0201, + "step": 28697 + }, + { + "epoch": 0.86, + "learning_rate": 2.3680576158536e-07, + "loss": 1.1204, + "step": 28698 + }, + { + "epoch": 0.86, + "learning_rate": 2.3670215016770192e-07, + "loss": 1.2427, + "step": 28699 + }, + { + "epoch": 0.86, + "learning_rate": 2.3659856029554867e-07, + "loss": 1.2328, + "step": 28700 + }, + { + "epoch": 0.86, + "learning_rate": 2.3649499196988694e-07, + "loss": 1.0697, + "step": 28701 + }, + { + "epoch": 0.86, + "learning_rate": 2.3639144519170292e-07, + "loss": 1.0978, + "step": 28702 + }, + { + "epoch": 0.86, + "learning_rate": 2.3628791996198247e-07, + "loss": 1.1263, + "step": 28703 + }, + { + "epoch": 0.86, + "learning_rate": 2.3618441628171034e-07, + "loss": 1.0778, + "step": 28704 + }, + { + "epoch": 0.86, + "learning_rate": 2.3608093415187217e-07, + "loss": 1.0507, + "step": 28705 + }, + { + "epoch": 0.86, + "learning_rate": 2.3597747357345353e-07, + "loss": 1.1655, + "step": 28706 + }, + { + "epoch": 0.86, + "learning_rate": 2.3587403454743861e-07, + "loss": 1.1115, + "step": 28707 + }, + { + "epoch": 0.86, + "learning_rate": 2.357706170748131e-07, + "loss": 1.0076, + "step": 28708 + }, + { + "epoch": 0.86, + "learning_rate": 2.3566722115656027e-07, + "loss": 1.0914, + "step": 28709 + }, + { + "epoch": 0.86, + "learning_rate": 2.3556384679366495e-07, + "loss": 1.0997, + "step": 28710 + }, + { + "epoch": 0.86, + "learning_rate": 2.3546049398711108e-07, + "loss": 1.139, + "step": 28711 + }, + { + "epoch": 0.86, + "learning_rate": 2.353571627378834e-07, + "loss": 1.0941, + "step": 28712 + }, + { + "epoch": 0.86, + "learning_rate": 2.3525385304696418e-07, + "loss": 1.103, + "step": 28713 + }, + { + "epoch": 0.87, + "learning_rate": 2.3515056491533768e-07, + "loss": 1.1054, + "step": 28714 + }, + { + "epoch": 0.87, + "learning_rate": 2.3504729834398693e-07, + "loss": 1.1288, + "step": 28715 + }, + { + "epoch": 0.87, + "learning_rate": 2.349440533338951e-07, + "loss": 1.0039, + "step": 28716 + }, + { + "epoch": 0.87, + "learning_rate": 2.3484082988604495e-07, + "loss": 1.1566, + "step": 28717 + }, + { + "epoch": 0.87, + "learning_rate": 2.3473762800141965e-07, + "loss": 1.1799, + "step": 28718 + }, + { + "epoch": 0.87, + "learning_rate": 2.3463444768100085e-07, + "loss": 1.044, + "step": 28719 + }, + { + "epoch": 0.87, + "learning_rate": 2.3453128892577086e-07, + "loss": 1.1727, + "step": 28720 + }, + { + "epoch": 0.87, + "learning_rate": 2.3442815173671197e-07, + "loss": 1.0972, + "step": 28721 + }, + { + "epoch": 0.87, + "learning_rate": 2.3432503611480584e-07, + "loss": 1.0868, + "step": 28722 + }, + { + "epoch": 0.87, + "learning_rate": 2.3422194206103422e-07, + "loss": 1.0943, + "step": 28723 + }, + { + "epoch": 0.87, + "learning_rate": 2.3411886957637853e-07, + "loss": 1.2056, + "step": 28724 + }, + { + "epoch": 0.87, + "learning_rate": 2.3401581866182048e-07, + "loss": 1.2151, + "step": 28725 + }, + { + "epoch": 0.87, + "learning_rate": 2.3391278931833988e-07, + "loss": 1.0422, + "step": 28726 + }, + { + "epoch": 0.87, + "learning_rate": 2.3380978154691814e-07, + "loss": 1.11, + "step": 28727 + }, + { + "epoch": 0.87, + "learning_rate": 2.3370679534853586e-07, + "loss": 1.1339, + "step": 28728 + }, + { + "epoch": 0.87, + "learning_rate": 2.336038307241739e-07, + "loss": 1.1478, + "step": 28729 + }, + { + "epoch": 0.87, + "learning_rate": 2.3350088767481154e-07, + "loss": 1.0176, + "step": 28730 + }, + { + "epoch": 0.87, + "learning_rate": 2.3339796620142906e-07, + "loss": 1.1757, + "step": 28731 + }, + { + "epoch": 0.87, + "learning_rate": 2.3329506630500627e-07, + "loss": 1.0411, + "step": 28732 + }, + { + "epoch": 0.87, + "learning_rate": 2.3319218798652287e-07, + "loss": 1.0944, + "step": 28733 + }, + { + "epoch": 0.87, + "learning_rate": 2.3308933124695842e-07, + "loss": 1.1204, + "step": 28734 + }, + { + "epoch": 0.87, + "learning_rate": 2.3298649608729158e-07, + "loss": 1.1174, + "step": 28735 + }, + { + "epoch": 0.87, + "learning_rate": 2.3288368250850124e-07, + "loss": 1.1061, + "step": 28736 + }, + { + "epoch": 0.87, + "learning_rate": 2.327808905115664e-07, + "loss": 1.0472, + "step": 28737 + }, + { + "epoch": 0.87, + "learning_rate": 2.3267812009746594e-07, + "loss": 1.1151, + "step": 28738 + }, + { + "epoch": 0.87, + "learning_rate": 2.3257537126717743e-07, + "loss": 1.0582, + "step": 28739 + }, + { + "epoch": 0.87, + "learning_rate": 2.324726440216793e-07, + "loss": 1.1157, + "step": 28740 + }, + { + "epoch": 0.87, + "learning_rate": 2.323699383619496e-07, + "loss": 1.014, + "step": 28741 + }, + { + "epoch": 0.87, + "learning_rate": 2.3226725428896645e-07, + "loss": 1.1913, + "step": 28742 + }, + { + "epoch": 0.87, + "learning_rate": 2.3216459180370633e-07, + "loss": 1.1033, + "step": 28743 + }, + { + "epoch": 0.87, + "learning_rate": 2.3206195090714702e-07, + "loss": 1.2079, + "step": 28744 + }, + { + "epoch": 0.87, + "learning_rate": 2.3195933160026578e-07, + "loss": 1.1149, + "step": 28745 + }, + { + "epoch": 0.87, + "learning_rate": 2.318567338840394e-07, + "loss": 1.0829, + "step": 28746 + }, + { + "epoch": 0.87, + "learning_rate": 2.3175415775944427e-07, + "loss": 1.0875, + "step": 28747 + }, + { + "epoch": 0.87, + "learning_rate": 2.316516032274574e-07, + "loss": 1.0837, + "step": 28748 + }, + { + "epoch": 0.87, + "learning_rate": 2.3154907028905465e-07, + "loss": 1.0175, + "step": 28749 + }, + { + "epoch": 0.87, + "learning_rate": 2.3144655894521222e-07, + "loss": 1.0196, + "step": 28750 + }, + { + "epoch": 0.87, + "learning_rate": 2.3134406919690654e-07, + "loss": 1.0645, + "step": 28751 + }, + { + "epoch": 0.87, + "learning_rate": 2.312416010451121e-07, + "loss": 1.0547, + "step": 28752 + }, + { + "epoch": 0.87, + "learning_rate": 2.311391544908051e-07, + "loss": 1.2371, + "step": 28753 + }, + { + "epoch": 0.87, + "learning_rate": 2.3103672953496055e-07, + "loss": 1.1009, + "step": 28754 + }, + { + "epoch": 0.87, + "learning_rate": 2.3093432617855406e-07, + "loss": 1.1005, + "step": 28755 + }, + { + "epoch": 0.87, + "learning_rate": 2.3083194442255959e-07, + "loss": 1.1577, + "step": 28756 + }, + { + "epoch": 0.87, + "learning_rate": 2.3072958426795218e-07, + "loss": 1.1068, + "step": 28757 + }, + { + "epoch": 0.87, + "learning_rate": 2.3062724571570605e-07, + "loss": 1.0352, + "step": 28758 + }, + { + "epoch": 0.87, + "learning_rate": 2.3052492876679543e-07, + "loss": 1.1046, + "step": 28759 + }, + { + "epoch": 0.87, + "learning_rate": 2.3042263342219512e-07, + "loss": 1.0408, + "step": 28760 + }, + { + "epoch": 0.87, + "learning_rate": 2.303203596828779e-07, + "loss": 1.1553, + "step": 28761 + }, + { + "epoch": 0.87, + "learning_rate": 2.302181075498175e-07, + "loss": 1.1403, + "step": 28762 + }, + { + "epoch": 0.87, + "learning_rate": 2.301158770239878e-07, + "loss": 1.078, + "step": 28763 + }, + { + "epoch": 0.87, + "learning_rate": 2.3001366810636195e-07, + "loss": 1.1274, + "step": 28764 + }, + { + "epoch": 0.87, + "learning_rate": 2.2991148079791247e-07, + "loss": 1.1761, + "step": 28765 + }, + { + "epoch": 0.87, + "learning_rate": 2.2980931509961223e-07, + "loss": 1.015, + "step": 28766 + }, + { + "epoch": 0.87, + "learning_rate": 2.2970717101243406e-07, + "loss": 1.165, + "step": 28767 + }, + { + "epoch": 0.87, + "learning_rate": 2.2960504853735078e-07, + "loss": 1.1089, + "step": 28768 + }, + { + "epoch": 0.87, + "learning_rate": 2.2950294767533326e-07, + "loss": 1.0364, + "step": 28769 + }, + { + "epoch": 0.87, + "learning_rate": 2.2940086842735438e-07, + "loss": 1.0343, + "step": 28770 + }, + { + "epoch": 0.87, + "learning_rate": 2.2929881079438553e-07, + "loss": 1.0357, + "step": 28771 + }, + { + "epoch": 0.87, + "learning_rate": 2.2919677477739822e-07, + "loss": 1.067, + "step": 28772 + }, + { + "epoch": 0.87, + "learning_rate": 2.2909476037736438e-07, + "loss": 1.2322, + "step": 28773 + }, + { + "epoch": 0.87, + "learning_rate": 2.289927675952544e-07, + "loss": 1.051, + "step": 28774 + }, + { + "epoch": 0.87, + "learning_rate": 2.288907964320397e-07, + "loss": 1.0658, + "step": 28775 + }, + { + "epoch": 0.87, + "learning_rate": 2.2878884688869063e-07, + "loss": 1.1498, + "step": 28776 + }, + { + "epoch": 0.87, + "learning_rate": 2.2868691896617862e-07, + "loss": 1.0165, + "step": 28777 + }, + { + "epoch": 0.87, + "learning_rate": 2.2858501266547262e-07, + "loss": 1.0657, + "step": 28778 + }, + { + "epoch": 0.87, + "learning_rate": 2.2848312798754325e-07, + "loss": 1.205, + "step": 28779 + }, + { + "epoch": 0.87, + "learning_rate": 2.2838126493336055e-07, + "loss": 1.142, + "step": 28780 + }, + { + "epoch": 0.87, + "learning_rate": 2.2827942350389458e-07, + "loss": 1.1921, + "step": 28781 + }, + { + "epoch": 0.87, + "learning_rate": 2.2817760370011406e-07, + "loss": 1.1316, + "step": 28782 + }, + { + "epoch": 0.87, + "learning_rate": 2.2807580552298868e-07, + "loss": 1.1602, + "step": 28783 + }, + { + "epoch": 0.87, + "learning_rate": 2.279740289734872e-07, + "loss": 1.0093, + "step": 28784 + }, + { + "epoch": 0.87, + "learning_rate": 2.2787227405257878e-07, + "loss": 1.1603, + "step": 28785 + }, + { + "epoch": 0.87, + "learning_rate": 2.2777054076123267e-07, + "loss": 1.2377, + "step": 28786 + }, + { + "epoch": 0.87, + "learning_rate": 2.2766882910041617e-07, + "loss": 1.1415, + "step": 28787 + }, + { + "epoch": 0.87, + "learning_rate": 2.275671390710979e-07, + "loss": 1.202, + "step": 28788 + }, + { + "epoch": 0.87, + "learning_rate": 2.2746547067424602e-07, + "loss": 1.0201, + "step": 28789 + }, + { + "epoch": 0.87, + "learning_rate": 2.273638239108289e-07, + "loss": 0.9269, + "step": 28790 + }, + { + "epoch": 0.87, + "learning_rate": 2.27262198781813e-07, + "loss": 1.0402, + "step": 28791 + }, + { + "epoch": 0.87, + "learning_rate": 2.271605952881667e-07, + "loss": 1.1219, + "step": 28792 + }, + { + "epoch": 0.87, + "learning_rate": 2.2705901343085674e-07, + "loss": 1.2167, + "step": 28793 + }, + { + "epoch": 0.87, + "learning_rate": 2.2695745321085066e-07, + "loss": 1.2034, + "step": 28794 + }, + { + "epoch": 0.87, + "learning_rate": 2.2685591462911438e-07, + "loss": 0.9753, + "step": 28795 + }, + { + "epoch": 0.87, + "learning_rate": 2.2675439768661518e-07, + "loss": 1.1408, + "step": 28796 + }, + { + "epoch": 0.87, + "learning_rate": 2.266529023843192e-07, + "loss": 1.2253, + "step": 28797 + }, + { + "epoch": 0.87, + "learning_rate": 2.265514287231929e-07, + "loss": 1.121, + "step": 28798 + }, + { + "epoch": 0.87, + "learning_rate": 2.2644997670420166e-07, + "loss": 1.1177, + "step": 28799 + }, + { + "epoch": 0.87, + "learning_rate": 2.2634854632831244e-07, + "loss": 1.0355, + "step": 28800 + }, + { + "epoch": 0.87, + "learning_rate": 2.2624713759648946e-07, + "loss": 1.0837, + "step": 28801 + }, + { + "epoch": 0.87, + "learning_rate": 2.2614575050969867e-07, + "loss": 1.1416, + "step": 28802 + }, + { + "epoch": 0.87, + "learning_rate": 2.2604438506890537e-07, + "loss": 1.1082, + "step": 28803 + }, + { + "epoch": 0.87, + "learning_rate": 2.2594304127507405e-07, + "loss": 1.2045, + "step": 28804 + }, + { + "epoch": 0.87, + "learning_rate": 2.2584171912917007e-07, + "loss": 1.2551, + "step": 28805 + }, + { + "epoch": 0.87, + "learning_rate": 2.257404186321574e-07, + "loss": 1.0815, + "step": 28806 + }, + { + "epoch": 0.87, + "learning_rate": 2.2563913978500134e-07, + "loss": 1.05, + "step": 28807 + }, + { + "epoch": 0.87, + "learning_rate": 2.2553788258866449e-07, + "loss": 1.0508, + "step": 28808 + }, + { + "epoch": 0.87, + "learning_rate": 2.2543664704411189e-07, + "loss": 1.0503, + "step": 28809 + }, + { + "epoch": 0.87, + "learning_rate": 2.2533543315230667e-07, + "loss": 1.1309, + "step": 28810 + }, + { + "epoch": 0.87, + "learning_rate": 2.2523424091421276e-07, + "loss": 1.2467, + "step": 28811 + }, + { + "epoch": 0.87, + "learning_rate": 2.2513307033079384e-07, + "loss": 1.146, + "step": 28812 + }, + { + "epoch": 0.87, + "learning_rate": 2.2503192140301195e-07, + "loss": 1.0705, + "step": 28813 + }, + { + "epoch": 0.87, + "learning_rate": 2.2493079413183045e-07, + "loss": 1.0713, + "step": 28814 + }, + { + "epoch": 0.87, + "learning_rate": 2.2482968851821218e-07, + "loss": 1.1244, + "step": 28815 + }, + { + "epoch": 0.87, + "learning_rate": 2.2472860456312002e-07, + "loss": 1.0917, + "step": 28816 + }, + { + "epoch": 0.87, + "learning_rate": 2.246275422675151e-07, + "loss": 1.2612, + "step": 28817 + }, + { + "epoch": 0.87, + "learning_rate": 2.2452650163236028e-07, + "loss": 1.1668, + "step": 28818 + }, + { + "epoch": 0.87, + "learning_rate": 2.2442548265861703e-07, + "loss": 1.0222, + "step": 28819 + }, + { + "epoch": 0.87, + "learning_rate": 2.2432448534724788e-07, + "loss": 1.0445, + "step": 28820 + }, + { + "epoch": 0.87, + "learning_rate": 2.2422350969921318e-07, + "loss": 1.1361, + "step": 28821 + }, + { + "epoch": 0.87, + "learning_rate": 2.241225557154747e-07, + "loss": 1.1389, + "step": 28822 + }, + { + "epoch": 0.87, + "learning_rate": 2.2402162339699301e-07, + "loss": 1.1438, + "step": 28823 + }, + { + "epoch": 0.87, + "learning_rate": 2.239207127447296e-07, + "loss": 1.3439, + "step": 28824 + }, + { + "epoch": 0.87, + "learning_rate": 2.2381982375964535e-07, + "loss": 1.084, + "step": 28825 + }, + { + "epoch": 0.87, + "learning_rate": 2.2371895644269949e-07, + "loss": 1.122, + "step": 28826 + }, + { + "epoch": 0.87, + "learning_rate": 2.236181107948529e-07, + "loss": 1.0462, + "step": 28827 + }, + { + "epoch": 0.87, + "learning_rate": 2.235172868170657e-07, + "loss": 1.0754, + "step": 28828 + }, + { + "epoch": 0.87, + "learning_rate": 2.2341648451029736e-07, + "loss": 1.0934, + "step": 28829 + }, + { + "epoch": 0.87, + "learning_rate": 2.2331570387550767e-07, + "loss": 1.1927, + "step": 28830 + }, + { + "epoch": 0.87, + "learning_rate": 2.2321494491365615e-07, + "loss": 1.1276, + "step": 28831 + }, + { + "epoch": 0.87, + "learning_rate": 2.2311420762570173e-07, + "loss": 1.1649, + "step": 28832 + }, + { + "epoch": 0.87, + "learning_rate": 2.230134920126037e-07, + "loss": 1.1422, + "step": 28833 + }, + { + "epoch": 0.87, + "learning_rate": 2.229127980753204e-07, + "loss": 1.0231, + "step": 28834 + }, + { + "epoch": 0.87, + "learning_rate": 2.2281212581481054e-07, + "loss": 1.027, + "step": 28835 + }, + { + "epoch": 0.87, + "learning_rate": 2.2271147523203252e-07, + "loss": 1.1135, + "step": 28836 + }, + { + "epoch": 0.87, + "learning_rate": 2.2261084632794445e-07, + "loss": 1.1494, + "step": 28837 + }, + { + "epoch": 0.87, + "learning_rate": 2.2251023910350472e-07, + "loss": 0.9831, + "step": 28838 + }, + { + "epoch": 0.87, + "learning_rate": 2.224096535596701e-07, + "loss": 1.1188, + "step": 28839 + }, + { + "epoch": 0.87, + "learning_rate": 2.2230908969739866e-07, + "loss": 1.1501, + "step": 28840 + }, + { + "epoch": 0.87, + "learning_rate": 2.2220854751764804e-07, + "loss": 1.1275, + "step": 28841 + }, + { + "epoch": 0.87, + "learning_rate": 2.2210802702137518e-07, + "loss": 1.093, + "step": 28842 + }, + { + "epoch": 0.87, + "learning_rate": 2.220075282095363e-07, + "loss": 1.1389, + "step": 28843 + }, + { + "epoch": 0.87, + "learning_rate": 2.2190705108308896e-07, + "loss": 1.179, + "step": 28844 + }, + { + "epoch": 0.87, + "learning_rate": 2.2180659564298907e-07, + "loss": 1.0952, + "step": 28845 + }, + { + "epoch": 0.87, + "learning_rate": 2.217061618901936e-07, + "loss": 1.2311, + "step": 28846 + }, + { + "epoch": 0.87, + "learning_rate": 2.2160574982565796e-07, + "loss": 1.1136, + "step": 28847 + }, + { + "epoch": 0.87, + "learning_rate": 2.21505359450338e-07, + "loss": 1.1458, + "step": 28848 + }, + { + "epoch": 0.87, + "learning_rate": 2.2140499076518996e-07, + "loss": 1.1029, + "step": 28849 + }, + { + "epoch": 0.87, + "learning_rate": 2.2130464377116885e-07, + "loss": 1.0493, + "step": 28850 + }, + { + "epoch": 0.87, + "learning_rate": 2.2120431846923057e-07, + "loss": 1.0488, + "step": 28851 + }, + { + "epoch": 0.87, + "learning_rate": 2.2110401486032913e-07, + "loss": 1.0942, + "step": 28852 + }, + { + "epoch": 0.87, + "learning_rate": 2.210037329454198e-07, + "loss": 1.073, + "step": 28853 + }, + { + "epoch": 0.87, + "learning_rate": 2.2090347272545775e-07, + "loss": 1.1541, + "step": 28854 + }, + { + "epoch": 0.87, + "learning_rate": 2.208032342013966e-07, + "loss": 1.0676, + "step": 28855 + }, + { + "epoch": 0.87, + "learning_rate": 2.2070301737419115e-07, + "loss": 1.303, + "step": 28856 + }, + { + "epoch": 0.87, + "learning_rate": 2.2060282224479506e-07, + "loss": 1.1943, + "step": 28857 + }, + { + "epoch": 0.87, + "learning_rate": 2.205026488141626e-07, + "loss": 1.174, + "step": 28858 + }, + { + "epoch": 0.87, + "learning_rate": 2.2040249708324719e-07, + "loss": 1.109, + "step": 28859 + }, + { + "epoch": 0.87, + "learning_rate": 2.2030236705300189e-07, + "loss": 1.1216, + "step": 28860 + }, + { + "epoch": 0.87, + "learning_rate": 2.202022587243799e-07, + "loss": 1.147, + "step": 28861 + }, + { + "epoch": 0.87, + "learning_rate": 2.2010217209833455e-07, + "loss": 1.097, + "step": 28862 + }, + { + "epoch": 0.87, + "learning_rate": 2.2000210717581877e-07, + "loss": 1.0742, + "step": 28863 + }, + { + "epoch": 0.87, + "learning_rate": 2.199020639577848e-07, + "loss": 1.0415, + "step": 28864 + }, + { + "epoch": 0.87, + "learning_rate": 2.1980204244518494e-07, + "loss": 1.1052, + "step": 28865 + }, + { + "epoch": 0.87, + "learning_rate": 2.1970204263897123e-07, + "loss": 1.0735, + "step": 28866 + }, + { + "epoch": 0.87, + "learning_rate": 2.196020645400962e-07, + "loss": 1.1436, + "step": 28867 + }, + { + "epoch": 0.87, + "learning_rate": 2.1950210814951134e-07, + "loss": 1.0672, + "step": 28868 + }, + { + "epoch": 0.87, + "learning_rate": 2.1940217346816783e-07, + "loss": 1.0139, + "step": 28869 + }, + { + "epoch": 0.87, + "learning_rate": 2.1930226049701713e-07, + "loss": 1.1146, + "step": 28870 + }, + { + "epoch": 0.87, + "learning_rate": 2.1920236923701043e-07, + "loss": 1.0544, + "step": 28871 + }, + { + "epoch": 0.87, + "learning_rate": 2.191024996890992e-07, + "loss": 0.9909, + "step": 28872 + }, + { + "epoch": 0.87, + "learning_rate": 2.190026518542332e-07, + "loss": 1.0173, + "step": 28873 + }, + { + "epoch": 0.87, + "learning_rate": 2.1890282573336363e-07, + "loss": 1.1871, + "step": 28874 + }, + { + "epoch": 0.87, + "learning_rate": 2.188030213274403e-07, + "loss": 1.0359, + "step": 28875 + }, + { + "epoch": 0.87, + "learning_rate": 2.1870323863741412e-07, + "loss": 1.1055, + "step": 28876 + }, + { + "epoch": 0.87, + "learning_rate": 2.1860347766423373e-07, + "loss": 1.0577, + "step": 28877 + }, + { + "epoch": 0.87, + "learning_rate": 2.1850373840884982e-07, + "loss": 1.1497, + "step": 28878 + }, + { + "epoch": 0.87, + "learning_rate": 2.184040208722113e-07, + "loss": 1.164, + "step": 28879 + }, + { + "epoch": 0.87, + "learning_rate": 2.1830432505526745e-07, + "loss": 1.0616, + "step": 28880 + }, + { + "epoch": 0.87, + "learning_rate": 2.1820465095896776e-07, + "loss": 1.1013, + "step": 28881 + }, + { + "epoch": 0.87, + "learning_rate": 2.1810499858426093e-07, + "loss": 1.0769, + "step": 28882 + }, + { + "epoch": 0.87, + "learning_rate": 2.1800536793209592e-07, + "loss": 1.0161, + "step": 28883 + }, + { + "epoch": 0.87, + "learning_rate": 2.1790575900342005e-07, + "loss": 1.1913, + "step": 28884 + }, + { + "epoch": 0.87, + "learning_rate": 2.1780617179918252e-07, + "loss": 1.0048, + "step": 28885 + }, + { + "epoch": 0.87, + "learning_rate": 2.177066063203312e-07, + "loss": 1.1532, + "step": 28886 + }, + { + "epoch": 0.87, + "learning_rate": 2.176070625678134e-07, + "loss": 1.0762, + "step": 28887 + }, + { + "epoch": 0.87, + "learning_rate": 2.175075405425775e-07, + "loss": 1.0271, + "step": 28888 + }, + { + "epoch": 0.87, + "learning_rate": 2.1740804024557084e-07, + "loss": 1.017, + "step": 28889 + }, + { + "epoch": 0.87, + "learning_rate": 2.1730856167773983e-07, + "loss": 1.0391, + "step": 28890 + }, + { + "epoch": 0.87, + "learning_rate": 2.1720910484003183e-07, + "loss": 1.0609, + "step": 28891 + }, + { + "epoch": 0.87, + "learning_rate": 2.1710966973339382e-07, + "loss": 1.0768, + "step": 28892 + }, + { + "epoch": 0.87, + "learning_rate": 2.1701025635877228e-07, + "loss": 1.0623, + "step": 28893 + }, + { + "epoch": 0.87, + "learning_rate": 2.169108647171142e-07, + "loss": 1.1201, + "step": 28894 + }, + { + "epoch": 0.87, + "learning_rate": 2.1681149480936443e-07, + "loss": 0.9984, + "step": 28895 + }, + { + "epoch": 0.87, + "learning_rate": 2.1671214663646968e-07, + "loss": 1.1693, + "step": 28896 + }, + { + "epoch": 0.87, + "learning_rate": 2.1661282019937559e-07, + "loss": 1.0993, + "step": 28897 + }, + { + "epoch": 0.87, + "learning_rate": 2.1651351549902834e-07, + "loss": 1.0643, + "step": 28898 + }, + { + "epoch": 0.87, + "learning_rate": 2.164142325363719e-07, + "loss": 1.2066, + "step": 28899 + }, + { + "epoch": 0.87, + "learning_rate": 2.1631497131235247e-07, + "loss": 1.1639, + "step": 28900 + }, + { + "epoch": 0.87, + "learning_rate": 2.1621573182791455e-07, + "loss": 1.0085, + "step": 28901 + }, + { + "epoch": 0.87, + "learning_rate": 2.1611651408400326e-07, + "loss": 0.9636, + "step": 28902 + }, + { + "epoch": 0.87, + "learning_rate": 2.160173180815625e-07, + "loss": 1.0623, + "step": 28903 + }, + { + "epoch": 0.87, + "learning_rate": 2.1591814382153686e-07, + "loss": 1.043, + "step": 28904 + }, + { + "epoch": 0.87, + "learning_rate": 2.1581899130487056e-07, + "loss": 1.073, + "step": 28905 + }, + { + "epoch": 0.87, + "learning_rate": 2.1571986053250698e-07, + "loss": 1.0797, + "step": 28906 + }, + { + "epoch": 0.87, + "learning_rate": 2.1562075150539096e-07, + "loss": 0.9639, + "step": 28907 + }, + { + "epoch": 0.87, + "learning_rate": 2.155216642244648e-07, + "loss": 1.0383, + "step": 28908 + }, + { + "epoch": 0.87, + "learning_rate": 2.154225986906719e-07, + "loss": 1.0345, + "step": 28909 + }, + { + "epoch": 0.87, + "learning_rate": 2.1532355490495565e-07, + "loss": 1.0988, + "step": 28910 + }, + { + "epoch": 0.87, + "learning_rate": 2.1522453286825895e-07, + "loss": 1.1346, + "step": 28911 + }, + { + "epoch": 0.87, + "learning_rate": 2.1512553258152408e-07, + "loss": 1.1629, + "step": 28912 + }, + { + "epoch": 0.87, + "learning_rate": 2.150265540456939e-07, + "loss": 1.0927, + "step": 28913 + }, + { + "epoch": 0.87, + "learning_rate": 2.1492759726171041e-07, + "loss": 1.045, + "step": 28914 + }, + { + "epoch": 0.87, + "learning_rate": 2.1482866223051596e-07, + "loss": 1.002, + "step": 28915 + }, + { + "epoch": 0.87, + "learning_rate": 2.147297489530517e-07, + "loss": 1.0363, + "step": 28916 + }, + { + "epoch": 0.87, + "learning_rate": 2.146308574302597e-07, + "loss": 1.0659, + "step": 28917 + }, + { + "epoch": 0.87, + "learning_rate": 2.1453198766308136e-07, + "loss": 1.1268, + "step": 28918 + }, + { + "epoch": 0.87, + "learning_rate": 2.1443313965245765e-07, + "loss": 1.0746, + "step": 28919 + }, + { + "epoch": 0.87, + "learning_rate": 2.1433431339933002e-07, + "loss": 0.9622, + "step": 28920 + }, + { + "epoch": 0.87, + "learning_rate": 2.1423550890463857e-07, + "loss": 1.0661, + "step": 28921 + }, + { + "epoch": 0.87, + "learning_rate": 2.1413672616932418e-07, + "loss": 1.1349, + "step": 28922 + }, + { + "epoch": 0.87, + "learning_rate": 2.1403796519432723e-07, + "loss": 1.2272, + "step": 28923 + }, + { + "epoch": 0.87, + "learning_rate": 2.1393922598058835e-07, + "loss": 1.1762, + "step": 28924 + }, + { + "epoch": 0.87, + "learning_rate": 2.1384050852904654e-07, + "loss": 1.1559, + "step": 28925 + }, + { + "epoch": 0.87, + "learning_rate": 2.137418128406421e-07, + "loss": 1.1998, + "step": 28926 + }, + { + "epoch": 0.87, + "learning_rate": 2.136431389163146e-07, + "loss": 1.0995, + "step": 28927 + }, + { + "epoch": 0.87, + "learning_rate": 2.1354448675700357e-07, + "loss": 1.0968, + "step": 28928 + }, + { + "epoch": 0.87, + "learning_rate": 2.1344585636364768e-07, + "loss": 1.0516, + "step": 28929 + }, + { + "epoch": 0.87, + "learning_rate": 2.1334724773718562e-07, + "loss": 1.0911, + "step": 28930 + }, + { + "epoch": 0.87, + "learning_rate": 2.1324866087855667e-07, + "loss": 1.0668, + "step": 28931 + }, + { + "epoch": 0.87, + "learning_rate": 2.1315009578869895e-07, + "loss": 1.0982, + "step": 28932 + }, + { + "epoch": 0.87, + "learning_rate": 2.130515524685517e-07, + "loss": 1.102, + "step": 28933 + }, + { + "epoch": 0.87, + "learning_rate": 2.1295303091905139e-07, + "loss": 0.9312, + "step": 28934 + }, + { + "epoch": 0.87, + "learning_rate": 2.1285453114113703e-07, + "loss": 1.0615, + "step": 28935 + }, + { + "epoch": 0.87, + "learning_rate": 2.1275605313574588e-07, + "loss": 1.1033, + "step": 28936 + }, + { + "epoch": 0.87, + "learning_rate": 2.1265759690381554e-07, + "loss": 1.127, + "step": 28937 + }, + { + "epoch": 0.87, + "learning_rate": 2.1255916244628334e-07, + "loss": 0.9957, + "step": 28938 + }, + { + "epoch": 0.87, + "learning_rate": 2.1246074976408627e-07, + "loss": 1.1282, + "step": 28939 + }, + { + "epoch": 0.87, + "learning_rate": 2.123623588581611e-07, + "loss": 1.0359, + "step": 28940 + }, + { + "epoch": 0.87, + "learning_rate": 2.1226398972944483e-07, + "loss": 1.1329, + "step": 28941 + }, + { + "epoch": 0.87, + "learning_rate": 2.1216564237887317e-07, + "loss": 1.0503, + "step": 28942 + }, + { + "epoch": 0.87, + "learning_rate": 2.120673168073828e-07, + "loss": 1.1833, + "step": 28943 + }, + { + "epoch": 0.87, + "learning_rate": 2.1196901301590967e-07, + "loss": 1.092, + "step": 28944 + }, + { + "epoch": 0.87, + "learning_rate": 2.1187073100538968e-07, + "loss": 1.0991, + "step": 28945 + }, + { + "epoch": 0.87, + "learning_rate": 2.117724707767588e-07, + "loss": 1.1213, + "step": 28946 + }, + { + "epoch": 0.87, + "learning_rate": 2.116742323309512e-07, + "loss": 0.9972, + "step": 28947 + }, + { + "epoch": 0.87, + "learning_rate": 2.1157601566890313e-07, + "loss": 1.1886, + "step": 28948 + }, + { + "epoch": 0.87, + "learning_rate": 2.1147782079154884e-07, + "loss": 1.1655, + "step": 28949 + }, + { + "epoch": 0.87, + "learning_rate": 2.1137964769982423e-07, + "loss": 1.0785, + "step": 28950 + }, + { + "epoch": 0.87, + "learning_rate": 2.1128149639466272e-07, + "loss": 0.9708, + "step": 28951 + }, + { + "epoch": 0.87, + "learning_rate": 2.1118336687699914e-07, + "loss": 1.057, + "step": 28952 + }, + { + "epoch": 0.87, + "learning_rate": 2.1108525914776744e-07, + "loss": 1.0704, + "step": 28953 + }, + { + "epoch": 0.87, + "learning_rate": 2.1098717320790217e-07, + "loss": 1.1014, + "step": 28954 + }, + { + "epoch": 0.87, + "learning_rate": 2.108891090583362e-07, + "loss": 1.2323, + "step": 28955 + }, + { + "epoch": 0.87, + "learning_rate": 2.1079106670000322e-07, + "loss": 1.1669, + "step": 28956 + }, + { + "epoch": 0.87, + "learning_rate": 2.106930461338369e-07, + "loss": 1.0175, + "step": 28957 + }, + { + "epoch": 0.87, + "learning_rate": 2.1059504736077042e-07, + "loss": 1.0909, + "step": 28958 + }, + { + "epoch": 0.87, + "learning_rate": 2.1049707038173662e-07, + "loss": 1.0565, + "step": 28959 + }, + { + "epoch": 0.87, + "learning_rate": 2.1039911519766781e-07, + "loss": 1.1554, + "step": 28960 + }, + { + "epoch": 0.87, + "learning_rate": 2.103011818094966e-07, + "loss": 1.1474, + "step": 28961 + }, + { + "epoch": 0.87, + "learning_rate": 2.102032702181553e-07, + "loss": 1.0645, + "step": 28962 + }, + { + "epoch": 0.87, + "learning_rate": 2.1010538042457618e-07, + "loss": 1.0691, + "step": 28963 + }, + { + "epoch": 0.87, + "learning_rate": 2.1000751242969104e-07, + "loss": 1.1806, + "step": 28964 + }, + { + "epoch": 0.87, + "learning_rate": 2.0990966623443186e-07, + "loss": 1.158, + "step": 28965 + }, + { + "epoch": 0.87, + "learning_rate": 2.098118418397291e-07, + "loss": 1.0591, + "step": 28966 + }, + { + "epoch": 0.87, + "learning_rate": 2.0971403924651497e-07, + "loss": 1.1184, + "step": 28967 + }, + { + "epoch": 0.87, + "learning_rate": 2.0961625845571987e-07, + "loss": 0.9332, + "step": 28968 + }, + { + "epoch": 0.87, + "learning_rate": 2.09518499468275e-07, + "loss": 1.1124, + "step": 28969 + }, + { + "epoch": 0.87, + "learning_rate": 2.0942076228511078e-07, + "loss": 1.0573, + "step": 28970 + }, + { + "epoch": 0.87, + "learning_rate": 2.0932304690715776e-07, + "loss": 1.1543, + "step": 28971 + }, + { + "epoch": 0.87, + "learning_rate": 2.0922535333534665e-07, + "loss": 1.0274, + "step": 28972 + }, + { + "epoch": 0.87, + "learning_rate": 2.0912768157060642e-07, + "loss": 1.1255, + "step": 28973 + }, + { + "epoch": 0.87, + "learning_rate": 2.0903003161386743e-07, + "loss": 1.1557, + "step": 28974 + }, + { + "epoch": 0.87, + "learning_rate": 2.0893240346605893e-07, + "loss": 1.1949, + "step": 28975 + }, + { + "epoch": 0.87, + "learning_rate": 2.08834797128111e-07, + "loss": 1.079, + "step": 28976 + }, + { + "epoch": 0.87, + "learning_rate": 2.087372126009521e-07, + "loss": 1.1887, + "step": 28977 + }, + { + "epoch": 0.87, + "learning_rate": 2.0863964988551145e-07, + "loss": 1.0743, + "step": 28978 + }, + { + "epoch": 0.87, + "learning_rate": 2.0854210898271747e-07, + "loss": 0.9619, + "step": 28979 + }, + { + "epoch": 0.87, + "learning_rate": 2.0844458989349975e-07, + "loss": 1.2153, + "step": 28980 + }, + { + "epoch": 0.87, + "learning_rate": 2.0834709261878528e-07, + "loss": 0.9564, + "step": 28981 + }, + { + "epoch": 0.87, + "learning_rate": 2.0824961715950275e-07, + "loss": 1.1306, + "step": 28982 + }, + { + "epoch": 0.87, + "learning_rate": 2.0815216351658036e-07, + "loss": 1.032, + "step": 28983 + }, + { + "epoch": 0.87, + "learning_rate": 2.0805473169094536e-07, + "loss": 1.0384, + "step": 28984 + }, + { + "epoch": 0.87, + "learning_rate": 2.0795732168352596e-07, + "loss": 1.0744, + "step": 28985 + }, + { + "epoch": 0.87, + "learning_rate": 2.0785993349524858e-07, + "loss": 1.1265, + "step": 28986 + }, + { + "epoch": 0.87, + "learning_rate": 2.0776256712704086e-07, + "loss": 0.9879, + "step": 28987 + }, + { + "epoch": 0.87, + "learning_rate": 2.0766522257982924e-07, + "loss": 1.0482, + "step": 28988 + }, + { + "epoch": 0.87, + "learning_rate": 2.0756789985454134e-07, + "loss": 1.158, + "step": 28989 + }, + { + "epoch": 0.87, + "learning_rate": 2.0747059895210227e-07, + "loss": 1.1069, + "step": 28990 + }, + { + "epoch": 0.87, + "learning_rate": 2.07373319873439e-07, + "loss": 1.2102, + "step": 28991 + }, + { + "epoch": 0.87, + "learning_rate": 2.072760626194778e-07, + "loss": 1.0715, + "step": 28992 + }, + { + "epoch": 0.87, + "learning_rate": 2.07178827191144e-07, + "loss": 1.0329, + "step": 28993 + }, + { + "epoch": 0.87, + "learning_rate": 2.0708161358936386e-07, + "loss": 1.0553, + "step": 28994 + }, + { + "epoch": 0.87, + "learning_rate": 2.0698442181506213e-07, + "loss": 1.0875, + "step": 28995 + }, + { + "epoch": 0.87, + "learning_rate": 2.0688725186916446e-07, + "loss": 1.0947, + "step": 28996 + }, + { + "epoch": 0.87, + "learning_rate": 2.0679010375259573e-07, + "loss": 0.9984, + "step": 28997 + }, + { + "epoch": 0.87, + "learning_rate": 2.0669297746628124e-07, + "loss": 1.1112, + "step": 28998 + }, + { + "epoch": 0.87, + "learning_rate": 2.0659587301114475e-07, + "loss": 1.2148, + "step": 28999 + }, + { + "epoch": 0.87, + "learning_rate": 2.0649879038811077e-07, + "loss": 1.2285, + "step": 29000 + }, + { + "epoch": 0.87, + "learning_rate": 2.0640172959810383e-07, + "loss": 1.0502, + "step": 29001 + }, + { + "epoch": 0.87, + "learning_rate": 2.0630469064204823e-07, + "loss": 1.1325, + "step": 29002 + }, + { + "epoch": 0.87, + "learning_rate": 2.0620767352086679e-07, + "loss": 1.1202, + "step": 29003 + }, + { + "epoch": 0.87, + "learning_rate": 2.061106782354838e-07, + "loss": 1.126, + "step": 29004 + }, + { + "epoch": 0.87, + "learning_rate": 2.0601370478682213e-07, + "loss": 1.0898, + "step": 29005 + }, + { + "epoch": 0.87, + "learning_rate": 2.0591675317580577e-07, + "loss": 1.0521, + "step": 29006 + }, + { + "epoch": 0.87, + "learning_rate": 2.058198234033565e-07, + "loss": 0.991, + "step": 29007 + }, + { + "epoch": 0.87, + "learning_rate": 2.057229154703977e-07, + "loss": 1.0566, + "step": 29008 + }, + { + "epoch": 0.87, + "learning_rate": 2.056260293778517e-07, + "loss": 1.1497, + "step": 29009 + }, + { + "epoch": 0.87, + "learning_rate": 2.0552916512664085e-07, + "loss": 1.0731, + "step": 29010 + }, + { + "epoch": 0.87, + "learning_rate": 2.0543232271768798e-07, + "loss": 1.1406, + "step": 29011 + }, + { + "epoch": 0.87, + "learning_rate": 2.053355021519135e-07, + "loss": 1.1447, + "step": 29012 + }, + { + "epoch": 0.87, + "learning_rate": 2.0523870343024028e-07, + "loss": 1.1575, + "step": 29013 + }, + { + "epoch": 0.87, + "learning_rate": 2.0514192655358923e-07, + "loss": 1.098, + "step": 29014 + }, + { + "epoch": 0.87, + "learning_rate": 2.0504517152288213e-07, + "loss": 1.1189, + "step": 29015 + }, + { + "epoch": 0.87, + "learning_rate": 2.0494843833903933e-07, + "loss": 1.0839, + "step": 29016 + }, + { + "epoch": 0.87, + "learning_rate": 2.0485172700298206e-07, + "loss": 1.0474, + "step": 29017 + }, + { + "epoch": 0.87, + "learning_rate": 2.0475503751563097e-07, + "loss": 1.0663, + "step": 29018 + }, + { + "epoch": 0.87, + "learning_rate": 2.0465836987790644e-07, + "loss": 1.0383, + "step": 29019 + }, + { + "epoch": 0.87, + "learning_rate": 2.0456172409072883e-07, + "loss": 1.1407, + "step": 29020 + }, + { + "epoch": 0.87, + "learning_rate": 2.0446510015501824e-07, + "loss": 1.1193, + "step": 29021 + }, + { + "epoch": 0.87, + "learning_rate": 2.0436849807169422e-07, + "loss": 1.0176, + "step": 29022 + }, + { + "epoch": 0.87, + "learning_rate": 2.0427191784167632e-07, + "loss": 0.9821, + "step": 29023 + }, + { + "epoch": 0.87, + "learning_rate": 2.0417535946588463e-07, + "loss": 1.1785, + "step": 29024 + }, + { + "epoch": 0.87, + "learning_rate": 2.0407882294523758e-07, + "loss": 1.0119, + "step": 29025 + }, + { + "epoch": 0.87, + "learning_rate": 2.0398230828065414e-07, + "loss": 1.1144, + "step": 29026 + }, + { + "epoch": 0.87, + "learning_rate": 2.038858154730533e-07, + "loss": 1.0552, + "step": 29027 + }, + { + "epoch": 0.87, + "learning_rate": 2.0378934452335408e-07, + "loss": 1.0698, + "step": 29028 + }, + { + "epoch": 0.87, + "learning_rate": 2.0369289543247407e-07, + "loss": 1.1553, + "step": 29029 + }, + { + "epoch": 0.87, + "learning_rate": 2.0359646820133195e-07, + "loss": 1.1574, + "step": 29030 + }, + { + "epoch": 0.87, + "learning_rate": 2.0350006283084506e-07, + "loss": 1.2496, + "step": 29031 + }, + { + "epoch": 0.87, + "learning_rate": 2.0340367932193238e-07, + "loss": 1.1447, + "step": 29032 + }, + { + "epoch": 0.87, + "learning_rate": 2.0330731767550988e-07, + "loss": 0.9952, + "step": 29033 + }, + { + "epoch": 0.87, + "learning_rate": 2.0321097789249567e-07, + "loss": 1.0603, + "step": 29034 + }, + { + "epoch": 0.87, + "learning_rate": 2.0311465997380682e-07, + "loss": 0.9936, + "step": 29035 + }, + { + "epoch": 0.87, + "learning_rate": 2.0301836392036005e-07, + "loss": 1.0611, + "step": 29036 + }, + { + "epoch": 0.87, + "learning_rate": 2.0292208973307276e-07, + "loss": 1.1105, + "step": 29037 + }, + { + "epoch": 0.87, + "learning_rate": 2.0282583741286028e-07, + "loss": 1.0945, + "step": 29038 + }, + { + "epoch": 0.87, + "learning_rate": 2.0272960696063964e-07, + "loss": 1.1693, + "step": 29039 + }, + { + "epoch": 0.87, + "learning_rate": 2.0263339837732681e-07, + "loss": 1.08, + "step": 29040 + }, + { + "epoch": 0.87, + "learning_rate": 2.0253721166383773e-07, + "loss": 1.0428, + "step": 29041 + }, + { + "epoch": 0.87, + "learning_rate": 2.0244104682108773e-07, + "loss": 1.1353, + "step": 29042 + }, + { + "epoch": 0.87, + "learning_rate": 2.0234490384999224e-07, + "loss": 1.1898, + "step": 29043 + }, + { + "epoch": 0.87, + "learning_rate": 2.0224878275146686e-07, + "loss": 1.2576, + "step": 29044 + }, + { + "epoch": 0.87, + "learning_rate": 2.021526835264262e-07, + "loss": 1.1013, + "step": 29045 + }, + { + "epoch": 0.88, + "learning_rate": 2.020566061757856e-07, + "loss": 1.0834, + "step": 29046 + }, + { + "epoch": 0.88, + "learning_rate": 2.019605507004596e-07, + "loss": 1.0977, + "step": 29047 + }, + { + "epoch": 0.88, + "learning_rate": 2.0186451710136195e-07, + "loss": 1.1815, + "step": 29048 + }, + { + "epoch": 0.88, + "learning_rate": 2.0176850537940746e-07, + "loss": 1.1674, + "step": 29049 + }, + { + "epoch": 0.88, + "learning_rate": 2.0167251553550955e-07, + "loss": 1.1168, + "step": 29050 + }, + { + "epoch": 0.88, + "learning_rate": 2.0157654757058276e-07, + "loss": 1.0117, + "step": 29051 + }, + { + "epoch": 0.88, + "learning_rate": 2.0148060148554e-07, + "loss": 1.017, + "step": 29052 + }, + { + "epoch": 0.88, + "learning_rate": 2.0138467728129524e-07, + "loss": 0.9897, + "step": 29053 + }, + { + "epoch": 0.88, + "learning_rate": 2.0128877495876136e-07, + "loss": 1.0224, + "step": 29054 + }, + { + "epoch": 0.88, + "learning_rate": 2.0119289451885126e-07, + "loss": 1.0688, + "step": 29055 + }, + { + "epoch": 0.88, + "learning_rate": 2.0109703596247725e-07, + "loss": 1.0739, + "step": 29056 + }, + { + "epoch": 0.88, + "learning_rate": 2.0100119929055252e-07, + "loss": 1.1413, + "step": 29057 + }, + { + "epoch": 0.88, + "learning_rate": 2.0090538450398934e-07, + "loss": 1.1075, + "step": 29058 + }, + { + "epoch": 0.88, + "learning_rate": 2.008095916036995e-07, + "loss": 1.1136, + "step": 29059 + }, + { + "epoch": 0.88, + "learning_rate": 2.007138205905948e-07, + "loss": 1.131, + "step": 29060 + }, + { + "epoch": 0.88, + "learning_rate": 2.0061807146558698e-07, + "loss": 1.1406, + "step": 29061 + }, + { + "epoch": 0.88, + "learning_rate": 2.005223442295884e-07, + "loss": 1.1707, + "step": 29062 + }, + { + "epoch": 0.88, + "learning_rate": 2.004266388835091e-07, + "loss": 1.0928, + "step": 29063 + }, + { + "epoch": 0.88, + "learning_rate": 2.003309554282609e-07, + "loss": 1.0601, + "step": 29064 + }, + { + "epoch": 0.88, + "learning_rate": 2.002352938647542e-07, + "loss": 1.0234, + "step": 29065 + }, + { + "epoch": 0.88, + "learning_rate": 2.001396541938999e-07, + "loss": 1.0565, + "step": 29066 + }, + { + "epoch": 0.88, + "learning_rate": 2.0004403641660896e-07, + "loss": 1.1624, + "step": 29067 + }, + { + "epoch": 0.88, + "learning_rate": 1.9994844053379065e-07, + "loss": 1.0967, + "step": 29068 + }, + { + "epoch": 0.88, + "learning_rate": 1.998528665463556e-07, + "loss": 1.0643, + "step": 29069 + }, + { + "epoch": 0.88, + "learning_rate": 1.9975731445521312e-07, + "loss": 1.1328, + "step": 29070 + }, + { + "epoch": 0.88, + "learning_rate": 1.9966178426127387e-07, + "loss": 1.0181, + "step": 29071 + }, + { + "epoch": 0.88, + "learning_rate": 1.9956627596544598e-07, + "loss": 1.1075, + "step": 29072 + }, + { + "epoch": 0.88, + "learning_rate": 1.994707895686393e-07, + "loss": 1.0984, + "step": 29073 + }, + { + "epoch": 0.88, + "learning_rate": 1.9937532507176284e-07, + "loss": 1.0526, + "step": 29074 + }, + { + "epoch": 0.88, + "learning_rate": 1.9927988247572527e-07, + "loss": 1.0231, + "step": 29075 + }, + { + "epoch": 0.88, + "learning_rate": 1.991844617814348e-07, + "loss": 1.1463, + "step": 29076 + }, + { + "epoch": 0.88, + "learning_rate": 1.990890629898004e-07, + "loss": 1.0002, + "step": 29077 + }, + { + "epoch": 0.88, + "learning_rate": 1.9899368610172997e-07, + "loss": 1.1053, + "step": 29078 + }, + { + "epoch": 0.88, + "learning_rate": 1.988983311181314e-07, + "loss": 1.0403, + "step": 29079 + }, + { + "epoch": 0.88, + "learning_rate": 1.9880299803991283e-07, + "loss": 0.9825, + "step": 29080 + }, + { + "epoch": 0.88, + "learning_rate": 1.987076868679813e-07, + "loss": 1.131, + "step": 29081 + }, + { + "epoch": 0.88, + "learning_rate": 1.986123976032439e-07, + "loss": 1.0668, + "step": 29082 + }, + { + "epoch": 0.88, + "learning_rate": 1.9851713024660824e-07, + "loss": 1.0779, + "step": 29083 + }, + { + "epoch": 0.88, + "learning_rate": 1.9842188479898133e-07, + "loss": 1.0292, + "step": 29084 + }, + { + "epoch": 0.88, + "learning_rate": 1.9832666126126942e-07, + "loss": 1.1362, + "step": 29085 + }, + { + "epoch": 0.88, + "learning_rate": 1.9823145963437902e-07, + "loss": 1.0747, + "step": 29086 + }, + { + "epoch": 0.88, + "learning_rate": 1.9813627991921657e-07, + "loss": 1.2219, + "step": 29087 + }, + { + "epoch": 0.88, + "learning_rate": 1.9804112211668862e-07, + "loss": 1.1804, + "step": 29088 + }, + { + "epoch": 0.88, + "learning_rate": 1.979459862277e-07, + "loss": 1.049, + "step": 29089 + }, + { + "epoch": 0.88, + "learning_rate": 1.9785087225315692e-07, + "loss": 1.0916, + "step": 29090 + }, + { + "epoch": 0.88, + "learning_rate": 1.9775578019396502e-07, + "loss": 1.1604, + "step": 29091 + }, + { + "epoch": 0.88, + "learning_rate": 1.9766071005102888e-07, + "loss": 1.1594, + "step": 29092 + }, + { + "epoch": 0.88, + "learning_rate": 1.9756566182525472e-07, + "loss": 1.1371, + "step": 29093 + }, + { + "epoch": 0.88, + "learning_rate": 1.9747063551754598e-07, + "loss": 1.1083, + "step": 29094 + }, + { + "epoch": 0.88, + "learning_rate": 1.9737563112880776e-07, + "loss": 1.0894, + "step": 29095 + }, + { + "epoch": 0.88, + "learning_rate": 1.9728064865994462e-07, + "loss": 1.0251, + "step": 29096 + }, + { + "epoch": 0.88, + "learning_rate": 1.971856881118611e-07, + "loss": 1.0536, + "step": 29097 + }, + { + "epoch": 0.88, + "learning_rate": 1.970907494854604e-07, + "loss": 1.1782, + "step": 29098 + }, + { + "epoch": 0.88, + "learning_rate": 1.9699583278164653e-07, + "loss": 1.1797, + "step": 29099 + }, + { + "epoch": 0.88, + "learning_rate": 1.9690093800132342e-07, + "loss": 1.0185, + "step": 29100 + }, + { + "epoch": 0.88, + "learning_rate": 1.9680606514539375e-07, + "loss": 1.0153, + "step": 29101 + }, + { + "epoch": 0.88, + "learning_rate": 1.9671121421476147e-07, + "loss": 1.095, + "step": 29102 + }, + { + "epoch": 0.88, + "learning_rate": 1.9661638521032893e-07, + "loss": 1.0565, + "step": 29103 + }, + { + "epoch": 0.88, + "learning_rate": 1.9652157813299904e-07, + "loss": 1.1879, + "step": 29104 + }, + { + "epoch": 0.88, + "learning_rate": 1.964267929836744e-07, + "loss": 1.139, + "step": 29105 + }, + { + "epoch": 0.88, + "learning_rate": 1.9633202976325788e-07, + "loss": 1.176, + "step": 29106 + }, + { + "epoch": 0.88, + "learning_rate": 1.9623728847265018e-07, + "loss": 1.0336, + "step": 29107 + }, + { + "epoch": 0.88, + "learning_rate": 1.9614256911275415e-07, + "loss": 1.1318, + "step": 29108 + }, + { + "epoch": 0.88, + "learning_rate": 1.960478716844713e-07, + "loss": 1.1471, + "step": 29109 + }, + { + "epoch": 0.88, + "learning_rate": 1.9595319618870346e-07, + "loss": 1.0749, + "step": 29110 + }, + { + "epoch": 0.88, + "learning_rate": 1.9585854262635097e-07, + "loss": 1.1522, + "step": 29111 + }, + { + "epoch": 0.88, + "learning_rate": 1.957639109983156e-07, + "loss": 1.1675, + "step": 29112 + }, + { + "epoch": 0.88, + "learning_rate": 1.9566930130549806e-07, + "loss": 1.0564, + "step": 29113 + }, + { + "epoch": 0.88, + "learning_rate": 1.9557471354879926e-07, + "loss": 1.1356, + "step": 29114 + }, + { + "epoch": 0.88, + "learning_rate": 1.9548014772911906e-07, + "loss": 1.0861, + "step": 29115 + }, + { + "epoch": 0.88, + "learning_rate": 1.9538560384735783e-07, + "loss": 1.0932, + "step": 29116 + }, + { + "epoch": 0.88, + "learning_rate": 1.952910819044157e-07, + "loss": 1.2293, + "step": 29117 + }, + { + "epoch": 0.88, + "learning_rate": 1.951965819011925e-07, + "loss": 1.256, + "step": 29118 + }, + { + "epoch": 0.88, + "learning_rate": 1.9510210383858835e-07, + "loss": 1.09, + "step": 29119 + }, + { + "epoch": 0.88, + "learning_rate": 1.950076477175017e-07, + "loss": 1.1137, + "step": 29120 + }, + { + "epoch": 0.88, + "learning_rate": 1.949132135388321e-07, + "loss": 1.1296, + "step": 29121 + }, + { + "epoch": 0.88, + "learning_rate": 1.9481880130347852e-07, + "loss": 1.1415, + "step": 29122 + }, + { + "epoch": 0.88, + "learning_rate": 1.9472441101234003e-07, + "loss": 1.0472, + "step": 29123 + }, + { + "epoch": 0.88, + "learning_rate": 1.9463004266631445e-07, + "loss": 1.0999, + "step": 29124 + }, + { + "epoch": 0.88, + "learning_rate": 1.945356962663006e-07, + "loss": 1.0709, + "step": 29125 + }, + { + "epoch": 0.88, + "learning_rate": 1.9444137181319682e-07, + "loss": 1.0965, + "step": 29126 + }, + { + "epoch": 0.88, + "learning_rate": 1.9434706930790052e-07, + "loss": 1.1008, + "step": 29127 + }, + { + "epoch": 0.88, + "learning_rate": 1.9425278875130987e-07, + "loss": 1.1121, + "step": 29128 + }, + { + "epoch": 0.88, + "learning_rate": 1.9415853014432245e-07, + "loss": 1.1552, + "step": 29129 + }, + { + "epoch": 0.88, + "learning_rate": 1.940642934878348e-07, + "loss": 1.0883, + "step": 29130 + }, + { + "epoch": 0.88, + "learning_rate": 1.9397007878274476e-07, + "loss": 1.2009, + "step": 29131 + }, + { + "epoch": 0.88, + "learning_rate": 1.9387588602994862e-07, + "loss": 1.0556, + "step": 29132 + }, + { + "epoch": 0.88, + "learning_rate": 1.9378171523034368e-07, + "loss": 1.082, + "step": 29133 + }, + { + "epoch": 0.88, + "learning_rate": 1.9368756638482588e-07, + "loss": 1.0521, + "step": 29134 + }, + { + "epoch": 0.88, + "learning_rate": 1.9359343949429178e-07, + "loss": 1.1338, + "step": 29135 + }, + { + "epoch": 0.88, + "learning_rate": 1.9349933455963782e-07, + "loss": 1.0759, + "step": 29136 + }, + { + "epoch": 0.88, + "learning_rate": 1.934052515817589e-07, + "loss": 1.1196, + "step": 29137 + }, + { + "epoch": 0.88, + "learning_rate": 1.933111905615509e-07, + "loss": 1.0683, + "step": 29138 + }, + { + "epoch": 0.88, + "learning_rate": 1.9321715149990955e-07, + "loss": 1.0902, + "step": 29139 + }, + { + "epoch": 0.88, + "learning_rate": 1.931231343977305e-07, + "loss": 1.0757, + "step": 29140 + }, + { + "epoch": 0.88, + "learning_rate": 1.930291392559075e-07, + "loss": 1.1026, + "step": 29141 + }, + { + "epoch": 0.88, + "learning_rate": 1.929351660753362e-07, + "loss": 1.1631, + "step": 29142 + }, + { + "epoch": 0.88, + "learning_rate": 1.9284121485691116e-07, + "loss": 0.9124, + "step": 29143 + }, + { + "epoch": 0.88, + "learning_rate": 1.927472856015264e-07, + "loss": 1.0937, + "step": 29144 + }, + { + "epoch": 0.88, + "learning_rate": 1.9265337831007647e-07, + "loss": 1.0977, + "step": 29145 + }, + { + "epoch": 0.88, + "learning_rate": 1.925594929834551e-07, + "loss": 1.1079, + "step": 29146 + }, + { + "epoch": 0.88, + "learning_rate": 1.9246562962255577e-07, + "loss": 1.1129, + "step": 29147 + }, + { + "epoch": 0.88, + "learning_rate": 1.9237178822827246e-07, + "loss": 1.0672, + "step": 29148 + }, + { + "epoch": 0.88, + "learning_rate": 1.9227796880149864e-07, + "loss": 1.1874, + "step": 29149 + }, + { + "epoch": 0.88, + "learning_rate": 1.9218417134312662e-07, + "loss": 1.0886, + "step": 29150 + }, + { + "epoch": 0.88, + "learning_rate": 1.9209039585405014e-07, + "loss": 1.125, + "step": 29151 + }, + { + "epoch": 0.88, + "learning_rate": 1.919966423351613e-07, + "loss": 1.2153, + "step": 29152 + }, + { + "epoch": 0.88, + "learning_rate": 1.9190291078735324e-07, + "loss": 1.0264, + "step": 29153 + }, + { + "epoch": 0.88, + "learning_rate": 1.9180920121151748e-07, + "loss": 1.0644, + "step": 29154 + }, + { + "epoch": 0.88, + "learning_rate": 1.9171551360854661e-07, + "loss": 1.0435, + "step": 29155 + }, + { + "epoch": 0.88, + "learning_rate": 1.916218479793322e-07, + "loss": 1.2036, + "step": 29156 + }, + { + "epoch": 0.88, + "learning_rate": 1.9152820432476598e-07, + "loss": 1.0956, + "step": 29157 + }, + { + "epoch": 0.88, + "learning_rate": 1.9143458264573976e-07, + "loss": 0.9852, + "step": 29158 + }, + { + "epoch": 0.88, + "learning_rate": 1.9134098294314425e-07, + "loss": 1.1033, + "step": 29159 + }, + { + "epoch": 0.88, + "learning_rate": 1.9124740521787062e-07, + "loss": 1.1104, + "step": 29160 + }, + { + "epoch": 0.88, + "learning_rate": 1.9115384947080984e-07, + "loss": 1.0808, + "step": 29161 + }, + { + "epoch": 0.88, + "learning_rate": 1.9106031570285287e-07, + "loss": 1.1428, + "step": 29162 + }, + { + "epoch": 0.88, + "learning_rate": 1.909668039148893e-07, + "loss": 1.0554, + "step": 29163 + }, + { + "epoch": 0.88, + "learning_rate": 1.9087331410780953e-07, + "loss": 1.19, + "step": 29164 + }, + { + "epoch": 0.88, + "learning_rate": 1.907798462825039e-07, + "loss": 1.1964, + "step": 29165 + }, + { + "epoch": 0.88, + "learning_rate": 1.9068640043986232e-07, + "loss": 1.0338, + "step": 29166 + }, + { + "epoch": 0.88, + "learning_rate": 1.9059297658077347e-07, + "loss": 1.1602, + "step": 29167 + }, + { + "epoch": 0.88, + "learning_rate": 1.9049957470612752e-07, + "loss": 1.0253, + "step": 29168 + }, + { + "epoch": 0.88, + "learning_rate": 1.9040619481681317e-07, + "loss": 1.1232, + "step": 29169 + }, + { + "epoch": 0.88, + "learning_rate": 1.9031283691371943e-07, + "loss": 1.1541, + "step": 29170 + }, + { + "epoch": 0.88, + "learning_rate": 1.9021950099773533e-07, + "loss": 1.162, + "step": 29171 + }, + { + "epoch": 0.88, + "learning_rate": 1.9012618706974907e-07, + "loss": 1.1005, + "step": 29172 + }, + { + "epoch": 0.88, + "learning_rate": 1.9003289513064904e-07, + "loss": 1.1362, + "step": 29173 + }, + { + "epoch": 0.88, + "learning_rate": 1.8993962518132319e-07, + "loss": 1.1749, + "step": 29174 + }, + { + "epoch": 0.88, + "learning_rate": 1.8984637722265998e-07, + "loss": 0.9532, + "step": 29175 + }, + { + "epoch": 0.88, + "learning_rate": 1.8975315125554617e-07, + "loss": 1.0528, + "step": 29176 + }, + { + "epoch": 0.88, + "learning_rate": 1.8965994728086968e-07, + "loss": 0.9964, + "step": 29177 + }, + { + "epoch": 0.88, + "learning_rate": 1.8956676529951812e-07, + "loss": 1.1213, + "step": 29178 + }, + { + "epoch": 0.88, + "learning_rate": 1.894736053123783e-07, + "loss": 1.1371, + "step": 29179 + }, + { + "epoch": 0.88, + "learning_rate": 1.893804673203367e-07, + "loss": 1.0213, + "step": 29180 + }, + { + "epoch": 0.88, + "learning_rate": 1.8928735132428015e-07, + "loss": 1.1072, + "step": 29181 + }, + { + "epoch": 0.88, + "learning_rate": 1.8919425732509516e-07, + "loss": 1.0136, + "step": 29182 + }, + { + "epoch": 0.88, + "learning_rate": 1.8910118532366794e-07, + "loss": 1.1141, + "step": 29183 + }, + { + "epoch": 0.88, + "learning_rate": 1.8900813532088446e-07, + "loss": 1.0628, + "step": 29184 + }, + { + "epoch": 0.88, + "learning_rate": 1.889151073176304e-07, + "loss": 0.9647, + "step": 29185 + }, + { + "epoch": 0.88, + "learning_rate": 1.8882210131479145e-07, + "loss": 1.1086, + "step": 29186 + }, + { + "epoch": 0.88, + "learning_rate": 1.8872911731325327e-07, + "loss": 1.0758, + "step": 29187 + }, + { + "epoch": 0.88, + "learning_rate": 1.8863615531390102e-07, + "loss": 1.0628, + "step": 29188 + }, + { + "epoch": 0.88, + "learning_rate": 1.8854321531761894e-07, + "loss": 1.118, + "step": 29189 + }, + { + "epoch": 0.88, + "learning_rate": 1.884502973252922e-07, + "loss": 1.0187, + "step": 29190 + }, + { + "epoch": 0.88, + "learning_rate": 1.8835740133780534e-07, + "loss": 1.156, + "step": 29191 + }, + { + "epoch": 0.88, + "learning_rate": 1.8826452735604324e-07, + "loss": 1.1104, + "step": 29192 + }, + { + "epoch": 0.88, + "learning_rate": 1.8817167538088876e-07, + "loss": 0.9783, + "step": 29193 + }, + { + "epoch": 0.88, + "learning_rate": 1.880788454132268e-07, + "loss": 1.0912, + "step": 29194 + }, + { + "epoch": 0.88, + "learning_rate": 1.879860374539408e-07, + "loss": 1.1125, + "step": 29195 + }, + { + "epoch": 0.88, + "learning_rate": 1.8789325150391391e-07, + "loss": 1.0596, + "step": 29196 + }, + { + "epoch": 0.88, + "learning_rate": 1.8780048756403047e-07, + "loss": 1.061, + "step": 29197 + }, + { + "epoch": 0.88, + "learning_rate": 1.8770774563517225e-07, + "loss": 1.0573, + "step": 29198 + }, + { + "epoch": 0.88, + "learning_rate": 1.876150257182227e-07, + "loss": 1.2014, + "step": 29199 + }, + { + "epoch": 0.88, + "learning_rate": 1.875223278140642e-07, + "loss": 1.1463, + "step": 29200 + }, + { + "epoch": 0.88, + "learning_rate": 1.8742965192357993e-07, + "loss": 1.0386, + "step": 29201 + }, + { + "epoch": 0.88, + "learning_rate": 1.8733699804765137e-07, + "loss": 1.1378, + "step": 29202 + }, + { + "epoch": 0.88, + "learning_rate": 1.8724436618716062e-07, + "loss": 1.1501, + "step": 29203 + }, + { + "epoch": 0.88, + "learning_rate": 1.8715175634298976e-07, + "loss": 1.0965, + "step": 29204 + }, + { + "epoch": 0.88, + "learning_rate": 1.8705916851602058e-07, + "loss": 1.0984, + "step": 29205 + }, + { + "epoch": 0.88, + "learning_rate": 1.8696660270713372e-07, + "loss": 1.147, + "step": 29206 + }, + { + "epoch": 0.88, + "learning_rate": 1.8687405891721077e-07, + "loss": 0.9958, + "step": 29207 + }, + { + "epoch": 0.88, + "learning_rate": 1.8678153714713293e-07, + "loss": 1.0501, + "step": 29208 + }, + { + "epoch": 0.88, + "learning_rate": 1.866890373977806e-07, + "loss": 1.1827, + "step": 29209 + }, + { + "epoch": 0.88, + "learning_rate": 1.8659655967003448e-07, + "loss": 1.0882, + "step": 29210 + }, + { + "epoch": 0.88, + "learning_rate": 1.8650410396477526e-07, + "loss": 1.0388, + "step": 29211 + }, + { + "epoch": 0.88, + "learning_rate": 1.8641167028288276e-07, + "loss": 1.1749, + "step": 29212 + }, + { + "epoch": 0.88, + "learning_rate": 1.8631925862523687e-07, + "loss": 1.1309, + "step": 29213 + }, + { + "epoch": 0.88, + "learning_rate": 1.8622686899271686e-07, + "loss": 1.0055, + "step": 29214 + }, + { + "epoch": 0.88, + "learning_rate": 1.8613450138620315e-07, + "loss": 1.0369, + "step": 29215 + }, + { + "epoch": 0.88, + "learning_rate": 1.8604215580657447e-07, + "loss": 1.078, + "step": 29216 + }, + { + "epoch": 0.88, + "learning_rate": 1.8594983225470987e-07, + "loss": 1.2625, + "step": 29217 + }, + { + "epoch": 0.88, + "learning_rate": 1.8585753073148888e-07, + "loss": 1.1276, + "step": 29218 + }, + { + "epoch": 0.88, + "learning_rate": 1.8576525123778915e-07, + "loss": 1.2079, + "step": 29219 + }, + { + "epoch": 0.88, + "learning_rate": 1.8567299377449e-07, + "loss": 1.1222, + "step": 29220 + }, + { + "epoch": 0.88, + "learning_rate": 1.8558075834246902e-07, + "loss": 0.9719, + "step": 29221 + }, + { + "epoch": 0.88, + "learning_rate": 1.8548854494260472e-07, + "loss": 1.0911, + "step": 29222 + }, + { + "epoch": 0.88, + "learning_rate": 1.8539635357577495e-07, + "loss": 1.0283, + "step": 29223 + }, + { + "epoch": 0.88, + "learning_rate": 1.8530418424285685e-07, + "loss": 1.1476, + "step": 29224 + }, + { + "epoch": 0.88, + "learning_rate": 1.8521203694472827e-07, + "loss": 1.0145, + "step": 29225 + }, + { + "epoch": 0.88, + "learning_rate": 1.8511991168226606e-07, + "loss": 1.0034, + "step": 29226 + }, + { + "epoch": 0.88, + "learning_rate": 1.8502780845634781e-07, + "loss": 1.0499, + "step": 29227 + }, + { + "epoch": 0.88, + "learning_rate": 1.8493572726784952e-07, + "loss": 0.9625, + "step": 29228 + }, + { + "epoch": 0.88, + "learning_rate": 1.8484366811764827e-07, + "loss": 1.1083, + "step": 29229 + }, + { + "epoch": 0.88, + "learning_rate": 1.8475163100662025e-07, + "loss": 1.1714, + "step": 29230 + }, + { + "epoch": 0.88, + "learning_rate": 1.84659615935642e-07, + "loss": 0.9875, + "step": 29231 + }, + { + "epoch": 0.88, + "learning_rate": 1.8456762290558873e-07, + "loss": 1.1499, + "step": 29232 + }, + { + "epoch": 0.88, + "learning_rate": 1.844756519173363e-07, + "loss": 1.1419, + "step": 29233 + }, + { + "epoch": 0.88, + "learning_rate": 1.8438370297176072e-07, + "loss": 1.1286, + "step": 29234 + }, + { + "epoch": 0.88, + "learning_rate": 1.8429177606973715e-07, + "loss": 1.0507, + "step": 29235 + }, + { + "epoch": 0.88, + "learning_rate": 1.8419987121214068e-07, + "loss": 1.0901, + "step": 29236 + }, + { + "epoch": 0.88, + "learning_rate": 1.841079883998459e-07, + "loss": 1.1788, + "step": 29237 + }, + { + "epoch": 0.88, + "learning_rate": 1.8401612763372767e-07, + "loss": 1.04, + "step": 29238 + }, + { + "epoch": 0.88, + "learning_rate": 1.8392428891466057e-07, + "loss": 1.0823, + "step": 29239 + }, + { + "epoch": 0.88, + "learning_rate": 1.8383247224351863e-07, + "loss": 1.0862, + "step": 29240 + }, + { + "epoch": 0.88, + "learning_rate": 1.8374067762117614e-07, + "loss": 1.0628, + "step": 29241 + }, + { + "epoch": 0.88, + "learning_rate": 1.8364890504850656e-07, + "loss": 1.1187, + "step": 29242 + }, + { + "epoch": 0.88, + "learning_rate": 1.8355715452638424e-07, + "loss": 1.1816, + "step": 29243 + }, + { + "epoch": 0.88, + "learning_rate": 1.834654260556823e-07, + "loss": 1.1747, + "step": 29244 + }, + { + "epoch": 0.88, + "learning_rate": 1.8337371963727368e-07, + "loss": 1.1582, + "step": 29245 + }, + { + "epoch": 0.88, + "learning_rate": 1.832820352720313e-07, + "loss": 0.9574, + "step": 29246 + }, + { + "epoch": 0.88, + "learning_rate": 1.8319037296082808e-07, + "loss": 1.0654, + "step": 29247 + }, + { + "epoch": 0.88, + "learning_rate": 1.830987327045375e-07, + "loss": 1.0712, + "step": 29248 + }, + { + "epoch": 0.88, + "learning_rate": 1.8300711450403046e-07, + "loss": 1.1929, + "step": 29249 + }, + { + "epoch": 0.88, + "learning_rate": 1.8291551836017968e-07, + "loss": 1.0391, + "step": 29250 + }, + { + "epoch": 0.88, + "learning_rate": 1.8282394427385746e-07, + "loss": 1.1157, + "step": 29251 + }, + { + "epoch": 0.88, + "learning_rate": 1.8273239224593508e-07, + "loss": 1.0821, + "step": 29252 + }, + { + "epoch": 0.88, + "learning_rate": 1.826408622772849e-07, + "loss": 1.0641, + "step": 29253 + }, + { + "epoch": 0.88, + "learning_rate": 1.82549354368777e-07, + "loss": 1.1335, + "step": 29254 + }, + { + "epoch": 0.88, + "learning_rate": 1.8245786852128327e-07, + "loss": 1.0739, + "step": 29255 + }, + { + "epoch": 0.88, + "learning_rate": 1.8236640473567463e-07, + "loss": 1.0225, + "step": 29256 + }, + { + "epoch": 0.88, + "learning_rate": 1.8227496301282178e-07, + "loss": 1.0552, + "step": 29257 + }, + { + "epoch": 0.88, + "learning_rate": 1.8218354335359456e-07, + "loss": 1.1395, + "step": 29258 + }, + { + "epoch": 0.88, + "learning_rate": 1.8209214575886397e-07, + "loss": 1.1479, + "step": 29259 + }, + { + "epoch": 0.88, + "learning_rate": 1.8200077022949958e-07, + "loss": 1.0536, + "step": 29260 + }, + { + "epoch": 0.88, + "learning_rate": 1.8190941676637182e-07, + "loss": 1.298, + "step": 29261 + }, + { + "epoch": 0.88, + "learning_rate": 1.8181808537034995e-07, + "loss": 1.1059, + "step": 29262 + }, + { + "epoch": 0.88, + "learning_rate": 1.8172677604230305e-07, + "loss": 1.0507, + "step": 29263 + }, + { + "epoch": 0.88, + "learning_rate": 1.8163548878310093e-07, + "loss": 1.094, + "step": 29264 + }, + { + "epoch": 0.88, + "learning_rate": 1.815442235936124e-07, + "loss": 1.0233, + "step": 29265 + }, + { + "epoch": 0.88, + "learning_rate": 1.8145298047470615e-07, + "loss": 1.032, + "step": 29266 + }, + { + "epoch": 0.88, + "learning_rate": 1.813617594272507e-07, + "loss": 1.0819, + "step": 29267 + }, + { + "epoch": 0.88, + "learning_rate": 1.8127056045211506e-07, + "loss": 1.2079, + "step": 29268 + }, + { + "epoch": 0.88, + "learning_rate": 1.8117938355016656e-07, + "loss": 1.0334, + "step": 29269 + }, + { + "epoch": 0.88, + "learning_rate": 1.8108822872227428e-07, + "loss": 1.1647, + "step": 29270 + }, + { + "epoch": 0.88, + "learning_rate": 1.8099709596930442e-07, + "loss": 0.9678, + "step": 29271 + }, + { + "epoch": 0.88, + "learning_rate": 1.8090598529212577e-07, + "loss": 1.1083, + "step": 29272 + }, + { + "epoch": 0.88, + "learning_rate": 1.8081489669160485e-07, + "loss": 1.0311, + "step": 29273 + }, + { + "epoch": 0.88, + "learning_rate": 1.8072383016860984e-07, + "loss": 1.2333, + "step": 29274 + }, + { + "epoch": 0.88, + "learning_rate": 1.8063278572400646e-07, + "loss": 1.0007, + "step": 29275 + }, + { + "epoch": 0.88, + "learning_rate": 1.8054176335866175e-07, + "loss": 1.088, + "step": 29276 + }, + { + "epoch": 0.88, + "learning_rate": 1.8045076307344257e-07, + "loss": 1.1121, + "step": 29277 + }, + { + "epoch": 0.88, + "learning_rate": 1.8035978486921485e-07, + "loss": 1.0555, + "step": 29278 + }, + { + "epoch": 0.88, + "learning_rate": 1.8026882874684544e-07, + "loss": 1.1825, + "step": 29279 + }, + { + "epoch": 0.88, + "learning_rate": 1.8017789470719887e-07, + "loss": 1.0516, + "step": 29280 + }, + { + "epoch": 0.88, + "learning_rate": 1.8008698275114173e-07, + "loss": 1.0597, + "step": 29281 + }, + { + "epoch": 0.88, + "learning_rate": 1.7999609287953912e-07, + "loss": 1.0912, + "step": 29282 + }, + { + "epoch": 0.88, + "learning_rate": 1.7990522509325676e-07, + "loss": 1.2317, + "step": 29283 + }, + { + "epoch": 0.88, + "learning_rate": 1.7981437939315894e-07, + "loss": 1.1459, + "step": 29284 + }, + { + "epoch": 0.88, + "learning_rate": 1.7972355578011052e-07, + "loss": 1.1889, + "step": 29285 + }, + { + "epoch": 0.88, + "learning_rate": 1.7963275425497668e-07, + "loss": 1.1969, + "step": 29286 + }, + { + "epoch": 0.88, + "learning_rate": 1.7954197481862168e-07, + "loss": 1.1968, + "step": 29287 + }, + { + "epoch": 0.88, + "learning_rate": 1.7945121747190903e-07, + "loss": 1.0251, + "step": 29288 + }, + { + "epoch": 0.88, + "learning_rate": 1.7936048221570328e-07, + "loss": 1.0608, + "step": 29289 + }, + { + "epoch": 0.88, + "learning_rate": 1.7926976905086825e-07, + "loss": 1.0339, + "step": 29290 + }, + { + "epoch": 0.88, + "learning_rate": 1.7917907797826705e-07, + "loss": 1.1509, + "step": 29291 + }, + { + "epoch": 0.88, + "learning_rate": 1.7908840899876351e-07, + "loss": 1.1956, + "step": 29292 + }, + { + "epoch": 0.88, + "learning_rate": 1.7899776211322052e-07, + "loss": 1.1492, + "step": 29293 + }, + { + "epoch": 0.88, + "learning_rate": 1.7890713732250125e-07, + "loss": 1.0493, + "step": 29294 + }, + { + "epoch": 0.88, + "learning_rate": 1.7881653462746783e-07, + "loss": 1.1013, + "step": 29295 + }, + { + "epoch": 0.88, + "learning_rate": 1.787259540289829e-07, + "loss": 1.1068, + "step": 29296 + }, + { + "epoch": 0.88, + "learning_rate": 1.786353955279091e-07, + "loss": 1.0013, + "step": 29297 + }, + { + "epoch": 0.88, + "learning_rate": 1.785448591251085e-07, + "loss": 1.1129, + "step": 29298 + }, + { + "epoch": 0.88, + "learning_rate": 1.7845434482144265e-07, + "loss": 1.1611, + "step": 29299 + }, + { + "epoch": 0.88, + "learning_rate": 1.7836385261777362e-07, + "loss": 1.1481, + "step": 29300 + }, + { + "epoch": 0.88, + "learning_rate": 1.7827338251496213e-07, + "loss": 1.0812, + "step": 29301 + }, + { + "epoch": 0.88, + "learning_rate": 1.7818293451386998e-07, + "loss": 1.1683, + "step": 29302 + }, + { + "epoch": 0.88, + "learning_rate": 1.7809250861535815e-07, + "loss": 1.0707, + "step": 29303 + }, + { + "epoch": 0.88, + "learning_rate": 1.7800210482028734e-07, + "loss": 1.0757, + "step": 29304 + }, + { + "epoch": 0.88, + "learning_rate": 1.7791172312951855e-07, + "loss": 1.2014, + "step": 29305 + }, + { + "epoch": 0.88, + "learning_rate": 1.7782136354391134e-07, + "loss": 1.2924, + "step": 29306 + }, + { + "epoch": 0.88, + "learning_rate": 1.7773102606432642e-07, + "loss": 1.084, + "step": 29307 + }, + { + "epoch": 0.88, + "learning_rate": 1.7764071069162363e-07, + "loss": 1.1146, + "step": 29308 + }, + { + "epoch": 0.88, + "learning_rate": 1.7755041742666318e-07, + "loss": 1.0751, + "step": 29309 + }, + { + "epoch": 0.88, + "learning_rate": 1.7746014627030378e-07, + "loss": 1.1619, + "step": 29310 + }, + { + "epoch": 0.88, + "learning_rate": 1.7736989722340531e-07, + "loss": 1.1334, + "step": 29311 + }, + { + "epoch": 0.88, + "learning_rate": 1.772796702868268e-07, + "loss": 1.1354, + "step": 29312 + }, + { + "epoch": 0.88, + "learning_rate": 1.7718946546142756e-07, + "loss": 1.1253, + "step": 29313 + }, + { + "epoch": 0.88, + "learning_rate": 1.7709928274806555e-07, + "loss": 1.0071, + "step": 29314 + }, + { + "epoch": 0.88, + "learning_rate": 1.7700912214759947e-07, + "loss": 1.0167, + "step": 29315 + }, + { + "epoch": 0.88, + "learning_rate": 1.7691898366088784e-07, + "loss": 1.1245, + "step": 29316 + }, + { + "epoch": 0.88, + "learning_rate": 1.7682886728878884e-07, + "loss": 1.1047, + "step": 29317 + }, + { + "epoch": 0.88, + "learning_rate": 1.7673877303216015e-07, + "loss": 1.1254, + "step": 29318 + }, + { + "epoch": 0.88, + "learning_rate": 1.7664870089185937e-07, + "loss": 1.0918, + "step": 29319 + }, + { + "epoch": 0.88, + "learning_rate": 1.765586508687439e-07, + "loss": 1.0416, + "step": 29320 + }, + { + "epoch": 0.88, + "learning_rate": 1.7646862296367084e-07, + "loss": 1.02, + "step": 29321 + }, + { + "epoch": 0.88, + "learning_rate": 1.7637861717749783e-07, + "loss": 1.1056, + "step": 29322 + }, + { + "epoch": 0.88, + "learning_rate": 1.7628863351108112e-07, + "loss": 1.051, + "step": 29323 + }, + { + "epoch": 0.88, + "learning_rate": 1.7619867196527724e-07, + "loss": 1.0588, + "step": 29324 + }, + { + "epoch": 0.88, + "learning_rate": 1.7610873254094302e-07, + "loss": 1.1569, + "step": 29325 + }, + { + "epoch": 0.88, + "learning_rate": 1.76018815238935e-07, + "loss": 1.0734, + "step": 29326 + }, + { + "epoch": 0.88, + "learning_rate": 1.7592892006010804e-07, + "loss": 1.0038, + "step": 29327 + }, + { + "epoch": 0.88, + "learning_rate": 1.758390470053184e-07, + "loss": 1.1293, + "step": 29328 + }, + { + "epoch": 0.88, + "learning_rate": 1.757491960754218e-07, + "loss": 1.1376, + "step": 29329 + }, + { + "epoch": 0.88, + "learning_rate": 1.7565936727127337e-07, + "loss": 1.1168, + "step": 29330 + }, + { + "epoch": 0.88, + "learning_rate": 1.7556956059372882e-07, + "loss": 1.1893, + "step": 29331 + }, + { + "epoch": 0.88, + "learning_rate": 1.754797760436419e-07, + "loss": 1.1606, + "step": 29332 + }, + { + "epoch": 0.88, + "learning_rate": 1.7539001362186835e-07, + "loss": 1.0546, + "step": 29333 + }, + { + "epoch": 0.88, + "learning_rate": 1.7530027332926193e-07, + "loss": 0.9855, + "step": 29334 + }, + { + "epoch": 0.88, + "learning_rate": 1.75210555166678e-07, + "loss": 1.0961, + "step": 29335 + }, + { + "epoch": 0.88, + "learning_rate": 1.751208591349693e-07, + "loss": 1.075, + "step": 29336 + }, + { + "epoch": 0.88, + "learning_rate": 1.7503118523499064e-07, + "loss": 1.2757, + "step": 29337 + }, + { + "epoch": 0.88, + "learning_rate": 1.7494153346759496e-07, + "loss": 1.1427, + "step": 29338 + }, + { + "epoch": 0.88, + "learning_rate": 1.7485190383363686e-07, + "loss": 1.0558, + "step": 29339 + }, + { + "epoch": 0.88, + "learning_rate": 1.7476229633396818e-07, + "loss": 0.97, + "step": 29340 + }, + { + "epoch": 0.88, + "learning_rate": 1.7467271096944265e-07, + "loss": 1.0613, + "step": 29341 + }, + { + "epoch": 0.88, + "learning_rate": 1.7458314774091295e-07, + "loss": 1.0638, + "step": 29342 + }, + { + "epoch": 0.88, + "learning_rate": 1.744936066492317e-07, + "loss": 1.2128, + "step": 29343 + }, + { + "epoch": 0.88, + "learning_rate": 1.7440408769525185e-07, + "loss": 1.1262, + "step": 29344 + }, + { + "epoch": 0.88, + "learning_rate": 1.7431459087982438e-07, + "loss": 1.092, + "step": 29345 + }, + { + "epoch": 0.88, + "learning_rate": 1.7422511620380223e-07, + "loss": 1.11, + "step": 29346 + }, + { + "epoch": 0.88, + "learning_rate": 1.7413566366803663e-07, + "loss": 1.0403, + "step": 29347 + }, + { + "epoch": 0.88, + "learning_rate": 1.7404623327337943e-07, + "loss": 1.1043, + "step": 29348 + }, + { + "epoch": 0.88, + "learning_rate": 1.739568250206816e-07, + "loss": 1.2338, + "step": 29349 + }, + { + "epoch": 0.88, + "learning_rate": 1.73867438910795e-07, + "loss": 1.1278, + "step": 29350 + }, + { + "epoch": 0.88, + "learning_rate": 1.7377807494456973e-07, + "loss": 1.0435, + "step": 29351 + }, + { + "epoch": 0.88, + "learning_rate": 1.7368873312285734e-07, + "loss": 1.1542, + "step": 29352 + }, + { + "epoch": 0.88, + "learning_rate": 1.7359941344650744e-07, + "loss": 1.0013, + "step": 29353 + }, + { + "epoch": 0.88, + "learning_rate": 1.7351011591637074e-07, + "loss": 1.188, + "step": 29354 + }, + { + "epoch": 0.88, + "learning_rate": 1.734208405332971e-07, + "loss": 1.1456, + "step": 29355 + }, + { + "epoch": 0.88, + "learning_rate": 1.7333158729813672e-07, + "loss": 1.216, + "step": 29356 + }, + { + "epoch": 0.88, + "learning_rate": 1.732423562117394e-07, + "loss": 1.0961, + "step": 29357 + }, + { + "epoch": 0.88, + "learning_rate": 1.7315314727495398e-07, + "loss": 1.0477, + "step": 29358 + }, + { + "epoch": 0.88, + "learning_rate": 1.7306396048862973e-07, + "loss": 0.9603, + "step": 29359 + }, + { + "epoch": 0.88, + "learning_rate": 1.7297479585361598e-07, + "loss": 0.9695, + "step": 29360 + }, + { + "epoch": 0.88, + "learning_rate": 1.728856533707618e-07, + "loss": 1.0233, + "step": 29361 + }, + { + "epoch": 0.88, + "learning_rate": 1.727965330409151e-07, + "loss": 1.1018, + "step": 29362 + }, + { + "epoch": 0.88, + "learning_rate": 1.7270743486492437e-07, + "loss": 1.1287, + "step": 29363 + }, + { + "epoch": 0.88, + "learning_rate": 1.7261835884363838e-07, + "loss": 0.9783, + "step": 29364 + }, + { + "epoch": 0.88, + "learning_rate": 1.7252930497790477e-07, + "loss": 1.0324, + "step": 29365 + }, + { + "epoch": 0.88, + "learning_rate": 1.7244027326857095e-07, + "loss": 1.0949, + "step": 29366 + }, + { + "epoch": 0.88, + "learning_rate": 1.723512637164848e-07, + "loss": 1.0818, + "step": 29367 + }, + { + "epoch": 0.88, + "learning_rate": 1.7226227632249348e-07, + "loss": 1.1337, + "step": 29368 + }, + { + "epoch": 0.88, + "learning_rate": 1.7217331108744435e-07, + "loss": 1.0654, + "step": 29369 + }, + { + "epoch": 0.88, + "learning_rate": 1.7208436801218447e-07, + "loss": 1.0483, + "step": 29370 + }, + { + "epoch": 0.88, + "learning_rate": 1.7199544709755988e-07, + "loss": 0.9969, + "step": 29371 + }, + { + "epoch": 0.88, + "learning_rate": 1.719065483444174e-07, + "loss": 1.0715, + "step": 29372 + }, + { + "epoch": 0.88, + "learning_rate": 1.7181767175360326e-07, + "loss": 1.0634, + "step": 29373 + }, + { + "epoch": 0.88, + "learning_rate": 1.7172881732596376e-07, + "loss": 1.1489, + "step": 29374 + }, + { + "epoch": 0.88, + "learning_rate": 1.7163998506234432e-07, + "loss": 1.1253, + "step": 29375 + }, + { + "epoch": 0.88, + "learning_rate": 1.7155117496359148e-07, + "loss": 1.0438, + "step": 29376 + }, + { + "epoch": 0.88, + "learning_rate": 1.7146238703054957e-07, + "loss": 1.0264, + "step": 29377 + }, + { + "epoch": 0.89, + "learning_rate": 1.713736212640643e-07, + "loss": 1.0981, + "step": 29378 + }, + { + "epoch": 0.89, + "learning_rate": 1.712848776649806e-07, + "loss": 1.0681, + "step": 29379 + }, + { + "epoch": 0.89, + "learning_rate": 1.7119615623414326e-07, + "loss": 1.1254, + "step": 29380 + }, + { + "epoch": 0.89, + "learning_rate": 1.7110745697239722e-07, + "loss": 1.0996, + "step": 29381 + }, + { + "epoch": 0.89, + "learning_rate": 1.7101877988058625e-07, + "loss": 1.1099, + "step": 29382 + }, + { + "epoch": 0.89, + "learning_rate": 1.709301249595552e-07, + "loss": 1.0795, + "step": 29383 + }, + { + "epoch": 0.89, + "learning_rate": 1.7084149221014758e-07, + "loss": 1.002, + "step": 29384 + }, + { + "epoch": 0.89, + "learning_rate": 1.7075288163320685e-07, + "loss": 1.0173, + "step": 29385 + }, + { + "epoch": 0.89, + "learning_rate": 1.706642932295771e-07, + "loss": 1.1194, + "step": 29386 + }, + { + "epoch": 0.89, + "learning_rate": 1.7057572700010156e-07, + "loss": 1.046, + "step": 29387 + }, + { + "epoch": 0.89, + "learning_rate": 1.7048718294562312e-07, + "loss": 1.0325, + "step": 29388 + }, + { + "epoch": 0.89, + "learning_rate": 1.7039866106698443e-07, + "loss": 1.1699, + "step": 29389 + }, + { + "epoch": 0.89, + "learning_rate": 1.7031016136502877e-07, + "loss": 1.0775, + "step": 29390 + }, + { + "epoch": 0.89, + "learning_rate": 1.7022168384059871e-07, + "loss": 1.1857, + "step": 29391 + }, + { + "epoch": 0.89, + "learning_rate": 1.7013322849453588e-07, + "loss": 1.1307, + "step": 29392 + }, + { + "epoch": 0.89, + "learning_rate": 1.7004479532768235e-07, + "loss": 1.1212, + "step": 29393 + }, + { + "epoch": 0.89, + "learning_rate": 1.6995638434088053e-07, + "loss": 1.0843, + "step": 29394 + }, + { + "epoch": 0.89, + "learning_rate": 1.6986799553497135e-07, + "loss": 1.119, + "step": 29395 + }, + { + "epoch": 0.89, + "learning_rate": 1.6977962891079725e-07, + "loss": 1.0804, + "step": 29396 + }, + { + "epoch": 0.89, + "learning_rate": 1.6969128446919863e-07, + "loss": 1.079, + "step": 29397 + }, + { + "epoch": 0.89, + "learning_rate": 1.6960296221101624e-07, + "loss": 1.1711, + "step": 29398 + }, + { + "epoch": 0.89, + "learning_rate": 1.695146621370916e-07, + "loss": 1.0856, + "step": 29399 + }, + { + "epoch": 0.89, + "learning_rate": 1.6942638424826519e-07, + "loss": 1.1283, + "step": 29400 + }, + { + "epoch": 0.89, + "learning_rate": 1.6933812854537685e-07, + "loss": 1.0732, + "step": 29401 + }, + { + "epoch": 0.89, + "learning_rate": 1.6924989502926703e-07, + "loss": 1.0597, + "step": 29402 + }, + { + "epoch": 0.89, + "learning_rate": 1.6916168370077561e-07, + "loss": 1.0728, + "step": 29403 + }, + { + "epoch": 0.89, + "learning_rate": 1.6907349456074252e-07, + "loss": 1.1397, + "step": 29404 + }, + { + "epoch": 0.89, + "learning_rate": 1.6898532761000703e-07, + "loss": 1.02, + "step": 29405 + }, + { + "epoch": 0.89, + "learning_rate": 1.6889718284940875e-07, + "loss": 1.0495, + "step": 29406 + }, + { + "epoch": 0.89, + "learning_rate": 1.688090602797865e-07, + "loss": 1.022, + "step": 29407 + }, + { + "epoch": 0.89, + "learning_rate": 1.68720959901979e-07, + "loss": 1.0682, + "step": 29408 + }, + { + "epoch": 0.89, + "learning_rate": 1.686328817168259e-07, + "loss": 1.0323, + "step": 29409 + }, + { + "epoch": 0.89, + "learning_rate": 1.6854482572516455e-07, + "loss": 1.0594, + "step": 29410 + }, + { + "epoch": 0.89, + "learning_rate": 1.6845679192783348e-07, + "loss": 1.1399, + "step": 29411 + }, + { + "epoch": 0.89, + "learning_rate": 1.683687803256709e-07, + "loss": 1.1609, + "step": 29412 + }, + { + "epoch": 0.89, + "learning_rate": 1.6828079091951472e-07, + "loss": 1.0703, + "step": 29413 + }, + { + "epoch": 0.89, + "learning_rate": 1.6819282371020234e-07, + "loss": 1.0939, + "step": 29414 + }, + { + "epoch": 0.89, + "learning_rate": 1.6810487869857117e-07, + "loss": 1.1929, + "step": 29415 + }, + { + "epoch": 0.89, + "learning_rate": 1.680169558854583e-07, + "loss": 1.195, + "step": 29416 + }, + { + "epoch": 0.89, + "learning_rate": 1.679290552717014e-07, + "loss": 1.0416, + "step": 29417 + }, + { + "epoch": 0.89, + "learning_rate": 1.6784117685813644e-07, + "loss": 1.0754, + "step": 29418 + }, + { + "epoch": 0.89, + "learning_rate": 1.6775332064560002e-07, + "loss": 1.0294, + "step": 29419 + }, + { + "epoch": 0.89, + "learning_rate": 1.6766548663492894e-07, + "loss": 0.9794, + "step": 29420 + }, + { + "epoch": 0.89, + "learning_rate": 1.675776748269592e-07, + "loss": 1.0228, + "step": 29421 + }, + { + "epoch": 0.89, + "learning_rate": 1.6748988522252678e-07, + "loss": 1.0781, + "step": 29422 + }, + { + "epoch": 0.89, + "learning_rate": 1.6740211782246717e-07, + "loss": 1.0674, + "step": 29423 + }, + { + "epoch": 0.89, + "learning_rate": 1.673143726276158e-07, + "loss": 1.2431, + "step": 29424 + }, + { + "epoch": 0.89, + "learning_rate": 1.6722664963880836e-07, + "loss": 1.0793, + "step": 29425 + }, + { + "epoch": 0.89, + "learning_rate": 1.6713894885687975e-07, + "loss": 1.0664, + "step": 29426 + }, + { + "epoch": 0.89, + "learning_rate": 1.6705127028266488e-07, + "loss": 1.093, + "step": 29427 + }, + { + "epoch": 0.89, + "learning_rate": 1.6696361391699807e-07, + "loss": 1.032, + "step": 29428 + }, + { + "epoch": 0.89, + "learning_rate": 1.668759797607139e-07, + "loss": 1.2001, + "step": 29429 + }, + { + "epoch": 0.89, + "learning_rate": 1.6678836781464675e-07, + "loss": 1.0862, + "step": 29430 + }, + { + "epoch": 0.89, + "learning_rate": 1.667007780796309e-07, + "loss": 1.0947, + "step": 29431 + }, + { + "epoch": 0.89, + "learning_rate": 1.6661321055649965e-07, + "loss": 1.1355, + "step": 29432 + }, + { + "epoch": 0.89, + "learning_rate": 1.66525665246087e-07, + "loss": 1.0634, + "step": 29433 + }, + { + "epoch": 0.89, + "learning_rate": 1.6643814214922644e-07, + "loss": 1.0685, + "step": 29434 + }, + { + "epoch": 0.89, + "learning_rate": 1.6635064126675037e-07, + "loss": 1.0842, + "step": 29435 + }, + { + "epoch": 0.89, + "learning_rate": 1.662631625994926e-07, + "loss": 1.0567, + "step": 29436 + }, + { + "epoch": 0.89, + "learning_rate": 1.661757061482852e-07, + "loss": 1.2234, + "step": 29437 + }, + { + "epoch": 0.89, + "learning_rate": 1.6608827191396115e-07, + "loss": 1.1136, + "step": 29438 + }, + { + "epoch": 0.89, + "learning_rate": 1.6600085989735337e-07, + "loss": 1.1106, + "step": 29439 + }, + { + "epoch": 0.89, + "learning_rate": 1.6591347009929259e-07, + "loss": 1.0439, + "step": 29440 + }, + { + "epoch": 0.89, + "learning_rate": 1.6582610252061177e-07, + "loss": 1.1139, + "step": 29441 + }, + { + "epoch": 0.89, + "learning_rate": 1.6573875716214216e-07, + "loss": 1.1509, + "step": 29442 + }, + { + "epoch": 0.89, + "learning_rate": 1.6565143402471562e-07, + "loss": 1.0595, + "step": 29443 + }, + { + "epoch": 0.89, + "learning_rate": 1.6556413310916287e-07, + "loss": 1.1562, + "step": 29444 + }, + { + "epoch": 0.89, + "learning_rate": 1.6547685441631518e-07, + "loss": 1.1152, + "step": 29445 + }, + { + "epoch": 0.89, + "learning_rate": 1.6538959794700356e-07, + "loss": 0.9971, + "step": 29446 + }, + { + "epoch": 0.89, + "learning_rate": 1.65302363702059e-07, + "loss": 1.0247, + "step": 29447 + }, + { + "epoch": 0.89, + "learning_rate": 1.6521515168231112e-07, + "loss": 1.1446, + "step": 29448 + }, + { + "epoch": 0.89, + "learning_rate": 1.6512796188859038e-07, + "loss": 1.1914, + "step": 29449 + }, + { + "epoch": 0.89, + "learning_rate": 1.650407943217272e-07, + "loss": 1.1746, + "step": 29450 + }, + { + "epoch": 0.89, + "learning_rate": 1.6495364898255094e-07, + "loss": 1.0148, + "step": 29451 + }, + { + "epoch": 0.89, + "learning_rate": 1.648665258718915e-07, + "loss": 1.105, + "step": 29452 + }, + { + "epoch": 0.89, + "learning_rate": 1.647794249905782e-07, + "loss": 1.1041, + "step": 29453 + }, + { + "epoch": 0.89, + "learning_rate": 1.646923463394398e-07, + "loss": 1.0419, + "step": 29454 + }, + { + "epoch": 0.89, + "learning_rate": 1.646052899193054e-07, + "loss": 1.119, + "step": 29455 + }, + { + "epoch": 0.89, + "learning_rate": 1.6451825573100406e-07, + "loss": 1.1732, + "step": 29456 + }, + { + "epoch": 0.89, + "learning_rate": 1.6443124377536423e-07, + "loss": 0.9999, + "step": 29457 + }, + { + "epoch": 0.89, + "learning_rate": 1.6434425405321392e-07, + "loss": 1.0786, + "step": 29458 + }, + { + "epoch": 0.89, + "learning_rate": 1.6425728656538186e-07, + "loss": 1.0071, + "step": 29459 + }, + { + "epoch": 0.89, + "learning_rate": 1.6417034131269522e-07, + "loss": 1.1666, + "step": 29460 + }, + { + "epoch": 0.89, + "learning_rate": 1.640834182959819e-07, + "loss": 1.0826, + "step": 29461 + }, + { + "epoch": 0.89, + "learning_rate": 1.6399651751606933e-07, + "loss": 1.1826, + "step": 29462 + }, + { + "epoch": 0.89, + "learning_rate": 1.6390963897378486e-07, + "loss": 1.0615, + "step": 29463 + }, + { + "epoch": 0.89, + "learning_rate": 1.6382278266995565e-07, + "loss": 1.0599, + "step": 29464 + }, + { + "epoch": 0.89, + "learning_rate": 1.637359486054088e-07, + "loss": 1.0938, + "step": 29465 + }, + { + "epoch": 0.89, + "learning_rate": 1.6364913678097004e-07, + "loss": 1.1234, + "step": 29466 + }, + { + "epoch": 0.89, + "learning_rate": 1.6356234719746623e-07, + "loss": 1.1036, + "step": 29467 + }, + { + "epoch": 0.89, + "learning_rate": 1.6347557985572388e-07, + "loss": 1.1993, + "step": 29468 + }, + { + "epoch": 0.89, + "learning_rate": 1.6338883475656876e-07, + "loss": 1.1069, + "step": 29469 + }, + { + "epoch": 0.89, + "learning_rate": 1.6330211190082628e-07, + "loss": 1.1016, + "step": 29470 + }, + { + "epoch": 0.89, + "learning_rate": 1.632154112893225e-07, + "loss": 1.0203, + "step": 29471 + }, + { + "epoch": 0.89, + "learning_rate": 1.6312873292288227e-07, + "loss": 1.1859, + "step": 29472 + }, + { + "epoch": 0.89, + "learning_rate": 1.6304207680233163e-07, + "loss": 0.9611, + "step": 29473 + }, + { + "epoch": 0.89, + "learning_rate": 1.6295544292849436e-07, + "loss": 1.1039, + "step": 29474 + }, + { + "epoch": 0.89, + "learning_rate": 1.628688313021959e-07, + "loss": 1.2121, + "step": 29475 + }, + { + "epoch": 0.89, + "learning_rate": 1.6278224192426058e-07, + "loss": 1.032, + "step": 29476 + }, + { + "epoch": 0.89, + "learning_rate": 1.6269567479551246e-07, + "loss": 1.1273, + "step": 29477 + }, + { + "epoch": 0.89, + "learning_rate": 1.6260912991677646e-07, + "loss": 0.9918, + "step": 29478 + }, + { + "epoch": 0.89, + "learning_rate": 1.6252260728887525e-07, + "loss": 1.1987, + "step": 29479 + }, + { + "epoch": 0.89, + "learning_rate": 1.624361069126329e-07, + "loss": 1.1129, + "step": 29480 + }, + { + "epoch": 0.89, + "learning_rate": 1.6234962878887344e-07, + "loss": 1.0923, + "step": 29481 + }, + { + "epoch": 0.89, + "learning_rate": 1.6226317291841958e-07, + "loss": 1.077, + "step": 29482 + }, + { + "epoch": 0.89, + "learning_rate": 1.6217673930209426e-07, + "loss": 1.0482, + "step": 29483 + }, + { + "epoch": 0.89, + "learning_rate": 1.620903279407207e-07, + "loss": 1.1111, + "step": 29484 + }, + { + "epoch": 0.89, + "learning_rate": 1.6200393883512076e-07, + "loss": 1.0628, + "step": 29485 + }, + { + "epoch": 0.89, + "learning_rate": 1.6191757198611768e-07, + "loss": 1.0087, + "step": 29486 + }, + { + "epoch": 0.89, + "learning_rate": 1.61831227394533e-07, + "loss": 0.9907, + "step": 29487 + }, + { + "epoch": 0.89, + "learning_rate": 1.6174490506118913e-07, + "loss": 1.2028, + "step": 29488 + }, + { + "epoch": 0.89, + "learning_rate": 1.616586049869076e-07, + "loss": 1.0403, + "step": 29489 + }, + { + "epoch": 0.89, + "learning_rate": 1.6157232717250976e-07, + "loss": 1.0931, + "step": 29490 + }, + { + "epoch": 0.89, + "learning_rate": 1.614860716188177e-07, + "loss": 1.062, + "step": 29491 + }, + { + "epoch": 0.89, + "learning_rate": 1.6139983832665158e-07, + "loss": 1.0219, + "step": 29492 + }, + { + "epoch": 0.89, + "learning_rate": 1.613136272968327e-07, + "loss": 1.1844, + "step": 29493 + }, + { + "epoch": 0.89, + "learning_rate": 1.612274385301818e-07, + "loss": 1.0696, + "step": 29494 + }, + { + "epoch": 0.89, + "learning_rate": 1.611412720275196e-07, + "loss": 1.0461, + "step": 29495 + }, + { + "epoch": 0.89, + "learning_rate": 1.610551277896655e-07, + "loss": 1.0773, + "step": 29496 + }, + { + "epoch": 0.89, + "learning_rate": 1.609690058174404e-07, + "loss": 1.0082, + "step": 29497 + }, + { + "epoch": 0.89, + "learning_rate": 1.6088290611166375e-07, + "loss": 1.14, + "step": 29498 + }, + { + "epoch": 0.89, + "learning_rate": 1.6079682867315566e-07, + "loss": 1.0401, + "step": 29499 + }, + { + "epoch": 0.89, + "learning_rate": 1.6071077350273469e-07, + "loss": 1.119, + "step": 29500 + }, + { + "epoch": 0.89, + "learning_rate": 1.6062474060122042e-07, + "loss": 0.9948, + "step": 29501 + }, + { + "epoch": 0.89, + "learning_rate": 1.605387299694322e-07, + "loss": 1.0681, + "step": 29502 + }, + { + "epoch": 0.89, + "learning_rate": 1.604527416081883e-07, + "loss": 1.0701, + "step": 29503 + }, + { + "epoch": 0.89, + "learning_rate": 1.6036677551830804e-07, + "loss": 1.0776, + "step": 29504 + }, + { + "epoch": 0.89, + "learning_rate": 1.602808317006091e-07, + "loss": 1.0776, + "step": 29505 + }, + { + "epoch": 0.89, + "learning_rate": 1.6019491015590944e-07, + "loss": 1.2014, + "step": 29506 + }, + { + "epoch": 0.89, + "learning_rate": 1.6010901088502757e-07, + "loss": 1.1585, + "step": 29507 + }, + { + "epoch": 0.89, + "learning_rate": 1.6002313388878144e-07, + "loss": 1.0602, + "step": 29508 + }, + { + "epoch": 0.89, + "learning_rate": 1.5993727916798735e-07, + "loss": 1.153, + "step": 29509 + }, + { + "epoch": 0.89, + "learning_rate": 1.598514467234638e-07, + "loss": 1.0803, + "step": 29510 + }, + { + "epoch": 0.89, + "learning_rate": 1.597656365560271e-07, + "loss": 1.0865, + "step": 29511 + }, + { + "epoch": 0.89, + "learning_rate": 1.5967984866649467e-07, + "loss": 1.0022, + "step": 29512 + }, + { + "epoch": 0.89, + "learning_rate": 1.5959408305568276e-07, + "loss": 1.1149, + "step": 29513 + }, + { + "epoch": 0.89, + "learning_rate": 1.5950833972440792e-07, + "loss": 1.0732, + "step": 29514 + }, + { + "epoch": 0.89, + "learning_rate": 1.594226186734868e-07, + "loss": 1.0447, + "step": 29515 + }, + { + "epoch": 0.89, + "learning_rate": 1.5933691990373478e-07, + "loss": 1.0088, + "step": 29516 + }, + { + "epoch": 0.89, + "learning_rate": 1.592512434159685e-07, + "loss": 1.0949, + "step": 29517 + }, + { + "epoch": 0.89, + "learning_rate": 1.591655892110025e-07, + "loss": 1.1547, + "step": 29518 + }, + { + "epoch": 0.89, + "learning_rate": 1.5907995728965286e-07, + "loss": 1.1302, + "step": 29519 + }, + { + "epoch": 0.89, + "learning_rate": 1.5899434765273475e-07, + "loss": 1.0654, + "step": 29520 + }, + { + "epoch": 0.89, + "learning_rate": 1.5890876030106305e-07, + "loss": 1.096, + "step": 29521 + }, + { + "epoch": 0.89, + "learning_rate": 1.5882319523545243e-07, + "loss": 1.0054, + "step": 29522 + }, + { + "epoch": 0.89, + "learning_rate": 1.5873765245671718e-07, + "loss": 1.0101, + "step": 29523 + }, + { + "epoch": 0.89, + "learning_rate": 1.5865213196567196e-07, + "loss": 1.131, + "step": 29524 + }, + { + "epoch": 0.89, + "learning_rate": 1.5856663376313114e-07, + "loss": 1.0253, + "step": 29525 + }, + { + "epoch": 0.89, + "learning_rate": 1.5848115784990792e-07, + "loss": 1.0265, + "step": 29526 + }, + { + "epoch": 0.89, + "learning_rate": 1.583957042268164e-07, + "loss": 1.1505, + "step": 29527 + }, + { + "epoch": 0.89, + "learning_rate": 1.5831027289467005e-07, + "loss": 1.059, + "step": 29528 + }, + { + "epoch": 0.89, + "learning_rate": 1.5822486385428186e-07, + "loss": 1.0267, + "step": 29529 + }, + { + "epoch": 0.89, + "learning_rate": 1.5813947710646592e-07, + "loss": 1.2579, + "step": 29530 + }, + { + "epoch": 0.89, + "learning_rate": 1.5805411265203352e-07, + "loss": 1.1555, + "step": 29531 + }, + { + "epoch": 0.89, + "learning_rate": 1.5796877049179814e-07, + "loss": 1.0853, + "step": 29532 + }, + { + "epoch": 0.89, + "learning_rate": 1.5788345062657224e-07, + "loss": 1.1752, + "step": 29533 + }, + { + "epoch": 0.89, + "learning_rate": 1.5779815305716818e-07, + "loss": 1.1758, + "step": 29534 + }, + { + "epoch": 0.89, + "learning_rate": 1.5771287778439754e-07, + "loss": 1.1115, + "step": 29535 + }, + { + "epoch": 0.89, + "learning_rate": 1.576276248090719e-07, + "loss": 1.0703, + "step": 29536 + }, + { + "epoch": 0.89, + "learning_rate": 1.5754239413200312e-07, + "loss": 0.9792, + "step": 29537 + }, + { + "epoch": 0.89, + "learning_rate": 1.5745718575400275e-07, + "loss": 1.0151, + "step": 29538 + }, + { + "epoch": 0.89, + "learning_rate": 1.5737199967588185e-07, + "loss": 1.1862, + "step": 29539 + }, + { + "epoch": 0.89, + "learning_rate": 1.572868358984511e-07, + "loss": 1.0569, + "step": 29540 + }, + { + "epoch": 0.89, + "learning_rate": 1.572016944225216e-07, + "loss": 1.0616, + "step": 29541 + }, + { + "epoch": 0.89, + "learning_rate": 1.5711657524890345e-07, + "loss": 1.1229, + "step": 29542 + }, + { + "epoch": 0.89, + "learning_rate": 1.5703147837840716e-07, + "loss": 1.0898, + "step": 29543 + }, + { + "epoch": 0.89, + "learning_rate": 1.569464038118429e-07, + "loss": 0.9849, + "step": 29544 + }, + { + "epoch": 0.89, + "learning_rate": 1.5686135155002002e-07, + "loss": 0.9971, + "step": 29545 + }, + { + "epoch": 0.89, + "learning_rate": 1.56776321593749e-07, + "loss": 1.0549, + "step": 29546 + }, + { + "epoch": 0.89, + "learning_rate": 1.5669131394383919e-07, + "loss": 1.0953, + "step": 29547 + }, + { + "epoch": 0.89, + "learning_rate": 1.566063286010988e-07, + "loss": 1.0482, + "step": 29548 + }, + { + "epoch": 0.89, + "learning_rate": 1.565213655663378e-07, + "loss": 1.1747, + "step": 29549 + }, + { + "epoch": 0.89, + "learning_rate": 1.5643642484036464e-07, + "loss": 1.0518, + "step": 29550 + }, + { + "epoch": 0.89, + "learning_rate": 1.5635150642398843e-07, + "loss": 1.132, + "step": 29551 + }, + { + "epoch": 0.89, + "learning_rate": 1.5626661031801687e-07, + "loss": 1.0709, + "step": 29552 + }, + { + "epoch": 0.89, + "learning_rate": 1.561817365232582e-07, + "loss": 1.1202, + "step": 29553 + }, + { + "epoch": 0.89, + "learning_rate": 1.5609688504052063e-07, + "loss": 1.0498, + "step": 29554 + }, + { + "epoch": 0.89, + "learning_rate": 1.5601205587061214e-07, + "loss": 1.1308, + "step": 29555 + }, + { + "epoch": 0.89, + "learning_rate": 1.5592724901433986e-07, + "loss": 1.0051, + "step": 29556 + }, + { + "epoch": 0.89, + "learning_rate": 1.5584246447251123e-07, + "loss": 1.1389, + "step": 29557 + }, + { + "epoch": 0.89, + "learning_rate": 1.5575770224593333e-07, + "loss": 1.0765, + "step": 29558 + }, + { + "epoch": 0.89, + "learning_rate": 1.5567296233541278e-07, + "loss": 1.1198, + "step": 29559 + }, + { + "epoch": 0.89, + "learning_rate": 1.5558824474175728e-07, + "loss": 1.2238, + "step": 29560 + }, + { + "epoch": 0.89, + "learning_rate": 1.5550354946577195e-07, + "loss": 1.2026, + "step": 29561 + }, + { + "epoch": 0.89, + "learning_rate": 1.554188765082637e-07, + "loss": 1.2179, + "step": 29562 + }, + { + "epoch": 0.89, + "learning_rate": 1.5533422587003881e-07, + "loss": 1.0799, + "step": 29563 + }, + { + "epoch": 0.89, + "learning_rate": 1.5524959755190304e-07, + "loss": 1.063, + "step": 29564 + }, + { + "epoch": 0.89, + "learning_rate": 1.5516499155466157e-07, + "loss": 1.0664, + "step": 29565 + }, + { + "epoch": 0.89, + "learning_rate": 1.5508040787911988e-07, + "loss": 1.0447, + "step": 29566 + }, + { + "epoch": 0.89, + "learning_rate": 1.549958465260834e-07, + "loss": 1.1671, + "step": 29567 + }, + { + "epoch": 0.89, + "learning_rate": 1.5491130749635734e-07, + "loss": 1.1848, + "step": 29568 + }, + { + "epoch": 0.89, + "learning_rate": 1.548267907907458e-07, + "loss": 1.0488, + "step": 29569 + }, + { + "epoch": 0.89, + "learning_rate": 1.5474229641005396e-07, + "loss": 1.1014, + "step": 29570 + }, + { + "epoch": 0.89, + "learning_rate": 1.5465782435508585e-07, + "loss": 1.1826, + "step": 29571 + }, + { + "epoch": 0.89, + "learning_rate": 1.545733746266459e-07, + "loss": 1.0963, + "step": 29572 + }, + { + "epoch": 0.89, + "learning_rate": 1.5448894722553787e-07, + "loss": 1.1854, + "step": 29573 + }, + { + "epoch": 0.89, + "learning_rate": 1.544045421525653e-07, + "loss": 1.0502, + "step": 29574 + }, + { + "epoch": 0.89, + "learning_rate": 1.5432015940853168e-07, + "loss": 1.176, + "step": 29575 + }, + { + "epoch": 0.89, + "learning_rate": 1.5423579899424056e-07, + "loss": 1.0921, + "step": 29576 + }, + { + "epoch": 0.89, + "learning_rate": 1.541514609104952e-07, + "loss": 1.1614, + "step": 29577 + }, + { + "epoch": 0.89, + "learning_rate": 1.5406714515809774e-07, + "loss": 1.1478, + "step": 29578 + }, + { + "epoch": 0.89, + "learning_rate": 1.5398285173785138e-07, + "loss": 1.1748, + "step": 29579 + }, + { + "epoch": 0.89, + "learning_rate": 1.5389858065055802e-07, + "loss": 1.1031, + "step": 29580 + }, + { + "epoch": 0.89, + "learning_rate": 1.538143318970206e-07, + "loss": 1.0403, + "step": 29581 + }, + { + "epoch": 0.89, + "learning_rate": 1.5373010547804101e-07, + "loss": 1.0743, + "step": 29582 + }, + { + "epoch": 0.89, + "learning_rate": 1.5364590139442053e-07, + "loss": 1.0674, + "step": 29583 + }, + { + "epoch": 0.89, + "learning_rate": 1.5356171964696077e-07, + "loss": 1.0198, + "step": 29584 + }, + { + "epoch": 0.89, + "learning_rate": 1.5347756023646355e-07, + "loss": 1.1057, + "step": 29585 + }, + { + "epoch": 0.89, + "learning_rate": 1.5339342316373017e-07, + "loss": 1.1755, + "step": 29586 + }, + { + "epoch": 0.89, + "learning_rate": 1.5330930842956087e-07, + "loss": 1.0926, + "step": 29587 + }, + { + "epoch": 0.89, + "learning_rate": 1.5322521603475692e-07, + "loss": 1.159, + "step": 29588 + }, + { + "epoch": 0.89, + "learning_rate": 1.5314114598011827e-07, + "loss": 1.0824, + "step": 29589 + }, + { + "epoch": 0.89, + "learning_rate": 1.5305709826644645e-07, + "loss": 1.1464, + "step": 29590 + }, + { + "epoch": 0.89, + "learning_rate": 1.5297307289454e-07, + "loss": 1.0613, + "step": 29591 + }, + { + "epoch": 0.89, + "learning_rate": 1.5288906986519969e-07, + "loss": 1.1799, + "step": 29592 + }, + { + "epoch": 0.89, + "learning_rate": 1.5280508917922487e-07, + "loss": 1.1153, + "step": 29593 + }, + { + "epoch": 0.89, + "learning_rate": 1.5272113083741547e-07, + "loss": 1.1601, + "step": 29594 + }, + { + "epoch": 0.89, + "learning_rate": 1.5263719484057028e-07, + "loss": 1.1185, + "step": 29595 + }, + { + "epoch": 0.89, + "learning_rate": 1.5255328118948835e-07, + "loss": 1.1501, + "step": 29596 + }, + { + "epoch": 0.89, + "learning_rate": 1.5246938988496856e-07, + "loss": 0.982, + "step": 29597 + }, + { + "epoch": 0.89, + "learning_rate": 1.5238552092780967e-07, + "loss": 1.1011, + "step": 29598 + }, + { + "epoch": 0.89, + "learning_rate": 1.523016743188105e-07, + "loss": 1.1838, + "step": 29599 + }, + { + "epoch": 0.89, + "learning_rate": 1.5221785005876816e-07, + "loss": 1.2737, + "step": 29600 + }, + { + "epoch": 0.89, + "learning_rate": 1.5213404814848122e-07, + "loss": 1.0515, + "step": 29601 + }, + { + "epoch": 0.89, + "learning_rate": 1.5205026858874733e-07, + "loss": 1.0649, + "step": 29602 + }, + { + "epoch": 0.89, + "learning_rate": 1.519665113803645e-07, + "loss": 1.011, + "step": 29603 + }, + { + "epoch": 0.89, + "learning_rate": 1.5188277652412902e-07, + "loss": 1.0591, + "step": 29604 + }, + { + "epoch": 0.89, + "learning_rate": 1.5179906402083888e-07, + "loss": 1.0167, + "step": 29605 + }, + { + "epoch": 0.89, + "learning_rate": 1.5171537387129066e-07, + "loss": 1.1201, + "step": 29606 + }, + { + "epoch": 0.89, + "learning_rate": 1.516317060762812e-07, + "loss": 1.032, + "step": 29607 + }, + { + "epoch": 0.89, + "learning_rate": 1.515480606366071e-07, + "loss": 1.1465, + "step": 29608 + }, + { + "epoch": 0.89, + "learning_rate": 1.514644375530641e-07, + "loss": 1.0742, + "step": 29609 + }, + { + "epoch": 0.89, + "learning_rate": 1.5138083682644855e-07, + "loss": 1.1035, + "step": 29610 + }, + { + "epoch": 0.89, + "learning_rate": 1.5129725845755615e-07, + "loss": 0.9865, + "step": 29611 + }, + { + "epoch": 0.89, + "learning_rate": 1.5121370244718326e-07, + "loss": 1.0919, + "step": 29612 + }, + { + "epoch": 0.89, + "learning_rate": 1.5113016879612418e-07, + "loss": 1.0829, + "step": 29613 + }, + { + "epoch": 0.89, + "learning_rate": 1.5104665750517473e-07, + "loss": 1.1532, + "step": 29614 + }, + { + "epoch": 0.89, + "learning_rate": 1.5096316857512976e-07, + "loss": 0.9819, + "step": 29615 + }, + { + "epoch": 0.89, + "learning_rate": 1.5087970200678454e-07, + "loss": 1.0784, + "step": 29616 + }, + { + "epoch": 0.89, + "learning_rate": 1.507962578009328e-07, + "loss": 1.0921, + "step": 29617 + }, + { + "epoch": 0.89, + "learning_rate": 1.5071283595836928e-07, + "loss": 1.0733, + "step": 29618 + }, + { + "epoch": 0.89, + "learning_rate": 1.5062943647988798e-07, + "loss": 1.1542, + "step": 29619 + }, + { + "epoch": 0.89, + "learning_rate": 1.5054605936628302e-07, + "loss": 1.0601, + "step": 29620 + }, + { + "epoch": 0.89, + "learning_rate": 1.504627046183482e-07, + "loss": 1.0419, + "step": 29621 + }, + { + "epoch": 0.89, + "learning_rate": 1.503793722368768e-07, + "loss": 1.1261, + "step": 29622 + }, + { + "epoch": 0.89, + "learning_rate": 1.5029606222266235e-07, + "loss": 1.2554, + "step": 29623 + }, + { + "epoch": 0.89, + "learning_rate": 1.5021277457649753e-07, + "loss": 1.0732, + "step": 29624 + }, + { + "epoch": 0.89, + "learning_rate": 1.501295092991753e-07, + "loss": 0.9878, + "step": 29625 + }, + { + "epoch": 0.89, + "learning_rate": 1.500462663914884e-07, + "loss": 1.1647, + "step": 29626 + }, + { + "epoch": 0.89, + "learning_rate": 1.4996304585422922e-07, + "loss": 1.1046, + "step": 29627 + }, + { + "epoch": 0.89, + "learning_rate": 1.498798476881902e-07, + "loss": 1.1288, + "step": 29628 + }, + { + "epoch": 0.89, + "learning_rate": 1.4979667189416347e-07, + "loss": 1.1802, + "step": 29629 + }, + { + "epoch": 0.89, + "learning_rate": 1.497135184729401e-07, + "loss": 1.1669, + "step": 29630 + }, + { + "epoch": 0.89, + "learning_rate": 1.4963038742531216e-07, + "loss": 1.2527, + "step": 29631 + }, + { + "epoch": 0.89, + "learning_rate": 1.4954727875207075e-07, + "loss": 1.1085, + "step": 29632 + }, + { + "epoch": 0.89, + "learning_rate": 1.49464192454008e-07, + "loss": 1.0278, + "step": 29633 + }, + { + "epoch": 0.89, + "learning_rate": 1.4938112853191329e-07, + "loss": 1.0661, + "step": 29634 + }, + { + "epoch": 0.89, + "learning_rate": 1.4929808698657843e-07, + "loss": 1.0762, + "step": 29635 + }, + { + "epoch": 0.89, + "learning_rate": 1.492150678187937e-07, + "loss": 1.2071, + "step": 29636 + }, + { + "epoch": 0.89, + "learning_rate": 1.4913207102934896e-07, + "loss": 1.1572, + "step": 29637 + }, + { + "epoch": 0.89, + "learning_rate": 1.4904909661903556e-07, + "loss": 1.0294, + "step": 29638 + }, + { + "epoch": 0.89, + "learning_rate": 1.4896614458864171e-07, + "loss": 1.0086, + "step": 29639 + }, + { + "epoch": 0.89, + "learning_rate": 1.4888321493895797e-07, + "loss": 1.0358, + "step": 29640 + }, + { + "epoch": 0.89, + "learning_rate": 1.4880030767077393e-07, + "loss": 1.0142, + "step": 29641 + }, + { + "epoch": 0.89, + "learning_rate": 1.4871742278487867e-07, + "loss": 1.1069, + "step": 29642 + }, + { + "epoch": 0.89, + "learning_rate": 1.4863456028206075e-07, + "loss": 1.1731, + "step": 29643 + }, + { + "epoch": 0.89, + "learning_rate": 1.4855172016310954e-07, + "loss": 1.0641, + "step": 29644 + }, + { + "epoch": 0.89, + "learning_rate": 1.4846890242881328e-07, + "loss": 1.0618, + "step": 29645 + }, + { + "epoch": 0.89, + "learning_rate": 1.4838610707996108e-07, + "loss": 1.0582, + "step": 29646 + }, + { + "epoch": 0.89, + "learning_rate": 1.483033341173401e-07, + "loss": 1.0482, + "step": 29647 + }, + { + "epoch": 0.89, + "learning_rate": 1.4822058354173886e-07, + "loss": 1.2147, + "step": 29648 + }, + { + "epoch": 0.89, + "learning_rate": 1.4813785535394503e-07, + "loss": 1.126, + "step": 29649 + }, + { + "epoch": 0.89, + "learning_rate": 1.480551495547461e-07, + "loss": 1.2238, + "step": 29650 + }, + { + "epoch": 0.89, + "learning_rate": 1.4797246614492916e-07, + "loss": 1.0425, + "step": 29651 + }, + { + "epoch": 0.89, + "learning_rate": 1.4788980512528167e-07, + "loss": 1.0811, + "step": 29652 + }, + { + "epoch": 0.89, + "learning_rate": 1.478071664965905e-07, + "loss": 1.1448, + "step": 29653 + }, + { + "epoch": 0.89, + "learning_rate": 1.4772455025964222e-07, + "loss": 1.0969, + "step": 29654 + }, + { + "epoch": 0.89, + "learning_rate": 1.4764195641522372e-07, + "loss": 1.0385, + "step": 29655 + }, + { + "epoch": 0.89, + "learning_rate": 1.4755938496412077e-07, + "loss": 1.2067, + "step": 29656 + }, + { + "epoch": 0.89, + "learning_rate": 1.4747683590711908e-07, + "loss": 1.0688, + "step": 29657 + }, + { + "epoch": 0.89, + "learning_rate": 1.4739430924500503e-07, + "loss": 1.028, + "step": 29658 + }, + { + "epoch": 0.89, + "learning_rate": 1.473118049785646e-07, + "loss": 1.1516, + "step": 29659 + }, + { + "epoch": 0.89, + "learning_rate": 1.4722932310858196e-07, + "loss": 1.0805, + "step": 29660 + }, + { + "epoch": 0.89, + "learning_rate": 1.4714686363584335e-07, + "loss": 1.0433, + "step": 29661 + }, + { + "epoch": 0.89, + "learning_rate": 1.4706442656113345e-07, + "loss": 1.1609, + "step": 29662 + }, + { + "epoch": 0.89, + "learning_rate": 1.469820118852369e-07, + "loss": 1.0757, + "step": 29663 + }, + { + "epoch": 0.89, + "learning_rate": 1.4689961960893868e-07, + "loss": 1.1242, + "step": 29664 + }, + { + "epoch": 0.89, + "learning_rate": 1.4681724973302254e-07, + "loss": 1.0543, + "step": 29665 + }, + { + "epoch": 0.89, + "learning_rate": 1.4673490225827259e-07, + "loss": 1.0941, + "step": 29666 + }, + { + "epoch": 0.89, + "learning_rate": 1.466525771854732e-07, + "loss": 1.1394, + "step": 29667 + }, + { + "epoch": 0.89, + "learning_rate": 1.4657027451540823e-07, + "loss": 1.1852, + "step": 29668 + }, + { + "epoch": 0.89, + "learning_rate": 1.4648799424886033e-07, + "loss": 1.1616, + "step": 29669 + }, + { + "epoch": 0.89, + "learning_rate": 1.4640573638661338e-07, + "loss": 1.0606, + "step": 29670 + }, + { + "epoch": 0.89, + "learning_rate": 1.463235009294503e-07, + "loss": 1.0982, + "step": 29671 + }, + { + "epoch": 0.89, + "learning_rate": 1.462412878781541e-07, + "loss": 1.129, + "step": 29672 + }, + { + "epoch": 0.89, + "learning_rate": 1.4615909723350696e-07, + "loss": 0.9667, + "step": 29673 + }, + { + "epoch": 0.89, + "learning_rate": 1.4607692899629156e-07, + "loss": 0.9905, + "step": 29674 + }, + { + "epoch": 0.89, + "learning_rate": 1.4599478316729032e-07, + "loss": 1.1279, + "step": 29675 + }, + { + "epoch": 0.89, + "learning_rate": 1.4591265974728457e-07, + "loss": 1.0248, + "step": 29676 + }, + { + "epoch": 0.89, + "learning_rate": 1.4583055873705704e-07, + "loss": 1.1455, + "step": 29677 + }, + { + "epoch": 0.89, + "learning_rate": 1.4574848013738846e-07, + "loss": 1.1334, + "step": 29678 + }, + { + "epoch": 0.89, + "learning_rate": 1.4566642394906045e-07, + "loss": 1.0834, + "step": 29679 + }, + { + "epoch": 0.89, + "learning_rate": 1.455843901728543e-07, + "loss": 1.1429, + "step": 29680 + }, + { + "epoch": 0.89, + "learning_rate": 1.4550237880955137e-07, + "loss": 1.0975, + "step": 29681 + }, + { + "epoch": 0.89, + "learning_rate": 1.454203898599313e-07, + "loss": 1.2098, + "step": 29682 + }, + { + "epoch": 0.89, + "learning_rate": 1.453384233247751e-07, + "loss": 1.0815, + "step": 29683 + }, + { + "epoch": 0.89, + "learning_rate": 1.4525647920486302e-07, + "loss": 1.1143, + "step": 29684 + }, + { + "epoch": 0.89, + "learning_rate": 1.4517455750097553e-07, + "loss": 0.9445, + "step": 29685 + }, + { + "epoch": 0.89, + "learning_rate": 1.45092658213892e-07, + "loss": 1.0585, + "step": 29686 + }, + { + "epoch": 0.89, + "learning_rate": 1.4501078134439184e-07, + "loss": 1.0782, + "step": 29687 + }, + { + "epoch": 0.89, + "learning_rate": 1.4492892689325523e-07, + "loss": 1.1323, + "step": 29688 + }, + { + "epoch": 0.89, + "learning_rate": 1.448470948612607e-07, + "loss": 1.0944, + "step": 29689 + }, + { + "epoch": 0.89, + "learning_rate": 1.4476528524918792e-07, + "loss": 1.1609, + "step": 29690 + }, + { + "epoch": 0.89, + "learning_rate": 1.4468349805781517e-07, + "loss": 1.1589, + "step": 29691 + }, + { + "epoch": 0.89, + "learning_rate": 1.4460173328792098e-07, + "loss": 1.0898, + "step": 29692 + }, + { + "epoch": 0.89, + "learning_rate": 1.445199909402839e-07, + "loss": 1.0137, + "step": 29693 + }, + { + "epoch": 0.89, + "learning_rate": 1.444382710156825e-07, + "loss": 1.2548, + "step": 29694 + }, + { + "epoch": 0.89, + "learning_rate": 1.4435657351489385e-07, + "loss": 1.1932, + "step": 29695 + }, + { + "epoch": 0.89, + "learning_rate": 1.442748984386963e-07, + "loss": 1.1192, + "step": 29696 + }, + { + "epoch": 0.89, + "learning_rate": 1.4419324578786697e-07, + "loss": 1.1293, + "step": 29697 + }, + { + "epoch": 0.89, + "learning_rate": 1.441116155631836e-07, + "loss": 1.0609, + "step": 29698 + }, + { + "epoch": 0.89, + "learning_rate": 1.4403000776542275e-07, + "loss": 1.0322, + "step": 29699 + }, + { + "epoch": 0.89, + "learning_rate": 1.439484223953616e-07, + "loss": 1.1065, + "step": 29700 + }, + { + "epoch": 0.89, + "learning_rate": 1.4386685945377677e-07, + "loss": 1.0167, + "step": 29701 + }, + { + "epoch": 0.89, + "learning_rate": 1.4378531894144483e-07, + "loss": 1.0569, + "step": 29702 + }, + { + "epoch": 0.89, + "learning_rate": 1.4370380085914154e-07, + "loss": 1.0377, + "step": 29703 + }, + { + "epoch": 0.89, + "learning_rate": 1.4362230520764352e-07, + "loss": 1.017, + "step": 29704 + }, + { + "epoch": 0.89, + "learning_rate": 1.4354083198772602e-07, + "loss": 1.1459, + "step": 29705 + }, + { + "epoch": 0.89, + "learning_rate": 1.4345938120016555e-07, + "loss": 1.1125, + "step": 29706 + }, + { + "epoch": 0.89, + "learning_rate": 1.433779528457363e-07, + "loss": 1.1777, + "step": 29707 + }, + { + "epoch": 0.89, + "learning_rate": 1.4329654692521373e-07, + "loss": 1.0418, + "step": 29708 + }, + { + "epoch": 0.89, + "learning_rate": 1.432151634393733e-07, + "loss": 0.9675, + "step": 29709 + }, + { + "epoch": 0.9, + "learning_rate": 1.4313380238898944e-07, + "loss": 1.0536, + "step": 29710 + }, + { + "epoch": 0.9, + "learning_rate": 1.4305246377483706e-07, + "loss": 1.113, + "step": 29711 + }, + { + "epoch": 0.9, + "learning_rate": 1.4297114759768942e-07, + "loss": 1.0818, + "step": 29712 + }, + { + "epoch": 0.9, + "learning_rate": 1.428898538583215e-07, + "loss": 1.1966, + "step": 29713 + }, + { + "epoch": 0.9, + "learning_rate": 1.4280858255750706e-07, + "loss": 1.1572, + "step": 29714 + }, + { + "epoch": 0.9, + "learning_rate": 1.4272733369601944e-07, + "loss": 1.0087, + "step": 29715 + }, + { + "epoch": 0.9, + "learning_rate": 1.4264610727463268e-07, + "loss": 1.1289, + "step": 29716 + }, + { + "epoch": 0.9, + "learning_rate": 1.4256490329411954e-07, + "loss": 1.0806, + "step": 29717 + }, + { + "epoch": 0.9, + "learning_rate": 1.424837217552527e-07, + "loss": 1.2351, + "step": 29718 + }, + { + "epoch": 0.9, + "learning_rate": 1.4240256265880574e-07, + "loss": 0.9594, + "step": 29719 + }, + { + "epoch": 0.9, + "learning_rate": 1.423214260055511e-07, + "loss": 1.0595, + "step": 29720 + }, + { + "epoch": 0.9, + "learning_rate": 1.4224031179626092e-07, + "loss": 0.98, + "step": 29721 + }, + { + "epoch": 0.9, + "learning_rate": 1.4215922003170706e-07, + "loss": 1.0563, + "step": 29722 + }, + { + "epoch": 0.9, + "learning_rate": 1.4207815071266202e-07, + "loss": 1.0415, + "step": 29723 + }, + { + "epoch": 0.9, + "learning_rate": 1.4199710383989789e-07, + "loss": 1.2224, + "step": 29724 + }, + { + "epoch": 0.9, + "learning_rate": 1.4191607941418522e-07, + "loss": 1.1351, + "step": 29725 + }, + { + "epoch": 0.9, + "learning_rate": 1.418350774362956e-07, + "loss": 1.014, + "step": 29726 + }, + { + "epoch": 0.9, + "learning_rate": 1.4175409790700033e-07, + "loss": 1.1104, + "step": 29727 + }, + { + "epoch": 0.9, + "learning_rate": 1.416731408270705e-07, + "loss": 1.061, + "step": 29728 + }, + { + "epoch": 0.9, + "learning_rate": 1.4159220619727688e-07, + "loss": 1.1669, + "step": 29729 + }, + { + "epoch": 0.9, + "learning_rate": 1.415112940183891e-07, + "loss": 1.1469, + "step": 29730 + }, + { + "epoch": 0.9, + "learning_rate": 1.4143040429117792e-07, + "loss": 0.9668, + "step": 29731 + }, + { + "epoch": 0.9, + "learning_rate": 1.4134953701641364e-07, + "loss": 1.1179, + "step": 29732 + }, + { + "epoch": 0.9, + "learning_rate": 1.4126869219486555e-07, + "loss": 1.2216, + "step": 29733 + }, + { + "epoch": 0.9, + "learning_rate": 1.4118786982730336e-07, + "loss": 1.0703, + "step": 29734 + }, + { + "epoch": 0.9, + "learning_rate": 1.41107069914497e-07, + "loss": 1.0509, + "step": 29735 + }, + { + "epoch": 0.9, + "learning_rate": 1.4102629245721505e-07, + "loss": 1.0854, + "step": 29736 + }, + { + "epoch": 0.9, + "learning_rate": 1.4094553745622686e-07, + "loss": 1.0212, + "step": 29737 + }, + { + "epoch": 0.9, + "learning_rate": 1.4086480491230098e-07, + "loss": 1.0967, + "step": 29738 + }, + { + "epoch": 0.9, + "learning_rate": 1.407840948262057e-07, + "loss": 1.2054, + "step": 29739 + }, + { + "epoch": 0.9, + "learning_rate": 1.4070340719870983e-07, + "loss": 1.0687, + "step": 29740 + }, + { + "epoch": 0.9, + "learning_rate": 1.4062274203058085e-07, + "loss": 1.0768, + "step": 29741 + }, + { + "epoch": 0.9, + "learning_rate": 1.4054209932258784e-07, + "loss": 1.1041, + "step": 29742 + }, + { + "epoch": 0.9, + "learning_rate": 1.4046147907549713e-07, + "loss": 1.2211, + "step": 29743 + }, + { + "epoch": 0.9, + "learning_rate": 1.403808812900767e-07, + "loss": 1.1409, + "step": 29744 + }, + { + "epoch": 0.9, + "learning_rate": 1.4030030596709404e-07, + "loss": 1.0749, + "step": 29745 + }, + { + "epoch": 0.9, + "learning_rate": 1.402197531073163e-07, + "loss": 1.0999, + "step": 29746 + }, + { + "epoch": 0.9, + "learning_rate": 1.4013922271150947e-07, + "loss": 1.2283, + "step": 29747 + }, + { + "epoch": 0.9, + "learning_rate": 1.400587147804408e-07, + "loss": 1.1044, + "step": 29748 + }, + { + "epoch": 0.9, + "learning_rate": 1.3997822931487658e-07, + "loss": 1.1366, + "step": 29749 + }, + { + "epoch": 0.9, + "learning_rate": 1.3989776631558343e-07, + "loss": 1.0577, + "step": 29750 + }, + { + "epoch": 0.9, + "learning_rate": 1.398173257833263e-07, + "loss": 1.0866, + "step": 29751 + }, + { + "epoch": 0.9, + "learning_rate": 1.3973690771887176e-07, + "loss": 1.0716, + "step": 29752 + }, + { + "epoch": 0.9, + "learning_rate": 1.3965651212298508e-07, + "loss": 1.1721, + "step": 29753 + }, + { + "epoch": 0.9, + "learning_rate": 1.3957613899643146e-07, + "loss": 1.1748, + "step": 29754 + }, + { + "epoch": 0.9, + "learning_rate": 1.3949578833997668e-07, + "loss": 1.0991, + "step": 29755 + }, + { + "epoch": 0.9, + "learning_rate": 1.3941546015438484e-07, + "loss": 1.1357, + "step": 29756 + }, + { + "epoch": 0.9, + "learning_rate": 1.393351544404206e-07, + "loss": 1.1342, + "step": 29757 + }, + { + "epoch": 0.9, + "learning_rate": 1.3925487119884924e-07, + "loss": 1.0144, + "step": 29758 + }, + { + "epoch": 0.9, + "learning_rate": 1.3917461043043423e-07, + "loss": 1.0049, + "step": 29759 + }, + { + "epoch": 0.9, + "learning_rate": 1.3909437213594001e-07, + "loss": 0.9422, + "step": 29760 + }, + { + "epoch": 0.9, + "learning_rate": 1.3901415631613013e-07, + "loss": 1.1197, + "step": 29761 + }, + { + "epoch": 0.9, + "learning_rate": 1.389339629717684e-07, + "loss": 1.0957, + "step": 29762 + }, + { + "epoch": 0.9, + "learning_rate": 1.38853792103619e-07, + "loss": 1.0463, + "step": 29763 + }, + { + "epoch": 0.9, + "learning_rate": 1.3877364371244346e-07, + "loss": 1.1302, + "step": 29764 + }, + { + "epoch": 0.9, + "learning_rate": 1.3869351779900592e-07, + "loss": 0.9821, + "step": 29765 + }, + { + "epoch": 0.9, + "learning_rate": 1.3861341436406883e-07, + "loss": 1.101, + "step": 29766 + }, + { + "epoch": 0.9, + "learning_rate": 1.3853333340839464e-07, + "loss": 1.0559, + "step": 29767 + }, + { + "epoch": 0.9, + "learning_rate": 1.3845327493274608e-07, + "loss": 1.1405, + "step": 29768 + }, + { + "epoch": 0.9, + "learning_rate": 1.3837323893788473e-07, + "loss": 1.1525, + "step": 29769 + }, + { + "epoch": 0.9, + "learning_rate": 1.382932254245728e-07, + "loss": 1.1342, + "step": 29770 + }, + { + "epoch": 0.9, + "learning_rate": 1.3821323439357187e-07, + "loss": 1.2176, + "step": 29771 + }, + { + "epoch": 0.9, + "learning_rate": 1.3813326584564386e-07, + "loss": 1.2067, + "step": 29772 + }, + { + "epoch": 0.9, + "learning_rate": 1.380533197815495e-07, + "loss": 1.2432, + "step": 29773 + }, + { + "epoch": 0.9, + "learning_rate": 1.3797339620204965e-07, + "loss": 1.0829, + "step": 29774 + }, + { + "epoch": 0.9, + "learning_rate": 1.3789349510790556e-07, + "loss": 1.1205, + "step": 29775 + }, + { + "epoch": 0.9, + "learning_rate": 1.3781361649987806e-07, + "loss": 1.1352, + "step": 29776 + }, + { + "epoch": 0.9, + "learning_rate": 1.377337603787271e-07, + "loss": 1.0632, + "step": 29777 + }, + { + "epoch": 0.9, + "learning_rate": 1.3765392674521288e-07, + "loss": 1.0717, + "step": 29778 + }, + { + "epoch": 0.9, + "learning_rate": 1.3757411560009564e-07, + "loss": 1.1218, + "step": 29779 + }, + { + "epoch": 0.9, + "learning_rate": 1.3749432694413505e-07, + "loss": 1.1862, + "step": 29780 + }, + { + "epoch": 0.9, + "learning_rate": 1.374145607780908e-07, + "loss": 1.0632, + "step": 29781 + }, + { + "epoch": 0.9, + "learning_rate": 1.3733481710272194e-07, + "loss": 1.0757, + "step": 29782 + }, + { + "epoch": 0.9, + "learning_rate": 1.3725509591878767e-07, + "loss": 1.0571, + "step": 29783 + }, + { + "epoch": 0.9, + "learning_rate": 1.3717539722704675e-07, + "loss": 1.1166, + "step": 29784 + }, + { + "epoch": 0.9, + "learning_rate": 1.3709572102825836e-07, + "loss": 1.0111, + "step": 29785 + }, + { + "epoch": 0.9, + "learning_rate": 1.3701606732318046e-07, + "loss": 1.0779, + "step": 29786 + }, + { + "epoch": 0.9, + "learning_rate": 1.369364361125719e-07, + "loss": 1.0186, + "step": 29787 + }, + { + "epoch": 0.9, + "learning_rate": 1.3685682739719043e-07, + "loss": 1.0568, + "step": 29788 + }, + { + "epoch": 0.9, + "learning_rate": 1.3677724117779344e-07, + "loss": 1.0942, + "step": 29789 + }, + { + "epoch": 0.9, + "learning_rate": 1.36697677455139e-07, + "loss": 1.1774, + "step": 29790 + }, + { + "epoch": 0.9, + "learning_rate": 1.3661813622998454e-07, + "loss": 1.0518, + "step": 29791 + }, + { + "epoch": 0.9, + "learning_rate": 1.3653861750308721e-07, + "loss": 1.0717, + "step": 29792 + }, + { + "epoch": 0.9, + "learning_rate": 1.3645912127520421e-07, + "loss": 1.204, + "step": 29793 + }, + { + "epoch": 0.9, + "learning_rate": 1.3637964754709188e-07, + "loss": 1.0245, + "step": 29794 + }, + { + "epoch": 0.9, + "learning_rate": 1.363001963195068e-07, + "loss": 1.1149, + "step": 29795 + }, + { + "epoch": 0.9, + "learning_rate": 1.3622076759320535e-07, + "loss": 1.0565, + "step": 29796 + }, + { + "epoch": 0.9, + "learning_rate": 1.3614136136894385e-07, + "loss": 1.0038, + "step": 29797 + }, + { + "epoch": 0.9, + "learning_rate": 1.3606197764747864e-07, + "loss": 1.1523, + "step": 29798 + }, + { + "epoch": 0.9, + "learning_rate": 1.3598261642956439e-07, + "loss": 1.1594, + "step": 29799 + }, + { + "epoch": 0.9, + "learning_rate": 1.359032777159569e-07, + "loss": 1.0269, + "step": 29800 + }, + { + "epoch": 0.9, + "learning_rate": 1.3582396150741194e-07, + "loss": 1.0193, + "step": 29801 + }, + { + "epoch": 0.9, + "learning_rate": 1.357446678046845e-07, + "loss": 1.0195, + "step": 29802 + }, + { + "epoch": 0.9, + "learning_rate": 1.356653966085286e-07, + "loss": 0.9905, + "step": 29803 + }, + { + "epoch": 0.9, + "learning_rate": 1.355861479196996e-07, + "loss": 0.9924, + "step": 29804 + }, + { + "epoch": 0.9, + "learning_rate": 1.355069217389518e-07, + "loss": 1.1003, + "step": 29805 + }, + { + "epoch": 0.9, + "learning_rate": 1.3542771806703964e-07, + "loss": 1.1268, + "step": 29806 + }, + { + "epoch": 0.9, + "learning_rate": 1.3534853690471638e-07, + "loss": 1.1008, + "step": 29807 + }, + { + "epoch": 0.9, + "learning_rate": 1.3526937825273617e-07, + "loss": 1.0294, + "step": 29808 + }, + { + "epoch": 0.9, + "learning_rate": 1.3519024211185257e-07, + "loss": 1.0906, + "step": 29809 + }, + { + "epoch": 0.9, + "learning_rate": 1.3511112848281882e-07, + "loss": 1.1038, + "step": 29810 + }, + { + "epoch": 0.9, + "learning_rate": 1.350320373663888e-07, + "loss": 1.2338, + "step": 29811 + }, + { + "epoch": 0.9, + "learning_rate": 1.3495296876331443e-07, + "loss": 1.157, + "step": 29812 + }, + { + "epoch": 0.9, + "learning_rate": 1.348739226743484e-07, + "loss": 1.1795, + "step": 29813 + }, + { + "epoch": 0.9, + "learning_rate": 1.3479489910024374e-07, + "loss": 1.138, + "step": 29814 + }, + { + "epoch": 0.9, + "learning_rate": 1.347158980417526e-07, + "loss": 0.9577, + "step": 29815 + }, + { + "epoch": 0.9, + "learning_rate": 1.3463691949962692e-07, + "loss": 1.1354, + "step": 29816 + }, + { + "epoch": 0.9, + "learning_rate": 1.3455796347461858e-07, + "loss": 1.2133, + "step": 29817 + }, + { + "epoch": 0.9, + "learning_rate": 1.344790299674792e-07, + "loss": 1.0483, + "step": 29818 + }, + { + "epoch": 0.9, + "learning_rate": 1.3440011897896038e-07, + "loss": 1.1302, + "step": 29819 + }, + { + "epoch": 0.9, + "learning_rate": 1.3432123050981295e-07, + "loss": 1.0431, + "step": 29820 + }, + { + "epoch": 0.9, + "learning_rate": 1.3424236456078792e-07, + "loss": 1.0123, + "step": 29821 + }, + { + "epoch": 0.9, + "learning_rate": 1.3416352113263614e-07, + "loss": 1.1069, + "step": 29822 + }, + { + "epoch": 0.9, + "learning_rate": 1.3408470022610837e-07, + "loss": 1.1375, + "step": 29823 + }, + { + "epoch": 0.9, + "learning_rate": 1.3400590184195512e-07, + "loss": 1.0942, + "step": 29824 + }, + { + "epoch": 0.9, + "learning_rate": 1.3392712598092578e-07, + "loss": 1.1742, + "step": 29825 + }, + { + "epoch": 0.9, + "learning_rate": 1.338483726437706e-07, + "loss": 0.9976, + "step": 29826 + }, + { + "epoch": 0.9, + "learning_rate": 1.3376964183123952e-07, + "loss": 1.1611, + "step": 29827 + }, + { + "epoch": 0.9, + "learning_rate": 1.3369093354408198e-07, + "loss": 0.9938, + "step": 29828 + }, + { + "epoch": 0.9, + "learning_rate": 1.3361224778304677e-07, + "loss": 1.0641, + "step": 29829 + }, + { + "epoch": 0.9, + "learning_rate": 1.3353358454888332e-07, + "loss": 1.1257, + "step": 29830 + }, + { + "epoch": 0.9, + "learning_rate": 1.3345494384234047e-07, + "loss": 1.1158, + "step": 29831 + }, + { + "epoch": 0.9, + "learning_rate": 1.333763256641671e-07, + "loss": 1.0113, + "step": 29832 + }, + { + "epoch": 0.9, + "learning_rate": 1.3329773001511115e-07, + "loss": 1.0514, + "step": 29833 + }, + { + "epoch": 0.9, + "learning_rate": 1.3321915689592068e-07, + "loss": 1.1207, + "step": 29834 + }, + { + "epoch": 0.9, + "learning_rate": 1.33140606307344e-07, + "loss": 0.9637, + "step": 29835 + }, + { + "epoch": 0.9, + "learning_rate": 1.330620782501288e-07, + "loss": 1.0579, + "step": 29836 + }, + { + "epoch": 0.9, + "learning_rate": 1.329835727250231e-07, + "loss": 1.259, + "step": 29837 + }, + { + "epoch": 0.9, + "learning_rate": 1.3290508973277354e-07, + "loss": 1.0819, + "step": 29838 + }, + { + "epoch": 0.9, + "learning_rate": 1.3282662927412732e-07, + "loss": 1.1464, + "step": 29839 + }, + { + "epoch": 0.9, + "learning_rate": 1.327481913498316e-07, + "loss": 0.9977, + "step": 29840 + }, + { + "epoch": 0.9, + "learning_rate": 1.3266977596063297e-07, + "loss": 1.0244, + "step": 29841 + }, + { + "epoch": 0.9, + "learning_rate": 1.3259138310727808e-07, + "loss": 1.0036, + "step": 29842 + }, + { + "epoch": 0.9, + "learning_rate": 1.3251301279051278e-07, + "loss": 1.1151, + "step": 29843 + }, + { + "epoch": 0.9, + "learning_rate": 1.324346650110836e-07, + "loss": 1.0162, + "step": 29844 + }, + { + "epoch": 0.9, + "learning_rate": 1.3235633976973638e-07, + "loss": 1.1031, + "step": 29845 + }, + { + "epoch": 0.9, + "learning_rate": 1.322780370672161e-07, + "loss": 1.1884, + "step": 29846 + }, + { + "epoch": 0.9, + "learning_rate": 1.3219975690426878e-07, + "loss": 1.2017, + "step": 29847 + }, + { + "epoch": 0.9, + "learning_rate": 1.3212149928163915e-07, + "loss": 1.1107, + "step": 29848 + }, + { + "epoch": 0.9, + "learning_rate": 1.320432642000727e-07, + "loss": 1.1879, + "step": 29849 + }, + { + "epoch": 0.9, + "learning_rate": 1.319650516603141e-07, + "loss": 1.1085, + "step": 29850 + }, + { + "epoch": 0.9, + "learning_rate": 1.318868616631072e-07, + "loss": 1.0723, + "step": 29851 + }, + { + "epoch": 0.9, + "learning_rate": 1.3180869420919727e-07, + "loss": 1.0916, + "step": 29852 + }, + { + "epoch": 0.9, + "learning_rate": 1.317305492993276e-07, + "loss": 1.0322, + "step": 29853 + }, + { + "epoch": 0.9, + "learning_rate": 1.3165242693424312e-07, + "loss": 1.1782, + "step": 29854 + }, + { + "epoch": 0.9, + "learning_rate": 1.315743271146866e-07, + "loss": 1.1567, + "step": 29855 + }, + { + "epoch": 0.9, + "learning_rate": 1.3149624984140159e-07, + "loss": 1.2115, + "step": 29856 + }, + { + "epoch": 0.9, + "learning_rate": 1.3141819511513164e-07, + "loss": 1.1057, + "step": 29857 + }, + { + "epoch": 0.9, + "learning_rate": 1.3134016293662012e-07, + "loss": 1.0695, + "step": 29858 + }, + { + "epoch": 0.9, + "learning_rate": 1.3126215330660912e-07, + "loss": 1.0395, + "step": 29859 + }, + { + "epoch": 0.9, + "learning_rate": 1.3118416622584173e-07, + "loss": 1.0439, + "step": 29860 + }, + { + "epoch": 0.9, + "learning_rate": 1.3110620169506012e-07, + "loss": 1.0255, + "step": 29861 + }, + { + "epoch": 0.9, + "learning_rate": 1.3102825971500644e-07, + "loss": 1.0933, + "step": 29862 + }, + { + "epoch": 0.9, + "learning_rate": 1.3095034028642317e-07, + "loss": 1.0648, + "step": 29863 + }, + { + "epoch": 0.9, + "learning_rate": 1.308724434100514e-07, + "loss": 1.0623, + "step": 29864 + }, + { + "epoch": 0.9, + "learning_rate": 1.3079456908663302e-07, + "loss": 1.0715, + "step": 29865 + }, + { + "epoch": 0.9, + "learning_rate": 1.3071671731690912e-07, + "loss": 1.0457, + "step": 29866 + }, + { + "epoch": 0.9, + "learning_rate": 1.30638888101621e-07, + "loss": 1.1267, + "step": 29867 + }, + { + "epoch": 0.9, + "learning_rate": 1.305610814415098e-07, + "loss": 1.1457, + "step": 29868 + }, + { + "epoch": 0.9, + "learning_rate": 1.3048329733731574e-07, + "loss": 1.1349, + "step": 29869 + }, + { + "epoch": 0.9, + "learning_rate": 1.304055357897799e-07, + "loss": 1.1714, + "step": 29870 + }, + { + "epoch": 0.9, + "learning_rate": 1.3032779679964164e-07, + "loss": 1.0401, + "step": 29871 + }, + { + "epoch": 0.9, + "learning_rate": 1.3025008036764154e-07, + "loss": 1.0316, + "step": 29872 + }, + { + "epoch": 0.9, + "learning_rate": 1.3017238649451952e-07, + "loss": 1.076, + "step": 29873 + }, + { + "epoch": 0.9, + "learning_rate": 1.3009471518101502e-07, + "loss": 1.1362, + "step": 29874 + }, + { + "epoch": 0.9, + "learning_rate": 1.3001706642786715e-07, + "loss": 1.2112, + "step": 29875 + }, + { + "epoch": 0.9, + "learning_rate": 1.299394402358159e-07, + "loss": 1.0878, + "step": 29876 + }, + { + "epoch": 0.9, + "learning_rate": 1.2986183660559954e-07, + "loss": 1.0638, + "step": 29877 + }, + { + "epoch": 0.9, + "learning_rate": 1.2978425553795692e-07, + "loss": 1.0668, + "step": 29878 + }, + { + "epoch": 0.9, + "learning_rate": 1.2970669703362665e-07, + "loss": 1.0538, + "step": 29879 + }, + { + "epoch": 0.9, + "learning_rate": 1.2962916109334727e-07, + "loss": 1.109, + "step": 29880 + }, + { + "epoch": 0.9, + "learning_rate": 1.2955164771785628e-07, + "loss": 1.1649, + "step": 29881 + }, + { + "epoch": 0.9, + "learning_rate": 1.2947415690789223e-07, + "loss": 1.1088, + "step": 29882 + }, + { + "epoch": 0.9, + "learning_rate": 1.293966886641923e-07, + "loss": 1.0913, + "step": 29883 + }, + { + "epoch": 0.9, + "learning_rate": 1.2931924298749454e-07, + "loss": 1.1545, + "step": 29884 + }, + { + "epoch": 0.9, + "learning_rate": 1.2924181987853558e-07, + "loss": 1.1486, + "step": 29885 + }, + { + "epoch": 0.9, + "learning_rate": 1.2916441933805256e-07, + "loss": 1.1802, + "step": 29886 + }, + { + "epoch": 0.9, + "learning_rate": 1.2908704136678246e-07, + "loss": 1.1425, + "step": 29887 + }, + { + "epoch": 0.9, + "learning_rate": 1.2900968596546188e-07, + "loss": 1.0375, + "step": 29888 + }, + { + "epoch": 0.9, + "learning_rate": 1.289323531348277e-07, + "loss": 1.0742, + "step": 29889 + }, + { + "epoch": 0.9, + "learning_rate": 1.2885504287561495e-07, + "loss": 1.1726, + "step": 29890 + }, + { + "epoch": 0.9, + "learning_rate": 1.287777551885605e-07, + "loss": 1.1285, + "step": 29891 + }, + { + "epoch": 0.9, + "learning_rate": 1.287004900743996e-07, + "loss": 1.2369, + "step": 29892 + }, + { + "epoch": 0.9, + "learning_rate": 1.2862324753386835e-07, + "loss": 1.2358, + "step": 29893 + }, + { + "epoch": 0.9, + "learning_rate": 1.285460275677014e-07, + "loss": 1.1302, + "step": 29894 + }, + { + "epoch": 0.9, + "learning_rate": 1.2846883017663403e-07, + "loss": 1.0162, + "step": 29895 + }, + { + "epoch": 0.9, + "learning_rate": 1.2839165536140148e-07, + "loss": 1.1655, + "step": 29896 + }, + { + "epoch": 0.9, + "learning_rate": 1.2831450312273785e-07, + "loss": 1.0595, + "step": 29897 + }, + { + "epoch": 0.9, + "learning_rate": 1.2823737346137815e-07, + "loss": 1.1299, + "step": 29898 + }, + { + "epoch": 0.9, + "learning_rate": 1.2816026637805623e-07, + "loss": 1.0855, + "step": 29899 + }, + { + "epoch": 0.9, + "learning_rate": 1.280831818735062e-07, + "loss": 1.0115, + "step": 29900 + }, + { + "epoch": 0.9, + "learning_rate": 1.2800611994846196e-07, + "loss": 1.0547, + "step": 29901 + }, + { + "epoch": 0.9, + "learning_rate": 1.279290806036576e-07, + "loss": 0.9868, + "step": 29902 + }, + { + "epoch": 0.9, + "learning_rate": 1.2785206383982535e-07, + "loss": 0.9448, + "step": 29903 + }, + { + "epoch": 0.9, + "learning_rate": 1.277750696576993e-07, + "loss": 1.0219, + "step": 29904 + }, + { + "epoch": 0.9, + "learning_rate": 1.276980980580117e-07, + "loss": 1.0599, + "step": 29905 + }, + { + "epoch": 0.9, + "learning_rate": 1.2762114904149637e-07, + "loss": 1.0958, + "step": 29906 + }, + { + "epoch": 0.9, + "learning_rate": 1.2754422260888466e-07, + "loss": 1.1199, + "step": 29907 + }, + { + "epoch": 0.9, + "learning_rate": 1.2746731876090907e-07, + "loss": 1.1342, + "step": 29908 + }, + { + "epoch": 0.9, + "learning_rate": 1.273904374983023e-07, + "loss": 1.2, + "step": 29909 + }, + { + "epoch": 0.9, + "learning_rate": 1.2731357882179608e-07, + "loss": 1.0284, + "step": 29910 + }, + { + "epoch": 0.9, + "learning_rate": 1.2723674273212166e-07, + "loss": 1.1088, + "step": 29911 + }, + { + "epoch": 0.9, + "learning_rate": 1.2715992923001046e-07, + "loss": 1.1134, + "step": 29912 + }, + { + "epoch": 0.9, + "learning_rate": 1.2708313831619412e-07, + "loss": 1.1433, + "step": 29913 + }, + { + "epoch": 0.9, + "learning_rate": 1.2700636999140342e-07, + "loss": 1.1089, + "step": 29914 + }, + { + "epoch": 0.9, + "learning_rate": 1.2692962425636945e-07, + "loss": 1.0308, + "step": 29915 + }, + { + "epoch": 0.9, + "learning_rate": 1.2685290111182218e-07, + "loss": 1.042, + "step": 29916 + }, + { + "epoch": 0.9, + "learning_rate": 1.2677620055849272e-07, + "loss": 1.1526, + "step": 29917 + }, + { + "epoch": 0.9, + "learning_rate": 1.2669952259711043e-07, + "loss": 1.0898, + "step": 29918 + }, + { + "epoch": 0.9, + "learning_rate": 1.2662286722840617e-07, + "loss": 1.0491, + "step": 29919 + }, + { + "epoch": 0.9, + "learning_rate": 1.2654623445310876e-07, + "loss": 1.0739, + "step": 29920 + }, + { + "epoch": 0.9, + "learning_rate": 1.264696242719482e-07, + "loss": 1.0835, + "step": 29921 + }, + { + "epoch": 0.9, + "learning_rate": 1.2639303668565362e-07, + "loss": 1.0686, + "step": 29922 + }, + { + "epoch": 0.9, + "learning_rate": 1.2631647169495416e-07, + "loss": 1.0155, + "step": 29923 + }, + { + "epoch": 0.9, + "learning_rate": 1.2623992930057865e-07, + "loss": 1.0833, + "step": 29924 + }, + { + "epoch": 0.9, + "learning_rate": 1.2616340950325572e-07, + "loss": 1.2207, + "step": 29925 + }, + { + "epoch": 0.9, + "learning_rate": 1.2608691230371394e-07, + "loss": 1.0942, + "step": 29926 + }, + { + "epoch": 0.9, + "learning_rate": 1.2601043770268162e-07, + "loss": 1.0275, + "step": 29927 + }, + { + "epoch": 0.9, + "learning_rate": 1.2593398570088678e-07, + "loss": 1.031, + "step": 29928 + }, + { + "epoch": 0.9, + "learning_rate": 1.258575562990566e-07, + "loss": 1.1374, + "step": 29929 + }, + { + "epoch": 0.9, + "learning_rate": 1.2578114949791886e-07, + "loss": 1.0054, + "step": 29930 + }, + { + "epoch": 0.9, + "learning_rate": 1.2570476529820157e-07, + "loss": 1.1519, + "step": 29931 + }, + { + "epoch": 0.9, + "learning_rate": 1.256284037006314e-07, + "loss": 1.0093, + "step": 29932 + }, + { + "epoch": 0.9, + "learning_rate": 1.2555206470593524e-07, + "loss": 0.9506, + "step": 29933 + }, + { + "epoch": 0.9, + "learning_rate": 1.2547574831483944e-07, + "loss": 1.0383, + "step": 29934 + }, + { + "epoch": 0.9, + "learning_rate": 1.2539945452807123e-07, + "loss": 1.0469, + "step": 29935 + }, + { + "epoch": 0.9, + "learning_rate": 1.2532318334635695e-07, + "loss": 1.1785, + "step": 29936 + }, + { + "epoch": 0.9, + "learning_rate": 1.252469347704216e-07, + "loss": 1.2156, + "step": 29937 + }, + { + "epoch": 0.9, + "learning_rate": 1.2517070880099208e-07, + "loss": 1.0858, + "step": 29938 + }, + { + "epoch": 0.9, + "learning_rate": 1.2509450543879338e-07, + "loss": 1.0344, + "step": 29939 + }, + { + "epoch": 0.9, + "learning_rate": 1.2501832468455154e-07, + "loss": 1.0657, + "step": 29940 + }, + { + "epoch": 0.9, + "learning_rate": 1.2494216653899134e-07, + "loss": 1.1002, + "step": 29941 + }, + { + "epoch": 0.9, + "learning_rate": 1.2486603100283767e-07, + "loss": 1.117, + "step": 29942 + }, + { + "epoch": 0.9, + "learning_rate": 1.2478991807681555e-07, + "loss": 1.1832, + "step": 29943 + }, + { + "epoch": 0.9, + "learning_rate": 1.2471382776164943e-07, + "loss": 1.0341, + "step": 29944 + }, + { + "epoch": 0.9, + "learning_rate": 1.2463776005806422e-07, + "loss": 1.0775, + "step": 29945 + }, + { + "epoch": 0.9, + "learning_rate": 1.24561714966783e-07, + "loss": 1.0898, + "step": 29946 + }, + { + "epoch": 0.9, + "learning_rate": 1.2448569248853016e-07, + "loss": 1.1509, + "step": 29947 + }, + { + "epoch": 0.9, + "learning_rate": 1.244096926240296e-07, + "loss": 1.0631, + "step": 29948 + }, + { + "epoch": 0.9, + "learning_rate": 1.243337153740043e-07, + "loss": 1.2437, + "step": 29949 + }, + { + "epoch": 0.9, + "learning_rate": 1.2425776073917818e-07, + "loss": 1.1146, + "step": 29950 + }, + { + "epoch": 0.9, + "learning_rate": 1.2418182872027397e-07, + "loss": 1.0345, + "step": 29951 + }, + { + "epoch": 0.9, + "learning_rate": 1.241059193180144e-07, + "loss": 1.1341, + "step": 29952 + }, + { + "epoch": 0.9, + "learning_rate": 1.2403003253312258e-07, + "loss": 1.0469, + "step": 29953 + }, + { + "epoch": 0.9, + "learning_rate": 1.2395416836632007e-07, + "loss": 1.1314, + "step": 29954 + }, + { + "epoch": 0.9, + "learning_rate": 1.2387832681832968e-07, + "loss": 1.1118, + "step": 29955 + }, + { + "epoch": 0.9, + "learning_rate": 1.238025078898733e-07, + "loss": 1.1094, + "step": 29956 + }, + { + "epoch": 0.9, + "learning_rate": 1.237267115816726e-07, + "loss": 1.1192, + "step": 29957 + }, + { + "epoch": 0.9, + "learning_rate": 1.236509378944495e-07, + "loss": 1.1899, + "step": 29958 + }, + { + "epoch": 0.9, + "learning_rate": 1.235751868289245e-07, + "loss": 1.0851, + "step": 29959 + }, + { + "epoch": 0.9, + "learning_rate": 1.2349945838581928e-07, + "loss": 1.0416, + "step": 29960 + }, + { + "epoch": 0.9, + "learning_rate": 1.2342375256585465e-07, + "loss": 1.0745, + "step": 29961 + }, + { + "epoch": 0.9, + "learning_rate": 1.2334806936975168e-07, + "loss": 1.0782, + "step": 29962 + }, + { + "epoch": 0.9, + "learning_rate": 1.232724087982301e-07, + "loss": 1.1011, + "step": 29963 + }, + { + "epoch": 0.9, + "learning_rate": 1.231967708520107e-07, + "loss": 0.9847, + "step": 29964 + }, + { + "epoch": 0.9, + "learning_rate": 1.2312115553181293e-07, + "loss": 1.0198, + "step": 29965 + }, + { + "epoch": 0.9, + "learning_rate": 1.2304556283835727e-07, + "loss": 1.0764, + "step": 29966 + }, + { + "epoch": 0.9, + "learning_rate": 1.229699927723635e-07, + "loss": 1.0841, + "step": 29967 + }, + { + "epoch": 0.9, + "learning_rate": 1.2289444533455013e-07, + "loss": 1.1717, + "step": 29968 + }, + { + "epoch": 0.9, + "learning_rate": 1.2281892052563666e-07, + "loss": 1.1828, + "step": 29969 + }, + { + "epoch": 0.9, + "learning_rate": 1.2274341834634246e-07, + "loss": 1.1138, + "step": 29970 + }, + { + "epoch": 0.9, + "learning_rate": 1.2266793879738613e-07, + "loss": 1.0284, + "step": 29971 + }, + { + "epoch": 0.9, + "learning_rate": 1.2259248187948576e-07, + "loss": 1.1899, + "step": 29972 + }, + { + "epoch": 0.9, + "learning_rate": 1.2251704759335986e-07, + "loss": 1.0279, + "step": 29973 + }, + { + "epoch": 0.9, + "learning_rate": 1.224416359397268e-07, + "loss": 1.1339, + "step": 29974 + }, + { + "epoch": 0.9, + "learning_rate": 1.223662469193046e-07, + "loss": 1.1258, + "step": 29975 + }, + { + "epoch": 0.9, + "learning_rate": 1.2229088053281017e-07, + "loss": 1.1218, + "step": 29976 + }, + { + "epoch": 0.9, + "learning_rate": 1.2221553678096133e-07, + "loss": 1.1778, + "step": 29977 + }, + { + "epoch": 0.9, + "learning_rate": 1.2214021566447577e-07, + "loss": 1.0186, + "step": 29978 + }, + { + "epoch": 0.9, + "learning_rate": 1.2206491718406989e-07, + "loss": 1.0687, + "step": 29979 + }, + { + "epoch": 0.9, + "learning_rate": 1.219896413404606e-07, + "loss": 1.0727, + "step": 29980 + }, + { + "epoch": 0.9, + "learning_rate": 1.2191438813436486e-07, + "loss": 1.1129, + "step": 29981 + }, + { + "epoch": 0.9, + "learning_rate": 1.2183915756649873e-07, + "loss": 0.9695, + "step": 29982 + }, + { + "epoch": 0.9, + "learning_rate": 1.217639496375786e-07, + "loss": 1.1434, + "step": 29983 + }, + { + "epoch": 0.9, + "learning_rate": 1.2168876434832056e-07, + "loss": 0.9997, + "step": 29984 + }, + { + "epoch": 0.9, + "learning_rate": 1.2161360169943958e-07, + "loss": 1.0587, + "step": 29985 + }, + { + "epoch": 0.9, + "learning_rate": 1.2153846169165178e-07, + "loss": 1.0972, + "step": 29986 + }, + { + "epoch": 0.9, + "learning_rate": 1.2146334432567214e-07, + "loss": 1.1393, + "step": 29987 + }, + { + "epoch": 0.9, + "learning_rate": 1.2138824960221645e-07, + "loss": 1.132, + "step": 29988 + }, + { + "epoch": 0.9, + "learning_rate": 1.2131317752199861e-07, + "loss": 1.1367, + "step": 29989 + }, + { + "epoch": 0.9, + "learning_rate": 1.2123812808573387e-07, + "loss": 1.0844, + "step": 29990 + }, + { + "epoch": 0.9, + "learning_rate": 1.2116310129413638e-07, + "loss": 1.1554, + "step": 29991 + }, + { + "epoch": 0.9, + "learning_rate": 1.2108809714792087e-07, + "loss": 1.2034, + "step": 29992 + }, + { + "epoch": 0.9, + "learning_rate": 1.2101311564780034e-07, + "loss": 1.3423, + "step": 29993 + }, + { + "epoch": 0.9, + "learning_rate": 1.209381567944895e-07, + "loss": 1.2115, + "step": 29994 + }, + { + "epoch": 0.9, + "learning_rate": 1.2086322058870142e-07, + "loss": 1.1189, + "step": 29995 + }, + { + "epoch": 0.9, + "learning_rate": 1.2078830703114967e-07, + "loss": 1.0844, + "step": 29996 + }, + { + "epoch": 0.9, + "learning_rate": 1.2071341612254788e-07, + "loss": 1.0754, + "step": 29997 + }, + { + "epoch": 0.9, + "learning_rate": 1.2063854786360795e-07, + "loss": 1.0289, + "step": 29998 + }, + { + "epoch": 0.9, + "learning_rate": 1.205637022550432e-07, + "loss": 1.1599, + "step": 29999 + }, + { + "epoch": 0.9, + "learning_rate": 1.2048887929756614e-07, + "loss": 1.1059, + "step": 30000 + }, + { + "epoch": 0.9, + "learning_rate": 1.2041407899188895e-07, + "loss": 1.1181, + "step": 30001 + }, + { + "epoch": 0.9, + "learning_rate": 1.2033930133872356e-07, + "loss": 1.0063, + "step": 30002 + }, + { + "epoch": 0.9, + "learning_rate": 1.2026454633878194e-07, + "loss": 1.0369, + "step": 30003 + }, + { + "epoch": 0.9, + "learning_rate": 1.201898139927757e-07, + "loss": 1.152, + "step": 30004 + }, + { + "epoch": 0.9, + "learning_rate": 1.2011510430141622e-07, + "loss": 1.1018, + "step": 30005 + }, + { + "epoch": 0.9, + "learning_rate": 1.2004041726541487e-07, + "loss": 1.1316, + "step": 30006 + }, + { + "epoch": 0.9, + "learning_rate": 1.199657528854825e-07, + "loss": 1.0516, + "step": 30007 + }, + { + "epoch": 0.9, + "learning_rate": 1.1989111116232966e-07, + "loss": 1.0403, + "step": 30008 + }, + { + "epoch": 0.9, + "learning_rate": 1.198164920966674e-07, + "loss": 1.2139, + "step": 30009 + }, + { + "epoch": 0.9, + "learning_rate": 1.1974189568920602e-07, + "loss": 1.0143, + "step": 30010 + }, + { + "epoch": 0.9, + "learning_rate": 1.1966732194065522e-07, + "loss": 1.1433, + "step": 30011 + }, + { + "epoch": 0.9, + "learning_rate": 1.19592770851725e-07, + "loss": 1.1647, + "step": 30012 + }, + { + "epoch": 0.9, + "learning_rate": 1.195182424231253e-07, + "loss": 1.0352, + "step": 30013 + }, + { + "epoch": 0.9, + "learning_rate": 1.1944373665556564e-07, + "loss": 1.0272, + "step": 30014 + }, + { + "epoch": 0.9, + "learning_rate": 1.193692535497548e-07, + "loss": 1.0472, + "step": 30015 + }, + { + "epoch": 0.9, + "learning_rate": 1.1929479310640203e-07, + "loss": 1.1987, + "step": 30016 + }, + { + "epoch": 0.9, + "learning_rate": 1.192203553262164e-07, + "loss": 1.1168, + "step": 30017 + }, + { + "epoch": 0.9, + "learning_rate": 1.1914594020990655e-07, + "loss": 1.2404, + "step": 30018 + }, + { + "epoch": 0.9, + "learning_rate": 1.1907154775818026e-07, + "loss": 1.2094, + "step": 30019 + }, + { + "epoch": 0.9, + "learning_rate": 1.1899717797174637e-07, + "loss": 1.0231, + "step": 30020 + }, + { + "epoch": 0.9, + "learning_rate": 1.189228308513124e-07, + "loss": 1.1437, + "step": 30021 + }, + { + "epoch": 0.9, + "learning_rate": 1.1884850639758667e-07, + "loss": 1.0867, + "step": 30022 + }, + { + "epoch": 0.9, + "learning_rate": 1.1877420461127636e-07, + "loss": 1.0322, + "step": 30023 + }, + { + "epoch": 0.9, + "learning_rate": 1.1869992549308845e-07, + "loss": 1.144, + "step": 30024 + }, + { + "epoch": 0.9, + "learning_rate": 1.1862566904373068e-07, + "loss": 0.9772, + "step": 30025 + }, + { + "epoch": 0.9, + "learning_rate": 1.1855143526390944e-07, + "loss": 1.1503, + "step": 30026 + }, + { + "epoch": 0.9, + "learning_rate": 1.1847722415433193e-07, + "loss": 1.1447, + "step": 30027 + }, + { + "epoch": 0.9, + "learning_rate": 1.18403035715704e-07, + "loss": 1.0629, + "step": 30028 + }, + { + "epoch": 0.9, + "learning_rate": 1.18328869948732e-07, + "loss": 1.1633, + "step": 30029 + }, + { + "epoch": 0.9, + "learning_rate": 1.1825472685412204e-07, + "loss": 1.0452, + "step": 30030 + }, + { + "epoch": 0.9, + "learning_rate": 1.1818060643258022e-07, + "loss": 1.0978, + "step": 30031 + }, + { + "epoch": 0.9, + "learning_rate": 1.1810650868481183e-07, + "loss": 1.0995, + "step": 30032 + }, + { + "epoch": 0.9, + "learning_rate": 1.1803243361152239e-07, + "loss": 1.1071, + "step": 30033 + }, + { + "epoch": 0.9, + "learning_rate": 1.1795838121341691e-07, + "loss": 1.1386, + "step": 30034 + }, + { + "epoch": 0.9, + "learning_rate": 1.1788435149120064e-07, + "loss": 1.0488, + "step": 30035 + }, + { + "epoch": 0.9, + "learning_rate": 1.1781034444557776e-07, + "loss": 1.0903, + "step": 30036 + }, + { + "epoch": 0.9, + "learning_rate": 1.1773636007725325e-07, + "loss": 1.0414, + "step": 30037 + }, + { + "epoch": 0.9, + "learning_rate": 1.1766239838693128e-07, + "loss": 1.0726, + "step": 30038 + }, + { + "epoch": 0.9, + "learning_rate": 1.1758845937531571e-07, + "loss": 1.1637, + "step": 30039 + }, + { + "epoch": 0.9, + "learning_rate": 1.17514543043111e-07, + "loss": 1.1257, + "step": 30040 + }, + { + "epoch": 0.9, + "learning_rate": 1.1744064939102018e-07, + "loss": 1.1379, + "step": 30041 + }, + { + "epoch": 0.91, + "learning_rate": 1.1736677841974687e-07, + "loss": 1.2188, + "step": 30042 + }, + { + "epoch": 0.91, + "learning_rate": 1.172929301299941e-07, + "loss": 1.1658, + "step": 30043 + }, + { + "epoch": 0.91, + "learning_rate": 1.1721910452246577e-07, + "loss": 1.1807, + "step": 30044 + }, + { + "epoch": 0.91, + "learning_rate": 1.1714530159786325e-07, + "loss": 1.195, + "step": 30045 + }, + { + "epoch": 0.91, + "learning_rate": 1.1707152135689015e-07, + "loss": 1.1077, + "step": 30046 + }, + { + "epoch": 0.91, + "learning_rate": 1.169977638002484e-07, + "loss": 1.0818, + "step": 30047 + }, + { + "epoch": 0.91, + "learning_rate": 1.1692402892864025e-07, + "loss": 1.1751, + "step": 30048 + }, + { + "epoch": 0.91, + "learning_rate": 1.1685031674276786e-07, + "loss": 1.1019, + "step": 30049 + }, + { + "epoch": 0.91, + "learning_rate": 1.1677662724333238e-07, + "loss": 1.1711, + "step": 30050 + }, + { + "epoch": 0.91, + "learning_rate": 1.1670296043103574e-07, + "loss": 1.1219, + "step": 30051 + }, + { + "epoch": 0.91, + "learning_rate": 1.1662931630657904e-07, + "loss": 1.0776, + "step": 30052 + }, + { + "epoch": 0.91, + "learning_rate": 1.1655569487066365e-07, + "loss": 1.1326, + "step": 30053 + }, + { + "epoch": 0.91, + "learning_rate": 1.1648209612398986e-07, + "loss": 1.1784, + "step": 30054 + }, + { + "epoch": 0.91, + "learning_rate": 1.164085200672585e-07, + "loss": 1.1161, + "step": 30055 + }, + { + "epoch": 0.91, + "learning_rate": 1.1633496670117011e-07, + "loss": 1.0923, + "step": 30056 + }, + { + "epoch": 0.91, + "learning_rate": 1.1626143602642526e-07, + "loss": 1.0942, + "step": 30057 + }, + { + "epoch": 0.91, + "learning_rate": 1.1618792804372308e-07, + "loss": 1.2051, + "step": 30058 + }, + { + "epoch": 0.91, + "learning_rate": 1.161144427537636e-07, + "loss": 1.007, + "step": 30059 + }, + { + "epoch": 0.91, + "learning_rate": 1.1604098015724653e-07, + "loss": 1.0847, + "step": 30060 + }, + { + "epoch": 0.91, + "learning_rate": 1.1596754025487128e-07, + "loss": 1.1364, + "step": 30061 + }, + { + "epoch": 0.91, + "learning_rate": 1.1589412304733705e-07, + "loss": 1.1619, + "step": 30062 + }, + { + "epoch": 0.91, + "learning_rate": 1.1582072853534216e-07, + "loss": 1.1634, + "step": 30063 + }, + { + "epoch": 0.91, + "learning_rate": 1.1574735671958603e-07, + "loss": 1.0276, + "step": 30064 + }, + { + "epoch": 0.91, + "learning_rate": 1.1567400760076648e-07, + "loss": 1.0551, + "step": 30065 + }, + { + "epoch": 0.91, + "learning_rate": 1.1560068117958234e-07, + "loss": 1.1418, + "step": 30066 + }, + { + "epoch": 0.91, + "learning_rate": 1.1552737745673115e-07, + "loss": 1.0754, + "step": 30067 + }, + { + "epoch": 0.91, + "learning_rate": 1.1545409643291094e-07, + "loss": 1.2084, + "step": 30068 + }, + { + "epoch": 0.91, + "learning_rate": 1.153808381088195e-07, + "loss": 1.0921, + "step": 30069 + }, + { + "epoch": 0.91, + "learning_rate": 1.1530760248515404e-07, + "loss": 1.0364, + "step": 30070 + }, + { + "epoch": 0.91, + "learning_rate": 1.1523438956261152e-07, + "loss": 1.1009, + "step": 30071 + }, + { + "epoch": 0.91, + "learning_rate": 1.1516119934188885e-07, + "loss": 1.1877, + "step": 30072 + }, + { + "epoch": 0.91, + "learning_rate": 1.1508803182368328e-07, + "loss": 1.1906, + "step": 30073 + }, + { + "epoch": 0.91, + "learning_rate": 1.150148870086909e-07, + "loss": 0.9792, + "step": 30074 + }, + { + "epoch": 0.91, + "learning_rate": 1.1494176489760839e-07, + "loss": 1.1789, + "step": 30075 + }, + { + "epoch": 0.91, + "learning_rate": 1.148686654911313e-07, + "loss": 1.0574, + "step": 30076 + }, + { + "epoch": 0.91, + "learning_rate": 1.1479558878995601e-07, + "loss": 1.0323, + "step": 30077 + }, + { + "epoch": 0.91, + "learning_rate": 1.147225347947778e-07, + "loss": 1.1774, + "step": 30078 + }, + { + "epoch": 0.91, + "learning_rate": 1.146495035062925e-07, + "loss": 1.0082, + "step": 30079 + }, + { + "epoch": 0.91, + "learning_rate": 1.1457649492519484e-07, + "loss": 1.1264, + "step": 30080 + }, + { + "epoch": 0.91, + "learning_rate": 1.1450350905218011e-07, + "loss": 1.1104, + "step": 30081 + }, + { + "epoch": 0.91, + "learning_rate": 1.14430545887943e-07, + "loss": 1.0831, + "step": 30082 + }, + { + "epoch": 0.91, + "learning_rate": 1.1435760543317881e-07, + "loss": 1.1395, + "step": 30083 + }, + { + "epoch": 0.91, + "learning_rate": 1.1428468768858058e-07, + "loss": 1.0284, + "step": 30084 + }, + { + "epoch": 0.91, + "learning_rate": 1.1421179265484333e-07, + "loss": 1.1282, + "step": 30085 + }, + { + "epoch": 0.91, + "learning_rate": 1.1413892033266066e-07, + "loss": 1.1411, + "step": 30086 + }, + { + "epoch": 0.91, + "learning_rate": 1.1406607072272619e-07, + "loss": 1.212, + "step": 30087 + }, + { + "epoch": 0.91, + "learning_rate": 1.1399324382573407e-07, + "loss": 0.9887, + "step": 30088 + }, + { + "epoch": 0.91, + "learning_rate": 1.1392043964237681e-07, + "loss": 1.1452, + "step": 30089 + }, + { + "epoch": 0.91, + "learning_rate": 1.1384765817334802e-07, + "loss": 1.1702, + "step": 30090 + }, + { + "epoch": 0.91, + "learning_rate": 1.1377489941933994e-07, + "loss": 1.1761, + "step": 30091 + }, + { + "epoch": 0.91, + "learning_rate": 1.1370216338104617e-07, + "loss": 1.1677, + "step": 30092 + }, + { + "epoch": 0.91, + "learning_rate": 1.1362945005915838e-07, + "loss": 1.1571, + "step": 30093 + }, + { + "epoch": 0.91, + "learning_rate": 1.135567594543685e-07, + "loss": 1.1685, + "step": 30094 + }, + { + "epoch": 0.91, + "learning_rate": 1.1348409156736906e-07, + "loss": 1.0127, + "step": 30095 + }, + { + "epoch": 0.91, + "learning_rate": 1.1341144639885226e-07, + "loss": 0.9685, + "step": 30096 + }, + { + "epoch": 0.91, + "learning_rate": 1.1333882394950841e-07, + "loss": 1.0914, + "step": 30097 + }, + { + "epoch": 0.91, + "learning_rate": 1.132662242200297e-07, + "loss": 1.1302, + "step": 30098 + }, + { + "epoch": 0.91, + "learning_rate": 1.1319364721110698e-07, + "loss": 1.0237, + "step": 30099 + }, + { + "epoch": 0.91, + "learning_rate": 1.1312109292343138e-07, + "loss": 1.1332, + "step": 30100 + }, + { + "epoch": 0.91, + "learning_rate": 1.1304856135769343e-07, + "loss": 1.072, + "step": 30101 + }, + { + "epoch": 0.91, + "learning_rate": 1.1297605251458343e-07, + "loss": 1.0743, + "step": 30102 + }, + { + "epoch": 0.91, + "learning_rate": 1.1290356639479166e-07, + "loss": 1.11, + "step": 30103 + }, + { + "epoch": 0.91, + "learning_rate": 1.128311029990084e-07, + "loss": 1.112, + "step": 30104 + }, + { + "epoch": 0.91, + "learning_rate": 1.1275866232792365e-07, + "loss": 1.058, + "step": 30105 + }, + { + "epoch": 0.91, + "learning_rate": 1.1268624438222631e-07, + "loss": 1.0443, + "step": 30106 + }, + { + "epoch": 0.91, + "learning_rate": 1.1261384916260637e-07, + "loss": 1.1503, + "step": 30107 + }, + { + "epoch": 0.91, + "learning_rate": 1.1254147666975245e-07, + "loss": 1.0897, + "step": 30108 + }, + { + "epoch": 0.91, + "learning_rate": 1.124691269043543e-07, + "loss": 1.1759, + "step": 30109 + }, + { + "epoch": 0.91, + "learning_rate": 1.1239679986709995e-07, + "loss": 1.1547, + "step": 30110 + }, + { + "epoch": 0.91, + "learning_rate": 1.1232449555867803e-07, + "loss": 0.9899, + "step": 30111 + }, + { + "epoch": 0.91, + "learning_rate": 1.1225221397977714e-07, + "loss": 1.1426, + "step": 30112 + }, + { + "epoch": 0.91, + "learning_rate": 1.121799551310851e-07, + "loss": 1.0906, + "step": 30113 + }, + { + "epoch": 0.91, + "learning_rate": 1.1210771901328993e-07, + "loss": 1.1703, + "step": 30114 + }, + { + "epoch": 0.91, + "learning_rate": 1.1203550562707915e-07, + "loss": 1.1172, + "step": 30115 + }, + { + "epoch": 0.91, + "learning_rate": 1.1196331497314028e-07, + "loss": 1.1083, + "step": 30116 + }, + { + "epoch": 0.91, + "learning_rate": 1.1189114705216081e-07, + "loss": 1.1182, + "step": 30117 + }, + { + "epoch": 0.91, + "learning_rate": 1.1181900186482713e-07, + "loss": 1.215, + "step": 30118 + }, + { + "epoch": 0.91, + "learning_rate": 1.1174687941182649e-07, + "loss": 0.9201, + "step": 30119 + }, + { + "epoch": 0.91, + "learning_rate": 1.1167477969384527e-07, + "loss": 1.0752, + "step": 30120 + }, + { + "epoch": 0.91, + "learning_rate": 1.1160270271156987e-07, + "loss": 1.1213, + "step": 30121 + }, + { + "epoch": 0.91, + "learning_rate": 1.1153064846568667e-07, + "loss": 1.0459, + "step": 30122 + }, + { + "epoch": 0.91, + "learning_rate": 1.1145861695688126e-07, + "loss": 1.0925, + "step": 30123 + }, + { + "epoch": 0.91, + "learning_rate": 1.1138660818583919e-07, + "loss": 1.0859, + "step": 30124 + }, + { + "epoch": 0.91, + "learning_rate": 1.1131462215324657e-07, + "loss": 1.1299, + "step": 30125 + }, + { + "epoch": 0.91, + "learning_rate": 1.1124265885978813e-07, + "loss": 1.0651, + "step": 30126 + }, + { + "epoch": 0.91, + "learning_rate": 1.1117071830614945e-07, + "loss": 1.0829, + "step": 30127 + }, + { + "epoch": 0.91, + "learning_rate": 1.1109880049301469e-07, + "loss": 0.9779, + "step": 30128 + }, + { + "epoch": 0.91, + "learning_rate": 1.1102690542106887e-07, + "loss": 1.0634, + "step": 30129 + }, + { + "epoch": 0.91, + "learning_rate": 1.1095503309099614e-07, + "loss": 1.1985, + "step": 30130 + }, + { + "epoch": 0.91, + "learning_rate": 1.1088318350348126e-07, + "loss": 1.0929, + "step": 30131 + }, + { + "epoch": 0.91, + "learning_rate": 1.1081135665920783e-07, + "loss": 1.1545, + "step": 30132 + }, + { + "epoch": 0.91, + "learning_rate": 1.1073955255885921e-07, + "loss": 1.075, + "step": 30133 + }, + { + "epoch": 0.91, + "learning_rate": 1.1066777120311956e-07, + "loss": 1.1537, + "step": 30134 + }, + { + "epoch": 0.91, + "learning_rate": 1.105960125926725e-07, + "loss": 1.0349, + "step": 30135 + }, + { + "epoch": 0.91, + "learning_rate": 1.1052427672819998e-07, + "loss": 1.1884, + "step": 30136 + }, + { + "epoch": 0.91, + "learning_rate": 1.1045256361038565e-07, + "loss": 0.9839, + "step": 30137 + }, + { + "epoch": 0.91, + "learning_rate": 1.1038087323991197e-07, + "loss": 1.0698, + "step": 30138 + }, + { + "epoch": 0.91, + "learning_rate": 1.1030920561746178e-07, + "loss": 1.0944, + "step": 30139 + }, + { + "epoch": 0.91, + "learning_rate": 1.1023756074371699e-07, + "loss": 1.0729, + "step": 30140 + }, + { + "epoch": 0.91, + "learning_rate": 1.1016593861935959e-07, + "loss": 1.136, + "step": 30141 + }, + { + "epoch": 0.91, + "learning_rate": 1.1009433924507152e-07, + "loss": 1.0079, + "step": 30142 + }, + { + "epoch": 0.91, + "learning_rate": 1.1002276262153416e-07, + "loss": 1.0829, + "step": 30143 + }, + { + "epoch": 0.91, + "learning_rate": 1.0995120874942893e-07, + "loss": 1.0803, + "step": 30144 + }, + { + "epoch": 0.91, + "learning_rate": 1.0987967762943725e-07, + "loss": 1.0894, + "step": 30145 + }, + { + "epoch": 0.91, + "learning_rate": 1.0980816926223992e-07, + "loss": 1.106, + "step": 30146 + }, + { + "epoch": 0.91, + "learning_rate": 1.097366836485178e-07, + "loss": 1.0002, + "step": 30147 + }, + { + "epoch": 0.91, + "learning_rate": 1.0966522078895147e-07, + "loss": 1.2068, + "step": 30148 + }, + { + "epoch": 0.91, + "learning_rate": 1.0959378068422066e-07, + "loss": 1.1108, + "step": 30149 + }, + { + "epoch": 0.91, + "learning_rate": 1.0952236333500594e-07, + "loss": 1.0667, + "step": 30150 + }, + { + "epoch": 0.91, + "learning_rate": 1.0945096874198674e-07, + "loss": 1.105, + "step": 30151 + }, + { + "epoch": 0.91, + "learning_rate": 1.093795969058431e-07, + "loss": 1.0487, + "step": 30152 + }, + { + "epoch": 0.91, + "learning_rate": 1.0930824782725474e-07, + "loss": 1.0914, + "step": 30153 + }, + { + "epoch": 0.91, + "learning_rate": 1.092369215069003e-07, + "loss": 1.1458, + "step": 30154 + }, + { + "epoch": 0.91, + "learning_rate": 1.0916561794545865e-07, + "loss": 1.0807, + "step": 30155 + }, + { + "epoch": 0.91, + "learning_rate": 1.0909433714360901e-07, + "loss": 1.072, + "step": 30156 + }, + { + "epoch": 0.91, + "learning_rate": 1.0902307910202997e-07, + "loss": 1.0776, + "step": 30157 + }, + { + "epoch": 0.91, + "learning_rate": 1.0895184382139962e-07, + "loss": 1.1892, + "step": 30158 + }, + { + "epoch": 0.91, + "learning_rate": 1.0888063130239573e-07, + "loss": 1.0361, + "step": 30159 + }, + { + "epoch": 0.91, + "learning_rate": 1.0880944154569694e-07, + "loss": 1.0978, + "step": 30160 + }, + { + "epoch": 0.91, + "learning_rate": 1.0873827455198104e-07, + "loss": 1.1135, + "step": 30161 + }, + { + "epoch": 0.91, + "learning_rate": 1.0866713032192444e-07, + "loss": 1.0961, + "step": 30162 + }, + { + "epoch": 0.91, + "learning_rate": 1.085960088562052e-07, + "loss": 1.0698, + "step": 30163 + }, + { + "epoch": 0.91, + "learning_rate": 1.0852491015550026e-07, + "loss": 1.1536, + "step": 30164 + }, + { + "epoch": 0.91, + "learning_rate": 1.0845383422048689e-07, + "loss": 1.0351, + "step": 30165 + }, + { + "epoch": 0.91, + "learning_rate": 1.0838278105184064e-07, + "loss": 1.0402, + "step": 30166 + }, + { + "epoch": 0.91, + "learning_rate": 1.0831175065023846e-07, + "loss": 1.0153, + "step": 30167 + }, + { + "epoch": 0.91, + "learning_rate": 1.0824074301635679e-07, + "loss": 1.0403, + "step": 30168 + }, + { + "epoch": 0.91, + "learning_rate": 1.0816975815087116e-07, + "loss": 1.1765, + "step": 30169 + }, + { + "epoch": 0.91, + "learning_rate": 1.0809879605445745e-07, + "loss": 1.0632, + "step": 30170 + }, + { + "epoch": 0.91, + "learning_rate": 1.0802785672779121e-07, + "loss": 1.1648, + "step": 30171 + }, + { + "epoch": 0.91, + "learning_rate": 1.0795694017154773e-07, + "loss": 1.1264, + "step": 30172 + }, + { + "epoch": 0.91, + "learning_rate": 1.0788604638640232e-07, + "loss": 1.2218, + "step": 30173 + }, + { + "epoch": 0.91, + "learning_rate": 1.0781517537302971e-07, + "loss": 1.1274, + "step": 30174 + }, + { + "epoch": 0.91, + "learning_rate": 1.0774432713210437e-07, + "loss": 1.1586, + "step": 30175 + }, + { + "epoch": 0.91, + "learning_rate": 1.0767350166430101e-07, + "loss": 1.1007, + "step": 30176 + }, + { + "epoch": 0.91, + "learning_rate": 1.0760269897029357e-07, + "loss": 1.1707, + "step": 30177 + }, + { + "epoch": 0.91, + "learning_rate": 1.075319190507565e-07, + "loss": 1.1369, + "step": 30178 + }, + { + "epoch": 0.91, + "learning_rate": 1.0746116190636313e-07, + "loss": 1.1356, + "step": 30179 + }, + { + "epoch": 0.91, + "learning_rate": 1.073904275377871e-07, + "loss": 1.1366, + "step": 30180 + }, + { + "epoch": 0.91, + "learning_rate": 1.0731971594570206e-07, + "loss": 1.1762, + "step": 30181 + }, + { + "epoch": 0.91, + "learning_rate": 1.0724902713078078e-07, + "loss": 1.1076, + "step": 30182 + }, + { + "epoch": 0.91, + "learning_rate": 1.0717836109369661e-07, + "loss": 1.0903, + "step": 30183 + }, + { + "epoch": 0.91, + "learning_rate": 1.071077178351218e-07, + "loss": 1.0933, + "step": 30184 + }, + { + "epoch": 0.91, + "learning_rate": 1.0703709735572914e-07, + "loss": 1.0546, + "step": 30185 + }, + { + "epoch": 0.91, + "learning_rate": 1.0696649965619088e-07, + "loss": 1.111, + "step": 30186 + }, + { + "epoch": 0.91, + "learning_rate": 1.0689592473717924e-07, + "loss": 1.0284, + "step": 30187 + }, + { + "epoch": 0.91, + "learning_rate": 1.0682537259936538e-07, + "loss": 1.0992, + "step": 30188 + }, + { + "epoch": 0.91, + "learning_rate": 1.067548432434215e-07, + "loss": 1.0661, + "step": 30189 + }, + { + "epoch": 0.91, + "learning_rate": 1.0668433667001904e-07, + "loss": 1.028, + "step": 30190 + }, + { + "epoch": 0.91, + "learning_rate": 1.0661385287982912e-07, + "loss": 1.1108, + "step": 30191 + }, + { + "epoch": 0.91, + "learning_rate": 1.0654339187352231e-07, + "loss": 1.1819, + "step": 30192 + }, + { + "epoch": 0.91, + "learning_rate": 1.0647295365177002e-07, + "loss": 1.1506, + "step": 30193 + }, + { + "epoch": 0.91, + "learning_rate": 1.0640253821524199e-07, + "loss": 1.1664, + "step": 30194 + }, + { + "epoch": 0.91, + "learning_rate": 1.0633214556460936e-07, + "loss": 1.025, + "step": 30195 + }, + { + "epoch": 0.91, + "learning_rate": 1.0626177570054158e-07, + "loss": 1.0486, + "step": 30196 + }, + { + "epoch": 0.91, + "learning_rate": 1.0619142862370896e-07, + "loss": 1.1199, + "step": 30197 + }, + { + "epoch": 0.91, + "learning_rate": 1.0612110433478123e-07, + "loss": 1.0844, + "step": 30198 + }, + { + "epoch": 0.91, + "learning_rate": 1.0605080283442759e-07, + "loss": 1.142, + "step": 30199 + }, + { + "epoch": 0.91, + "learning_rate": 1.0598052412331722e-07, + "loss": 0.9826, + "step": 30200 + }, + { + "epoch": 0.91, + "learning_rate": 1.059102682021193e-07, + "loss": 1.1019, + "step": 30201 + }, + { + "epoch": 0.91, + "learning_rate": 1.0584003507150276e-07, + "loss": 1.1794, + "step": 30202 + }, + { + "epoch": 0.91, + "learning_rate": 1.0576982473213565e-07, + "loss": 1.0066, + "step": 30203 + }, + { + "epoch": 0.91, + "learning_rate": 1.0569963718468718e-07, + "loss": 1.1012, + "step": 30204 + }, + { + "epoch": 0.91, + "learning_rate": 1.0562947242982485e-07, + "loss": 1.0739, + "step": 30205 + }, + { + "epoch": 0.91, + "learning_rate": 1.0555933046821676e-07, + "loss": 1.223, + "step": 30206 + }, + { + "epoch": 0.91, + "learning_rate": 1.0548921130053041e-07, + "loss": 1.0874, + "step": 30207 + }, + { + "epoch": 0.91, + "learning_rate": 1.0541911492743362e-07, + "loss": 1.0314, + "step": 30208 + }, + { + "epoch": 0.91, + "learning_rate": 1.053490413495939e-07, + "loss": 1.1464, + "step": 30209 + }, + { + "epoch": 0.91, + "learning_rate": 1.0527899056767792e-07, + "loss": 1.0441, + "step": 30210 + }, + { + "epoch": 0.91, + "learning_rate": 1.0520896258235242e-07, + "loss": 1.0737, + "step": 30211 + }, + { + "epoch": 0.91, + "learning_rate": 1.0513895739428403e-07, + "loss": 1.1869, + "step": 30212 + }, + { + "epoch": 0.91, + "learning_rate": 1.0506897500414003e-07, + "loss": 1.1655, + "step": 30213 + }, + { + "epoch": 0.91, + "learning_rate": 1.0499901541258545e-07, + "loss": 1.07, + "step": 30214 + }, + { + "epoch": 0.91, + "learning_rate": 1.0492907862028668e-07, + "loss": 0.9963, + "step": 30215 + }, + { + "epoch": 0.91, + "learning_rate": 1.0485916462790985e-07, + "loss": 1.0417, + "step": 30216 + }, + { + "epoch": 0.91, + "learning_rate": 1.0478927343612028e-07, + "loss": 1.1667, + "step": 30217 + }, + { + "epoch": 0.91, + "learning_rate": 1.0471940504558325e-07, + "loss": 1.1489, + "step": 30218 + }, + { + "epoch": 0.91, + "learning_rate": 1.0464955945696353e-07, + "loss": 1.0305, + "step": 30219 + }, + { + "epoch": 0.91, + "learning_rate": 1.045797366709267e-07, + "loss": 1.0667, + "step": 30220 + }, + { + "epoch": 0.91, + "learning_rate": 1.0450993668813692e-07, + "loss": 1.1262, + "step": 30221 + }, + { + "epoch": 0.91, + "learning_rate": 1.0444015950925895e-07, + "loss": 1.0638, + "step": 30222 + }, + { + "epoch": 0.91, + "learning_rate": 1.0437040513495699e-07, + "loss": 1.0271, + "step": 30223 + }, + { + "epoch": 0.91, + "learning_rate": 1.0430067356589469e-07, + "loss": 1.2325, + "step": 30224 + }, + { + "epoch": 0.91, + "learning_rate": 1.042309648027362e-07, + "loss": 0.9403, + "step": 30225 + }, + { + "epoch": 0.91, + "learning_rate": 1.0416127884614518e-07, + "loss": 1.0981, + "step": 30226 + }, + { + "epoch": 0.91, + "learning_rate": 1.04091615696785e-07, + "loss": 1.2012, + "step": 30227 + }, + { + "epoch": 0.91, + "learning_rate": 1.0402197535531872e-07, + "loss": 1.0907, + "step": 30228 + }, + { + "epoch": 0.91, + "learning_rate": 1.0395235782240914e-07, + "loss": 1.0908, + "step": 30229 + }, + { + "epoch": 0.91, + "learning_rate": 1.0388276309871937e-07, + "loss": 1.0824, + "step": 30230 + }, + { + "epoch": 0.91, + "learning_rate": 1.0381319118491162e-07, + "loss": 1.2488, + "step": 30231 + }, + { + "epoch": 0.91, + "learning_rate": 1.0374364208164817e-07, + "loss": 1.0852, + "step": 30232 + }, + { + "epoch": 0.91, + "learning_rate": 1.0367411578959125e-07, + "loss": 1.0557, + "step": 30233 + }, + { + "epoch": 0.91, + "learning_rate": 1.0360461230940228e-07, + "loss": 1.1377, + "step": 30234 + }, + { + "epoch": 0.91, + "learning_rate": 1.0353513164174406e-07, + "loss": 1.0313, + "step": 30235 + }, + { + "epoch": 0.91, + "learning_rate": 1.0346567378727663e-07, + "loss": 1.2109, + "step": 30236 + }, + { + "epoch": 0.91, + "learning_rate": 1.0339623874666166e-07, + "loss": 1.041, + "step": 30237 + }, + { + "epoch": 0.91, + "learning_rate": 1.0332682652056059e-07, + "loss": 1.1484, + "step": 30238 + }, + { + "epoch": 0.91, + "learning_rate": 1.0325743710963398e-07, + "loss": 1.072, + "step": 30239 + }, + { + "epoch": 0.91, + "learning_rate": 1.0318807051454188e-07, + "loss": 1.0203, + "step": 30240 + }, + { + "epoch": 0.91, + "learning_rate": 1.0311872673594514e-07, + "loss": 1.1251, + "step": 30241 + }, + { + "epoch": 0.91, + "learning_rate": 1.0304940577450351e-07, + "loss": 1.1777, + "step": 30242 + }, + { + "epoch": 0.91, + "learning_rate": 1.0298010763087757e-07, + "loss": 1.0991, + "step": 30243 + }, + { + "epoch": 0.91, + "learning_rate": 1.0291083230572623e-07, + "loss": 1.1956, + "step": 30244 + }, + { + "epoch": 0.91, + "learning_rate": 1.0284157979970954e-07, + "loss": 1.131, + "step": 30245 + }, + { + "epoch": 0.91, + "learning_rate": 1.0277235011348612e-07, + "loss": 0.9976, + "step": 30246 + }, + { + "epoch": 0.91, + "learning_rate": 1.0270314324771574e-07, + "loss": 1.0422, + "step": 30247 + }, + { + "epoch": 0.91, + "learning_rate": 1.0263395920305675e-07, + "loss": 1.1157, + "step": 30248 + }, + { + "epoch": 0.91, + "learning_rate": 1.0256479798016777e-07, + "loss": 1.1427, + "step": 30249 + }, + { + "epoch": 0.91, + "learning_rate": 1.0249565957970747e-07, + "loss": 1.0043, + "step": 30250 + }, + { + "epoch": 0.91, + "learning_rate": 1.0242654400233365e-07, + "loss": 1.071, + "step": 30251 + }, + { + "epoch": 0.91, + "learning_rate": 1.0235745124870439e-07, + "loss": 1.1201, + "step": 30252 + }, + { + "epoch": 0.91, + "learning_rate": 1.022883813194775e-07, + "loss": 1.0264, + "step": 30253 + }, + { + "epoch": 0.91, + "learning_rate": 1.0221933421531022e-07, + "loss": 1.0884, + "step": 30254 + }, + { + "epoch": 0.91, + "learning_rate": 1.0215030993686038e-07, + "loss": 1.1501, + "step": 30255 + }, + { + "epoch": 0.91, + "learning_rate": 1.0208130848478493e-07, + "loss": 1.0922, + "step": 30256 + }, + { + "epoch": 0.91, + "learning_rate": 1.0201232985974002e-07, + "loss": 1.0502, + "step": 30257 + }, + { + "epoch": 0.91, + "learning_rate": 1.0194337406238319e-07, + "loss": 1.0939, + "step": 30258 + }, + { + "epoch": 0.91, + "learning_rate": 1.018744410933703e-07, + "loss": 1.076, + "step": 30259 + }, + { + "epoch": 0.91, + "learning_rate": 1.0180553095335777e-07, + "loss": 1.1203, + "step": 30260 + }, + { + "epoch": 0.91, + "learning_rate": 1.0173664364300202e-07, + "loss": 1.1708, + "step": 30261 + }, + { + "epoch": 0.91, + "learning_rate": 1.0166777916295778e-07, + "loss": 1.1263, + "step": 30262 + }, + { + "epoch": 0.91, + "learning_rate": 1.015989375138815e-07, + "loss": 1.1046, + "step": 30263 + }, + { + "epoch": 0.91, + "learning_rate": 1.0153011869642792e-07, + "loss": 1.0416, + "step": 30264 + }, + { + "epoch": 0.91, + "learning_rate": 1.014613227112532e-07, + "loss": 1.0682, + "step": 30265 + }, + { + "epoch": 0.91, + "learning_rate": 1.0139254955901095e-07, + "loss": 1.1908, + "step": 30266 + }, + { + "epoch": 0.91, + "learning_rate": 1.0132379924035624e-07, + "loss": 1.1316, + "step": 30267 + }, + { + "epoch": 0.91, + "learning_rate": 1.0125507175594406e-07, + "loss": 1.194, + "step": 30268 + }, + { + "epoch": 0.91, + "learning_rate": 1.0118636710642838e-07, + "loss": 1.1383, + "step": 30269 + }, + { + "epoch": 0.91, + "learning_rate": 1.0111768529246307e-07, + "loss": 1.0144, + "step": 30270 + }, + { + "epoch": 0.91, + "learning_rate": 1.0104902631470181e-07, + "loss": 0.9127, + "step": 30271 + }, + { + "epoch": 0.91, + "learning_rate": 1.0098039017379852e-07, + "loss": 1.1296, + "step": 30272 + }, + { + "epoch": 0.91, + "learning_rate": 1.0091177687040681e-07, + "loss": 1.1442, + "step": 30273 + }, + { + "epoch": 0.91, + "learning_rate": 1.0084318640517953e-07, + "loss": 1.1926, + "step": 30274 + }, + { + "epoch": 0.91, + "learning_rate": 1.0077461877876948e-07, + "loss": 1.0847, + "step": 30275 + }, + { + "epoch": 0.91, + "learning_rate": 1.0070607399182947e-07, + "loss": 1.1053, + "step": 30276 + }, + { + "epoch": 0.91, + "learning_rate": 1.0063755204501203e-07, + "loss": 1.113, + "step": 30277 + }, + { + "epoch": 0.91, + "learning_rate": 1.0056905293896967e-07, + "loss": 1.0003, + "step": 30278 + }, + { + "epoch": 0.91, + "learning_rate": 1.0050057667435414e-07, + "loss": 1.1357, + "step": 30279 + }, + { + "epoch": 0.91, + "learning_rate": 1.0043212325181767e-07, + "loss": 1.2367, + "step": 30280 + }, + { + "epoch": 0.91, + "learning_rate": 1.0036369267201169e-07, + "loss": 1.1922, + "step": 30281 + }, + { + "epoch": 0.91, + "learning_rate": 1.0029528493558788e-07, + "loss": 1.1457, + "step": 30282 + }, + { + "epoch": 0.91, + "learning_rate": 1.0022690004319685e-07, + "loss": 1.1838, + "step": 30283 + }, + { + "epoch": 0.91, + "learning_rate": 1.001585379954903e-07, + "loss": 1.0746, + "step": 30284 + }, + { + "epoch": 0.91, + "learning_rate": 1.0009019879311826e-07, + "loss": 1.0298, + "step": 30285 + }, + { + "epoch": 0.91, + "learning_rate": 1.0002188243673188e-07, + "loss": 1.0428, + "step": 30286 + }, + { + "epoch": 0.91, + "learning_rate": 9.995358892698149e-08, + "loss": 1.2178, + "step": 30287 + }, + { + "epoch": 0.91, + "learning_rate": 9.988531826451681e-08, + "loss": 1.0825, + "step": 30288 + }, + { + "epoch": 0.91, + "learning_rate": 9.981707044998817e-08, + "loss": 1.1985, + "step": 30289 + }, + { + "epoch": 0.91, + "learning_rate": 9.974884548404478e-08, + "loss": 1.1217, + "step": 30290 + }, + { + "epoch": 0.91, + "learning_rate": 9.968064336733669e-08, + "loss": 1.1909, + "step": 30291 + }, + { + "epoch": 0.91, + "learning_rate": 9.961246410051279e-08, + "loss": 1.2288, + "step": 30292 + }, + { + "epoch": 0.91, + "learning_rate": 9.954430768422201e-08, + "loss": 1.2471, + "step": 30293 + }, + { + "epoch": 0.91, + "learning_rate": 9.947617411911331e-08, + "loss": 1.0167, + "step": 30294 + }, + { + "epoch": 0.91, + "learning_rate": 9.940806340583559e-08, + "loss": 1.1023, + "step": 30295 + }, + { + "epoch": 0.91, + "learning_rate": 9.933997554503665e-08, + "loss": 1.0363, + "step": 30296 + }, + { + "epoch": 0.91, + "learning_rate": 9.92719105373649e-08, + "loss": 1.0713, + "step": 30297 + }, + { + "epoch": 0.91, + "learning_rate": 9.92038683834684e-08, + "loss": 1.1255, + "step": 30298 + }, + { + "epoch": 0.91, + "learning_rate": 9.91358490839947e-08, + "loss": 1.1127, + "step": 30299 + }, + { + "epoch": 0.91, + "learning_rate": 9.90678526395919e-08, + "loss": 1.1151, + "step": 30300 + }, + { + "epoch": 0.91, + "learning_rate": 9.899987905090641e-08, + "loss": 1.1649, + "step": 30301 + }, + { + "epoch": 0.91, + "learning_rate": 9.893192831858577e-08, + "loss": 1.134, + "step": 30302 + }, + { + "epoch": 0.91, + "learning_rate": 9.886400044327671e-08, + "loss": 1.0986, + "step": 30303 + }, + { + "epoch": 0.91, + "learning_rate": 9.879609542562618e-08, + "loss": 1.1624, + "step": 30304 + }, + { + "epoch": 0.91, + "learning_rate": 9.872821326628007e-08, + "loss": 1.2322, + "step": 30305 + }, + { + "epoch": 0.91, + "learning_rate": 9.866035396588508e-08, + "loss": 1.1051, + "step": 30306 + }, + { + "epoch": 0.91, + "learning_rate": 9.859251752508681e-08, + "loss": 1.0684, + "step": 30307 + }, + { + "epoch": 0.91, + "learning_rate": 9.852470394453112e-08, + "loss": 1.2218, + "step": 30308 + }, + { + "epoch": 0.91, + "learning_rate": 9.84569132248639e-08, + "loss": 1.1389, + "step": 30309 + }, + { + "epoch": 0.91, + "learning_rate": 9.838914536673016e-08, + "loss": 1.1479, + "step": 30310 + }, + { + "epoch": 0.91, + "learning_rate": 9.832140037077498e-08, + "loss": 1.2616, + "step": 30311 + }, + { + "epoch": 0.91, + "learning_rate": 9.825367823764364e-08, + "loss": 1.0634, + "step": 30312 + }, + { + "epoch": 0.91, + "learning_rate": 9.818597896798065e-08, + "loss": 1.1763, + "step": 30313 + }, + { + "epoch": 0.91, + "learning_rate": 9.811830256243021e-08, + "loss": 1.0643, + "step": 30314 + }, + { + "epoch": 0.91, + "learning_rate": 9.805064902163652e-08, + "loss": 1.0906, + "step": 30315 + }, + { + "epoch": 0.91, + "learning_rate": 9.798301834624408e-08, + "loss": 1.0898, + "step": 30316 + }, + { + "epoch": 0.91, + "learning_rate": 9.791541053689679e-08, + "loss": 1.171, + "step": 30317 + }, + { + "epoch": 0.91, + "learning_rate": 9.78478255942375e-08, + "loss": 1.002, + "step": 30318 + }, + { + "epoch": 0.91, + "learning_rate": 9.778026351890985e-08, + "loss": 1.1608, + "step": 30319 + }, + { + "epoch": 0.91, + "learning_rate": 9.771272431155721e-08, + "loss": 1.0861, + "step": 30320 + }, + { + "epoch": 0.91, + "learning_rate": 9.764520797282295e-08, + "loss": 1.0458, + "step": 30321 + }, + { + "epoch": 0.91, + "learning_rate": 9.75777145033488e-08, + "loss": 1.048, + "step": 30322 + }, + { + "epoch": 0.91, + "learning_rate": 9.751024390377784e-08, + "loss": 1.0442, + "step": 30323 + }, + { + "epoch": 0.91, + "learning_rate": 9.744279617475233e-08, + "loss": 1.186, + "step": 30324 + }, + { + "epoch": 0.91, + "learning_rate": 9.737537131691427e-08, + "loss": 0.986, + "step": 30325 + }, + { + "epoch": 0.91, + "learning_rate": 9.730796933090564e-08, + "loss": 1.013, + "step": 30326 + }, + { + "epoch": 0.91, + "learning_rate": 9.724059021736787e-08, + "loss": 1.0962, + "step": 30327 + }, + { + "epoch": 0.91, + "learning_rate": 9.71732339769424e-08, + "loss": 1.0745, + "step": 30328 + }, + { + "epoch": 0.91, + "learning_rate": 9.710590061027065e-08, + "loss": 1.0826, + "step": 30329 + }, + { + "epoch": 0.91, + "learning_rate": 9.70385901179935e-08, + "loss": 1.1052, + "step": 30330 + }, + { + "epoch": 0.91, + "learning_rate": 9.697130250075154e-08, + "loss": 1.2551, + "step": 30331 + }, + { + "epoch": 0.91, + "learning_rate": 9.69040377591854e-08, + "loss": 1.1078, + "step": 30332 + }, + { + "epoch": 0.91, + "learning_rate": 9.683679589393535e-08, + "loss": 1.0211, + "step": 30333 + }, + { + "epoch": 0.91, + "learning_rate": 9.676957690564176e-08, + "loss": 1.0665, + "step": 30334 + }, + { + "epoch": 0.91, + "learning_rate": 9.670238079494437e-08, + "loss": 1.1661, + "step": 30335 + }, + { + "epoch": 0.91, + "learning_rate": 9.663520756248269e-08, + "loss": 1.1434, + "step": 30336 + }, + { + "epoch": 0.91, + "learning_rate": 9.656805720889645e-08, + "loss": 1.122, + "step": 30337 + }, + { + "epoch": 0.91, + "learning_rate": 9.65009297348246e-08, + "loss": 1.0194, + "step": 30338 + }, + { + "epoch": 0.91, + "learning_rate": 9.643382514090694e-08, + "loss": 1.0815, + "step": 30339 + }, + { + "epoch": 0.91, + "learning_rate": 9.636674342778097e-08, + "loss": 1.0017, + "step": 30340 + }, + { + "epoch": 0.91, + "learning_rate": 9.629968459608619e-08, + "loss": 1.1663, + "step": 30341 + }, + { + "epoch": 0.91, + "learning_rate": 9.623264864646098e-08, + "loss": 1.1552, + "step": 30342 + }, + { + "epoch": 0.91, + "learning_rate": 9.616563557954317e-08, + "loss": 1.1179, + "step": 30343 + }, + { + "epoch": 0.91, + "learning_rate": 9.609864539597058e-08, + "loss": 1.2257, + "step": 30344 + }, + { + "epoch": 0.91, + "learning_rate": 9.60316780963813e-08, + "loss": 1.0997, + "step": 30345 + }, + { + "epoch": 0.91, + "learning_rate": 9.596473368141262e-08, + "loss": 0.9774, + "step": 30346 + }, + { + "epoch": 0.91, + "learning_rate": 9.589781215170207e-08, + "loss": 1.0636, + "step": 30347 + }, + { + "epoch": 0.91, + "learning_rate": 9.583091350788609e-08, + "loss": 1.1517, + "step": 30348 + }, + { + "epoch": 0.91, + "learning_rate": 9.576403775060223e-08, + "loss": 1.0599, + "step": 30349 + }, + { + "epoch": 0.91, + "learning_rate": 9.569718488048662e-08, + "loss": 1.0758, + "step": 30350 + }, + { + "epoch": 0.91, + "learning_rate": 9.563035489817602e-08, + "loss": 1.1433, + "step": 30351 + }, + { + "epoch": 0.91, + "learning_rate": 9.556354780430627e-08, + "loss": 1.2188, + "step": 30352 + }, + { + "epoch": 0.91, + "learning_rate": 9.549676359951355e-08, + "loss": 1.0825, + "step": 30353 + }, + { + "epoch": 0.91, + "learning_rate": 9.543000228443373e-08, + "loss": 1.0635, + "step": 30354 + }, + { + "epoch": 0.91, + "learning_rate": 9.536326385970213e-08, + "loss": 1.0839, + "step": 30355 + }, + { + "epoch": 0.91, + "learning_rate": 9.529654832595437e-08, + "loss": 0.9891, + "step": 30356 + }, + { + "epoch": 0.91, + "learning_rate": 9.522985568382492e-08, + "loss": 1.0396, + "step": 30357 + }, + { + "epoch": 0.91, + "learning_rate": 9.516318593394913e-08, + "loss": 1.2145, + "step": 30358 + }, + { + "epoch": 0.91, + "learning_rate": 9.509653907696176e-08, + "loss": 1.017, + "step": 30359 + }, + { + "epoch": 0.91, + "learning_rate": 9.502991511349702e-08, + "loss": 1.0858, + "step": 30360 + }, + { + "epoch": 0.91, + "learning_rate": 9.496331404418913e-08, + "loss": 1.0364, + "step": 30361 + }, + { + "epoch": 0.91, + "learning_rate": 9.48967358696723e-08, + "loss": 1.1296, + "step": 30362 + }, + { + "epoch": 0.91, + "learning_rate": 9.483018059058018e-08, + "loss": 1.1488, + "step": 30363 + }, + { + "epoch": 0.91, + "learning_rate": 9.476364820754674e-08, + "loss": 1.0193, + "step": 30364 + }, + { + "epoch": 0.91, + "learning_rate": 9.469713872120451e-08, + "loss": 0.9943, + "step": 30365 + }, + { + "epoch": 0.91, + "learning_rate": 9.463065213218714e-08, + "loss": 1.0171, + "step": 30366 + }, + { + "epoch": 0.91, + "learning_rate": 9.456418844112747e-08, + "loss": 1.108, + "step": 30367 + }, + { + "epoch": 0.91, + "learning_rate": 9.449774764865832e-08, + "loss": 1.1568, + "step": 30368 + }, + { + "epoch": 0.91, + "learning_rate": 9.443132975541225e-08, + "loss": 1.0705, + "step": 30369 + }, + { + "epoch": 0.91, + "learning_rate": 9.436493476202124e-08, + "loss": 1.0365, + "step": 30370 + }, + { + "epoch": 0.91, + "learning_rate": 9.42985626691173e-08, + "loss": 1.1221, + "step": 30371 + }, + { + "epoch": 0.91, + "learning_rate": 9.423221347733242e-08, + "loss": 0.9843, + "step": 30372 + }, + { + "epoch": 0.91, + "learning_rate": 9.416588718729858e-08, + "loss": 1.1678, + "step": 30373 + }, + { + "epoch": 0.92, + "learning_rate": 9.409958379964668e-08, + "loss": 1.2143, + "step": 30374 + }, + { + "epoch": 0.92, + "learning_rate": 9.40333033150076e-08, + "loss": 1.1132, + "step": 30375 + }, + { + "epoch": 0.92, + "learning_rate": 9.396704573401305e-08, + "loss": 1.0312, + "step": 30376 + }, + { + "epoch": 0.92, + "learning_rate": 9.390081105729366e-08, + "loss": 1.1953, + "step": 30377 + }, + { + "epoch": 0.92, + "learning_rate": 9.383459928547944e-08, + "loss": 0.991, + "step": 30378 + }, + { + "epoch": 0.92, + "learning_rate": 9.376841041920076e-08, + "loss": 1.1502, + "step": 30379 + }, + { + "epoch": 0.92, + "learning_rate": 9.37022444590882e-08, + "loss": 1.0414, + "step": 30380 + }, + { + "epoch": 0.92, + "learning_rate": 9.363610140577128e-08, + "loss": 1.1029, + "step": 30381 + }, + { + "epoch": 0.92, + "learning_rate": 9.356998125988004e-08, + "loss": 1.1242, + "step": 30382 + }, + { + "epoch": 0.92, + "learning_rate": 9.350388402204341e-08, + "loss": 1.1713, + "step": 30383 + }, + { + "epoch": 0.92, + "learning_rate": 9.343780969289062e-08, + "loss": 1.0089, + "step": 30384 + }, + { + "epoch": 0.92, + "learning_rate": 9.33717582730509e-08, + "loss": 1.1522, + "step": 30385 + }, + { + "epoch": 0.92, + "learning_rate": 9.330572976315344e-08, + "loss": 1.0726, + "step": 30386 + }, + { + "epoch": 0.92, + "learning_rate": 9.323972416382582e-08, + "loss": 1.0391, + "step": 30387 + }, + { + "epoch": 0.92, + "learning_rate": 9.317374147569697e-08, + "loss": 1.1496, + "step": 30388 + }, + { + "epoch": 0.92, + "learning_rate": 9.310778169939472e-08, + "loss": 1.0824, + "step": 30389 + }, + { + "epoch": 0.92, + "learning_rate": 9.304184483554746e-08, + "loss": 1.0789, + "step": 30390 + }, + { + "epoch": 0.92, + "learning_rate": 9.297593088478246e-08, + "loss": 1.05, + "step": 30391 + }, + { + "epoch": 0.92, + "learning_rate": 9.291003984772757e-08, + "loss": 1.1237, + "step": 30392 + }, + { + "epoch": 0.92, + "learning_rate": 9.284417172500948e-08, + "loss": 0.985, + "step": 30393 + }, + { + "epoch": 0.92, + "learning_rate": 9.277832651725577e-08, + "loss": 1.0894, + "step": 30394 + }, + { + "epoch": 0.92, + "learning_rate": 9.271250422509315e-08, + "loss": 1.0644, + "step": 30395 + }, + { + "epoch": 0.92, + "learning_rate": 9.264670484914806e-08, + "loss": 1.1415, + "step": 30396 + }, + { + "epoch": 0.92, + "learning_rate": 9.258092839004667e-08, + "loss": 1.0966, + "step": 30397 + }, + { + "epoch": 0.92, + "learning_rate": 9.251517484841544e-08, + "loss": 1.2117, + "step": 30398 + }, + { + "epoch": 0.92, + "learning_rate": 9.244944422488078e-08, + "loss": 1.121, + "step": 30399 + }, + { + "epoch": 0.92, + "learning_rate": 9.238373652006722e-08, + "loss": 1.0259, + "step": 30400 + }, + { + "epoch": 0.92, + "learning_rate": 9.231805173460117e-08, + "loss": 1.0891, + "step": 30401 + }, + { + "epoch": 0.92, + "learning_rate": 9.225238986910773e-08, + "loss": 1.0615, + "step": 30402 + }, + { + "epoch": 0.92, + "learning_rate": 9.21867509242122e-08, + "loss": 1.1944, + "step": 30403 + }, + { + "epoch": 0.92, + "learning_rate": 9.21211349005388e-08, + "loss": 1.0731, + "step": 30404 + }, + { + "epoch": 0.92, + "learning_rate": 9.205554179871262e-08, + "loss": 1.1587, + "step": 30405 + }, + { + "epoch": 0.92, + "learning_rate": 9.198997161935786e-08, + "loss": 1.1902, + "step": 30406 + }, + { + "epoch": 0.92, + "learning_rate": 9.192442436309872e-08, + "loss": 0.9587, + "step": 30407 + }, + { + "epoch": 0.92, + "learning_rate": 9.185890003055975e-08, + "loss": 1.1149, + "step": 30408 + }, + { + "epoch": 0.92, + "learning_rate": 9.179339862236403e-08, + "loss": 1.1191, + "step": 30409 + }, + { + "epoch": 0.92, + "learning_rate": 9.172792013913523e-08, + "loss": 1.166, + "step": 30410 + }, + { + "epoch": 0.92, + "learning_rate": 9.166246458149674e-08, + "loss": 1.1046, + "step": 30411 + }, + { + "epoch": 0.92, + "learning_rate": 9.159703195007197e-08, + "loss": 1.1839, + "step": 30412 + }, + { + "epoch": 0.92, + "learning_rate": 9.153162224548346e-08, + "loss": 0.9775, + "step": 30413 + }, + { + "epoch": 0.92, + "learning_rate": 9.146623546835376e-08, + "loss": 1.0676, + "step": 30414 + }, + { + "epoch": 0.92, + "learning_rate": 9.140087161930545e-08, + "loss": 0.9849, + "step": 30415 + }, + { + "epoch": 0.92, + "learning_rate": 9.133553069896078e-08, + "loss": 1.0186, + "step": 30416 + }, + { + "epoch": 0.92, + "learning_rate": 9.127021270794206e-08, + "loss": 1.0588, + "step": 30417 + }, + { + "epoch": 0.92, + "learning_rate": 9.120491764687073e-08, + "loss": 1.0319, + "step": 30418 + }, + { + "epoch": 0.92, + "learning_rate": 9.113964551636823e-08, + "loss": 0.966, + "step": 30419 + }, + { + "epoch": 0.92, + "learning_rate": 9.107439631705656e-08, + "loss": 1.0743, + "step": 30420 + }, + { + "epoch": 0.92, + "learning_rate": 9.100917004955634e-08, + "loss": 1.0274, + "step": 30421 + }, + { + "epoch": 0.92, + "learning_rate": 9.094396671448873e-08, + "loss": 1.0374, + "step": 30422 + }, + { + "epoch": 0.92, + "learning_rate": 9.08787863124741e-08, + "loss": 1.0643, + "step": 30423 + }, + { + "epoch": 0.92, + "learning_rate": 9.081362884413303e-08, + "loss": 1.2008, + "step": 30424 + }, + { + "epoch": 0.92, + "learning_rate": 9.074849431008642e-08, + "loss": 1.213, + "step": 30425 + }, + { + "epoch": 0.92, + "learning_rate": 9.06833827109535e-08, + "loss": 1.05, + "step": 30426 + }, + { + "epoch": 0.92, + "learning_rate": 9.061829404735434e-08, + "loss": 1.0911, + "step": 30427 + }, + { + "epoch": 0.92, + "learning_rate": 9.055322831990843e-08, + "loss": 1.0226, + "step": 30428 + }, + { + "epoch": 0.92, + "learning_rate": 9.048818552923583e-08, + "loss": 1.2062, + "step": 30429 + }, + { + "epoch": 0.92, + "learning_rate": 9.042316567595494e-08, + "loss": 1.1703, + "step": 30430 + }, + { + "epoch": 0.92, + "learning_rate": 9.035816876068527e-08, + "loss": 1.1321, + "step": 30431 + }, + { + "epoch": 0.92, + "learning_rate": 9.029319478404492e-08, + "loss": 1.1107, + "step": 30432 + }, + { + "epoch": 0.92, + "learning_rate": 9.022824374665312e-08, + "loss": 1.1783, + "step": 30433 + }, + { + "epoch": 0.92, + "learning_rate": 9.0163315649128e-08, + "loss": 1.1313, + "step": 30434 + }, + { + "epoch": 0.92, + "learning_rate": 9.009841049208712e-08, + "loss": 1.0481, + "step": 30435 + }, + { + "epoch": 0.92, + "learning_rate": 9.003352827614887e-08, + "loss": 1.0588, + "step": 30436 + }, + { + "epoch": 0.92, + "learning_rate": 8.996866900193051e-08, + "loss": 1.0737, + "step": 30437 + }, + { + "epoch": 0.92, + "learning_rate": 8.990383267005021e-08, + "loss": 1.2253, + "step": 30438 + }, + { + "epoch": 0.92, + "learning_rate": 8.983901928112438e-08, + "loss": 1.0887, + "step": 30439 + }, + { + "epoch": 0.92, + "learning_rate": 8.977422883577031e-08, + "loss": 1.1049, + "step": 30440 + }, + { + "epoch": 0.92, + "learning_rate": 8.970946133460473e-08, + "loss": 0.9782, + "step": 30441 + }, + { + "epoch": 0.92, + "learning_rate": 8.964471677824438e-08, + "loss": 1.2352, + "step": 30442 + }, + { + "epoch": 0.92, + "learning_rate": 8.957999516730515e-08, + "loss": 1.2133, + "step": 30443 + }, + { + "epoch": 0.92, + "learning_rate": 8.951529650240376e-08, + "loss": 1.0993, + "step": 30444 + }, + { + "epoch": 0.92, + "learning_rate": 8.945062078415556e-08, + "loss": 1.0892, + "step": 30445 + }, + { + "epoch": 0.92, + "learning_rate": 8.938596801317701e-08, + "loss": 1.148, + "step": 30446 + }, + { + "epoch": 0.92, + "learning_rate": 8.932133819008287e-08, + "loss": 1.1074, + "step": 30447 + }, + { + "epoch": 0.92, + "learning_rate": 8.925673131548823e-08, + "loss": 1.0212, + "step": 30448 + }, + { + "epoch": 0.92, + "learning_rate": 8.91921473900087e-08, + "loss": 1.1466, + "step": 30449 + }, + { + "epoch": 0.92, + "learning_rate": 8.912758641425878e-08, + "loss": 1.011, + "step": 30450 + }, + { + "epoch": 0.92, + "learning_rate": 8.906304838885326e-08, + "loss": 1.0765, + "step": 30451 + }, + { + "epoch": 0.92, + "learning_rate": 8.899853331440639e-08, + "loss": 1.0986, + "step": 30452 + }, + { + "epoch": 0.92, + "learning_rate": 8.893404119153209e-08, + "loss": 0.9589, + "step": 30453 + }, + { + "epoch": 0.92, + "learning_rate": 8.886957202084434e-08, + "loss": 1.0779, + "step": 30454 + }, + { + "epoch": 0.92, + "learning_rate": 8.880512580295764e-08, + "loss": 1.1797, + "step": 30455 + }, + { + "epoch": 0.92, + "learning_rate": 8.874070253848455e-08, + "loss": 1.1885, + "step": 30456 + }, + { + "epoch": 0.92, + "learning_rate": 8.867630222803846e-08, + "loss": 1.1421, + "step": 30457 + }, + { + "epoch": 0.92, + "learning_rate": 8.86119248722328e-08, + "loss": 1.1725, + "step": 30458 + }, + { + "epoch": 0.92, + "learning_rate": 8.854757047168011e-08, + "loss": 1.065, + "step": 30459 + }, + { + "epoch": 0.92, + "learning_rate": 8.848323902699352e-08, + "loss": 1.1372, + "step": 30460 + }, + { + "epoch": 0.92, + "learning_rate": 8.841893053878503e-08, + "loss": 1.1373, + "step": 30461 + }, + { + "epoch": 0.92, + "learning_rate": 8.835464500766638e-08, + "loss": 1.1039, + "step": 30462 + }, + { + "epoch": 0.92, + "learning_rate": 8.829038243425042e-08, + "loss": 1.1251, + "step": 30463 + }, + { + "epoch": 0.92, + "learning_rate": 8.82261428191486e-08, + "loss": 1.1587, + "step": 30464 + }, + { + "epoch": 0.92, + "learning_rate": 8.816192616297209e-08, + "loss": 1.1401, + "step": 30465 + }, + { + "epoch": 0.92, + "learning_rate": 8.809773246633263e-08, + "loss": 1.1097, + "step": 30466 + }, + { + "epoch": 0.92, + "learning_rate": 8.803356172984085e-08, + "loss": 1.1063, + "step": 30467 + }, + { + "epoch": 0.92, + "learning_rate": 8.796941395410846e-08, + "loss": 1.0992, + "step": 30468 + }, + { + "epoch": 0.92, + "learning_rate": 8.7905289139745e-08, + "loss": 1.1382, + "step": 30469 + }, + { + "epoch": 0.92, + "learning_rate": 8.784118728736163e-08, + "loss": 1.0737, + "step": 30470 + }, + { + "epoch": 0.92, + "learning_rate": 8.77771083975687e-08, + "loss": 1.0503, + "step": 30471 + }, + { + "epoch": 0.92, + "learning_rate": 8.771305247097544e-08, + "loss": 1.0841, + "step": 30472 + }, + { + "epoch": 0.92, + "learning_rate": 8.764901950819249e-08, + "loss": 1.046, + "step": 30473 + }, + { + "epoch": 0.92, + "learning_rate": 8.758500950982879e-08, + "loss": 1.2051, + "step": 30474 + }, + { + "epoch": 0.92, + "learning_rate": 8.752102247649413e-08, + "loss": 1.0961, + "step": 30475 + }, + { + "epoch": 0.92, + "learning_rate": 8.745705840879748e-08, + "loss": 1.0496, + "step": 30476 + }, + { + "epoch": 0.92, + "learning_rate": 8.739311730734779e-08, + "loss": 1.0963, + "step": 30477 + }, + { + "epoch": 0.92, + "learning_rate": 8.732919917275373e-08, + "loss": 0.9777, + "step": 30478 + }, + { + "epoch": 0.92, + "learning_rate": 8.726530400562344e-08, + "loss": 1.0782, + "step": 30479 + }, + { + "epoch": 0.92, + "learning_rate": 8.720143180656532e-08, + "loss": 1.003, + "step": 30480 + }, + { + "epoch": 0.92, + "learning_rate": 8.713758257618804e-08, + "loss": 1.1273, + "step": 30481 + }, + { + "epoch": 0.92, + "learning_rate": 8.707375631509863e-08, + "loss": 1.0551, + "step": 30482 + }, + { + "epoch": 0.92, + "learning_rate": 8.700995302390491e-08, + "loss": 1.09, + "step": 30483 + }, + { + "epoch": 0.92, + "learning_rate": 8.694617270321421e-08, + "loss": 1.0632, + "step": 30484 + }, + { + "epoch": 0.92, + "learning_rate": 8.688241535363379e-08, + "loss": 1.1705, + "step": 30485 + }, + { + "epoch": 0.92, + "learning_rate": 8.681868097577095e-08, + "loss": 0.956, + "step": 30486 + }, + { + "epoch": 0.92, + "learning_rate": 8.675496957023161e-08, + "loss": 1.2267, + "step": 30487 + }, + { + "epoch": 0.92, + "learning_rate": 8.669128113762305e-08, + "loss": 1.0955, + "step": 30488 + }, + { + "epoch": 0.92, + "learning_rate": 8.662761567855087e-08, + "loss": 1.217, + "step": 30489 + }, + { + "epoch": 0.92, + "learning_rate": 8.656397319362186e-08, + "loss": 1.1616, + "step": 30490 + }, + { + "epoch": 0.92, + "learning_rate": 8.650035368344106e-08, + "loss": 1.04, + "step": 30491 + }, + { + "epoch": 0.92, + "learning_rate": 8.643675714861466e-08, + "loss": 1.1689, + "step": 30492 + }, + { + "epoch": 0.92, + "learning_rate": 8.6373183589748e-08, + "loss": 1.1791, + "step": 30493 + }, + { + "epoch": 0.92, + "learning_rate": 8.630963300744644e-08, + "loss": 1.1668, + "step": 30494 + }, + { + "epoch": 0.92, + "learning_rate": 8.624610540231421e-08, + "loss": 1.0726, + "step": 30495 + }, + { + "epoch": 0.92, + "learning_rate": 8.618260077495665e-08, + "loss": 1.0926, + "step": 30496 + }, + { + "epoch": 0.92, + "learning_rate": 8.611911912597831e-08, + "loss": 1.1602, + "step": 30497 + }, + { + "epoch": 0.92, + "learning_rate": 8.605566045598312e-08, + "loss": 1.1158, + "step": 30498 + }, + { + "epoch": 0.92, + "learning_rate": 8.599222476557589e-08, + "loss": 1.034, + "step": 30499 + }, + { + "epoch": 0.92, + "learning_rate": 8.592881205535974e-08, + "loss": 1.1796, + "step": 30500 + }, + { + "epoch": 0.92, + "learning_rate": 8.586542232593864e-08, + "loss": 1.1564, + "step": 30501 + }, + { + "epoch": 0.92, + "learning_rate": 8.580205557791599e-08, + "loss": 1.1589, + "step": 30502 + }, + { + "epoch": 0.92, + "learning_rate": 8.573871181189547e-08, + "loss": 1.1059, + "step": 30503 + }, + { + "epoch": 0.92, + "learning_rate": 8.567539102847939e-08, + "loss": 1.1472, + "step": 30504 + }, + { + "epoch": 0.92, + "learning_rate": 8.561209322827086e-08, + "loss": 1.157, + "step": 30505 + }, + { + "epoch": 0.92, + "learning_rate": 8.554881841187217e-08, + "loss": 1.0976, + "step": 30506 + }, + { + "epoch": 0.92, + "learning_rate": 8.548556657988649e-08, + "loss": 0.9608, + "step": 30507 + }, + { + "epoch": 0.92, + "learning_rate": 8.54223377329147e-08, + "loss": 1.0883, + "step": 30508 + }, + { + "epoch": 0.92, + "learning_rate": 8.535913187155964e-08, + "loss": 1.0617, + "step": 30509 + }, + { + "epoch": 0.92, + "learning_rate": 8.529594899642252e-08, + "loss": 1.2209, + "step": 30510 + }, + { + "epoch": 0.92, + "learning_rate": 8.523278910810506e-08, + "loss": 1.1141, + "step": 30511 + }, + { + "epoch": 0.92, + "learning_rate": 8.516965220720902e-08, + "loss": 0.9969, + "step": 30512 + }, + { + "epoch": 0.92, + "learning_rate": 8.510653829433418e-08, + "loss": 1.2489, + "step": 30513 + }, + { + "epoch": 0.92, + "learning_rate": 8.50434473700823e-08, + "loss": 1.1693, + "step": 30514 + }, + { + "epoch": 0.92, + "learning_rate": 8.498037943505344e-08, + "loss": 1.1241, + "step": 30515 + }, + { + "epoch": 0.92, + "learning_rate": 8.491733448984879e-08, + "loss": 1.1484, + "step": 30516 + }, + { + "epoch": 0.92, + "learning_rate": 8.48543125350676e-08, + "loss": 1.1508, + "step": 30517 + }, + { + "epoch": 0.92, + "learning_rate": 8.47913135713102e-08, + "loss": 1.1929, + "step": 30518 + }, + { + "epoch": 0.92, + "learning_rate": 8.472833759917642e-08, + "loss": 1.0512, + "step": 30519 + }, + { + "epoch": 0.92, + "learning_rate": 8.466538461926576e-08, + "loss": 1.2024, + "step": 30520 + }, + { + "epoch": 0.92, + "learning_rate": 8.460245463217692e-08, + "loss": 1.0602, + "step": 30521 + }, + { + "epoch": 0.92, + "learning_rate": 8.453954763850969e-08, + "loss": 1.0209, + "step": 30522 + }, + { + "epoch": 0.92, + "learning_rate": 8.447666363886248e-08, + "loss": 0.9625, + "step": 30523 + }, + { + "epoch": 0.92, + "learning_rate": 8.441380263383425e-08, + "loss": 1.2227, + "step": 30524 + }, + { + "epoch": 0.92, + "learning_rate": 8.435096462402315e-08, + "loss": 1.1405, + "step": 30525 + }, + { + "epoch": 0.92, + "learning_rate": 8.428814961002757e-08, + "loss": 1.0876, + "step": 30526 + }, + { + "epoch": 0.92, + "learning_rate": 8.42253575924451e-08, + "loss": 1.1743, + "step": 30527 + }, + { + "epoch": 0.92, + "learning_rate": 8.416258857187387e-08, + "loss": 1.0023, + "step": 30528 + }, + { + "epoch": 0.92, + "learning_rate": 8.409984254891174e-08, + "loss": 1.0104, + "step": 30529 + }, + { + "epoch": 0.92, + "learning_rate": 8.403711952415489e-08, + "loss": 1.1945, + "step": 30530 + }, + { + "epoch": 0.92, + "learning_rate": 8.397441949820145e-08, + "loss": 1.1052, + "step": 30531 + }, + { + "epoch": 0.92, + "learning_rate": 8.391174247164791e-08, + "loss": 1.0769, + "step": 30532 + }, + { + "epoch": 0.92, + "learning_rate": 8.384908844509099e-08, + "loss": 1.2246, + "step": 30533 + }, + { + "epoch": 0.92, + "learning_rate": 8.378645741912688e-08, + "loss": 1.0657, + "step": 30534 + }, + { + "epoch": 0.92, + "learning_rate": 8.372384939435235e-08, + "loss": 1.0405, + "step": 30535 + }, + { + "epoch": 0.92, + "learning_rate": 8.366126437136274e-08, + "loss": 1.2288, + "step": 30536 + }, + { + "epoch": 0.92, + "learning_rate": 8.359870235075451e-08, + "loss": 1.1039, + "step": 30537 + }, + { + "epoch": 0.92, + "learning_rate": 8.353616333312248e-08, + "loss": 1.0627, + "step": 30538 + }, + { + "epoch": 0.92, + "learning_rate": 8.347364731906226e-08, + "loss": 1.007, + "step": 30539 + }, + { + "epoch": 0.92, + "learning_rate": 8.341115430916952e-08, + "loss": 1.0574, + "step": 30540 + }, + { + "epoch": 0.92, + "learning_rate": 8.33486843040382e-08, + "loss": 1.0883, + "step": 30541 + }, + { + "epoch": 0.92, + "learning_rate": 8.328623730426422e-08, + "loss": 1.0951, + "step": 30542 + }, + { + "epoch": 0.92, + "learning_rate": 8.322381331044071e-08, + "loss": 1.1556, + "step": 30543 + }, + { + "epoch": 0.92, + "learning_rate": 8.316141232316277e-08, + "loss": 1.0987, + "step": 30544 + }, + { + "epoch": 0.92, + "learning_rate": 8.309903434302407e-08, + "loss": 1.1225, + "step": 30545 + }, + { + "epoch": 0.92, + "learning_rate": 8.303667937061887e-08, + "loss": 1.0955, + "step": 30546 + }, + { + "epoch": 0.92, + "learning_rate": 8.29743474065403e-08, + "loss": 1.0833, + "step": 30547 + }, + { + "epoch": 0.92, + "learning_rate": 8.291203845138179e-08, + "loss": 1.1027, + "step": 30548 + }, + { + "epoch": 0.92, + "learning_rate": 8.284975250573646e-08, + "loss": 1.1443, + "step": 30549 + }, + { + "epoch": 0.92, + "learning_rate": 8.278748957019717e-08, + "loss": 1.05, + "step": 30550 + }, + { + "epoch": 0.92, + "learning_rate": 8.272524964535733e-08, + "loss": 1.101, + "step": 30551 + }, + { + "epoch": 0.92, + "learning_rate": 8.26630327318087e-08, + "loss": 1.0634, + "step": 30552 + }, + { + "epoch": 0.92, + "learning_rate": 8.260083883014358e-08, + "loss": 1.0057, + "step": 30553 + }, + { + "epoch": 0.92, + "learning_rate": 8.253866794095456e-08, + "loss": 1.0273, + "step": 30554 + }, + { + "epoch": 0.92, + "learning_rate": 8.247652006483281e-08, + "loss": 1.1104, + "step": 30555 + }, + { + "epoch": 0.92, + "learning_rate": 8.241439520237037e-08, + "loss": 1.0883, + "step": 30556 + }, + { + "epoch": 0.92, + "learning_rate": 8.235229335415845e-08, + "loss": 1.0142, + "step": 30557 + }, + { + "epoch": 0.92, + "learning_rate": 8.229021452078823e-08, + "loss": 1.0903, + "step": 30558 + }, + { + "epoch": 0.92, + "learning_rate": 8.222815870285116e-08, + "loss": 1.0501, + "step": 30559 + }, + { + "epoch": 0.92, + "learning_rate": 8.216612590093737e-08, + "loss": 1.0735, + "step": 30560 + }, + { + "epoch": 0.92, + "learning_rate": 8.210411611563773e-08, + "loss": 1.1668, + "step": 30561 + }, + { + "epoch": 0.92, + "learning_rate": 8.204212934754207e-08, + "loss": 1.1851, + "step": 30562 + }, + { + "epoch": 0.92, + "learning_rate": 8.198016559724132e-08, + "loss": 1.0135, + "step": 30563 + }, + { + "epoch": 0.92, + "learning_rate": 8.191822486532441e-08, + "loss": 1.1516, + "step": 30564 + }, + { + "epoch": 0.92, + "learning_rate": 8.185630715238147e-08, + "loss": 1.1046, + "step": 30565 + }, + { + "epoch": 0.92, + "learning_rate": 8.179441245900199e-08, + "loss": 1.1033, + "step": 30566 + }, + { + "epoch": 0.92, + "learning_rate": 8.173254078577498e-08, + "loss": 1.0989, + "step": 30567 + }, + { + "epoch": 0.92, + "learning_rate": 8.167069213328966e-08, + "loss": 1.1301, + "step": 30568 + }, + { + "epoch": 0.92, + "learning_rate": 8.160886650213445e-08, + "loss": 1.201, + "step": 30569 + }, + { + "epoch": 0.92, + "learning_rate": 8.154706389289807e-08, + "loss": 1.0704, + "step": 30570 + }, + { + "epoch": 0.92, + "learning_rate": 8.148528430616892e-08, + "loss": 1.0829, + "step": 30571 + }, + { + "epoch": 0.92, + "learning_rate": 8.142352774253543e-08, + "loss": 1.063, + "step": 30572 + }, + { + "epoch": 0.92, + "learning_rate": 8.136179420258461e-08, + "loss": 0.9626, + "step": 30573 + }, + { + "epoch": 0.92, + "learning_rate": 8.130008368690489e-08, + "loss": 1.1294, + "step": 30574 + }, + { + "epoch": 0.92, + "learning_rate": 8.123839619608332e-08, + "loss": 1.0543, + "step": 30575 + }, + { + "epoch": 0.92, + "learning_rate": 8.117673173070772e-08, + "loss": 1.0355, + "step": 30576 + }, + { + "epoch": 0.92, + "learning_rate": 8.111509029136433e-08, + "loss": 1.0939, + "step": 30577 + }, + { + "epoch": 0.92, + "learning_rate": 8.105347187864044e-08, + "loss": 1.1318, + "step": 30578 + }, + { + "epoch": 0.92, + "learning_rate": 8.099187649312223e-08, + "loss": 1.1124, + "step": 30579 + }, + { + "epoch": 0.92, + "learning_rate": 8.093030413539648e-08, + "loss": 1.1084, + "step": 30580 + }, + { + "epoch": 0.92, + "learning_rate": 8.086875480604911e-08, + "loss": 1.2719, + "step": 30581 + }, + { + "epoch": 0.92, + "learning_rate": 8.08072285056663e-08, + "loss": 1.0742, + "step": 30582 + }, + { + "epoch": 0.92, + "learning_rate": 8.074572523483342e-08, + "loss": 1.0484, + "step": 30583 + }, + { + "epoch": 0.92, + "learning_rate": 8.068424499413586e-08, + "loss": 1.085, + "step": 30584 + }, + { + "epoch": 0.92, + "learning_rate": 8.062278778415977e-08, + "loss": 1.1362, + "step": 30585 + }, + { + "epoch": 0.92, + "learning_rate": 8.056135360548889e-08, + "loss": 1.1782, + "step": 30586 + }, + { + "epoch": 0.92, + "learning_rate": 8.049994245870884e-08, + "loss": 1.1513, + "step": 30587 + }, + { + "epoch": 0.92, + "learning_rate": 8.043855434440417e-08, + "loss": 1.1465, + "step": 30588 + }, + { + "epoch": 0.92, + "learning_rate": 8.03771892631594e-08, + "loss": 1.0614, + "step": 30589 + }, + { + "epoch": 0.92, + "learning_rate": 8.031584721555796e-08, + "loss": 1.0335, + "step": 30590 + }, + { + "epoch": 0.92, + "learning_rate": 8.025452820218465e-08, + "loss": 1.1329, + "step": 30591 + }, + { + "epoch": 0.92, + "learning_rate": 8.019323222362263e-08, + "loss": 1.0732, + "step": 30592 + }, + { + "epoch": 0.92, + "learning_rate": 8.013195928045559e-08, + "loss": 1.1572, + "step": 30593 + }, + { + "epoch": 0.92, + "learning_rate": 8.007070937326722e-08, + "loss": 1.1501, + "step": 30594 + }, + { + "epoch": 0.92, + "learning_rate": 8.000948250263985e-08, + "loss": 1.165, + "step": 30595 + }, + { + "epoch": 0.92, + "learning_rate": 7.994827866915689e-08, + "loss": 1.1085, + "step": 30596 + }, + { + "epoch": 0.92, + "learning_rate": 7.988709787340066e-08, + "loss": 1.1391, + "step": 30597 + }, + { + "epoch": 0.92, + "learning_rate": 7.982594011595374e-08, + "loss": 1.0449, + "step": 30598 + }, + { + "epoch": 0.92, + "learning_rate": 7.976480539739844e-08, + "loss": 1.0677, + "step": 30599 + }, + { + "epoch": 0.92, + "learning_rate": 7.970369371831627e-08, + "loss": 1.1476, + "step": 30600 + }, + { + "epoch": 0.92, + "learning_rate": 7.964260507928922e-08, + "loss": 1.0673, + "step": 30601 + }, + { + "epoch": 0.92, + "learning_rate": 7.958153948089936e-08, + "loss": 1.1002, + "step": 30602 + }, + { + "epoch": 0.92, + "learning_rate": 7.952049692372732e-08, + "loss": 1.0645, + "step": 30603 + }, + { + "epoch": 0.92, + "learning_rate": 7.945947740835402e-08, + "loss": 1.0286, + "step": 30604 + }, + { + "epoch": 0.92, + "learning_rate": 7.939848093536095e-08, + "loss": 1.0975, + "step": 30605 + }, + { + "epoch": 0.92, + "learning_rate": 7.933750750532876e-08, + "loss": 1.0598, + "step": 30606 + }, + { + "epoch": 0.92, + "learning_rate": 7.927655711883753e-08, + "loss": 1.0823, + "step": 30607 + }, + { + "epoch": 0.92, + "learning_rate": 7.921562977646735e-08, + "loss": 1.0822, + "step": 30608 + }, + { + "epoch": 0.92, + "learning_rate": 7.915472547879888e-08, + "loss": 1.0577, + "step": 30609 + }, + { + "epoch": 0.92, + "learning_rate": 7.909384422641108e-08, + "loss": 1.0541, + "step": 30610 + }, + { + "epoch": 0.92, + "learning_rate": 7.903298601988463e-08, + "loss": 1.1808, + "step": 30611 + }, + { + "epoch": 0.92, + "learning_rate": 7.897215085979764e-08, + "loss": 1.1544, + "step": 30612 + }, + { + "epoch": 0.92, + "learning_rate": 7.891133874672996e-08, + "loss": 1.0802, + "step": 30613 + }, + { + "epoch": 0.92, + "learning_rate": 7.885054968126e-08, + "loss": 1.0895, + "step": 30614 + }, + { + "epoch": 0.92, + "learning_rate": 7.878978366396728e-08, + "loss": 1.058, + "step": 30615 + }, + { + "epoch": 0.92, + "learning_rate": 7.872904069542942e-08, + "loss": 1.1178, + "step": 30616 + }, + { + "epoch": 0.92, + "learning_rate": 7.866832077622483e-08, + "loss": 1.1858, + "step": 30617 + }, + { + "epoch": 0.92, + "learning_rate": 7.860762390693193e-08, + "loss": 0.9603, + "step": 30618 + }, + { + "epoch": 0.92, + "learning_rate": 7.854695008812807e-08, + "loss": 1.0609, + "step": 30619 + }, + { + "epoch": 0.92, + "learning_rate": 7.848629932039137e-08, + "loss": 1.0275, + "step": 30620 + }, + { + "epoch": 0.92, + "learning_rate": 7.842567160429832e-08, + "loss": 1.0592, + "step": 30621 + }, + { + "epoch": 0.92, + "learning_rate": 7.836506694042705e-08, + "loss": 1.1694, + "step": 30622 + }, + { + "epoch": 0.92, + "learning_rate": 7.83044853293538e-08, + "loss": 1.1402, + "step": 30623 + }, + { + "epoch": 0.92, + "learning_rate": 7.824392677165587e-08, + "loss": 1.1599, + "step": 30624 + }, + { + "epoch": 0.92, + "learning_rate": 7.818339126790892e-08, + "loss": 1.104, + "step": 30625 + }, + { + "epoch": 0.92, + "learning_rate": 7.812287881868997e-08, + "loss": 1.1316, + "step": 30626 + }, + { + "epoch": 0.92, + "learning_rate": 7.806238942457467e-08, + "loss": 1.012, + "step": 30627 + }, + { + "epoch": 0.92, + "learning_rate": 7.800192308613924e-08, + "loss": 1.0432, + "step": 30628 + }, + { + "epoch": 0.92, + "learning_rate": 7.794147980395878e-08, + "loss": 0.9991, + "step": 30629 + }, + { + "epoch": 0.92, + "learning_rate": 7.788105957860892e-08, + "loss": 1.1276, + "step": 30630 + }, + { + "epoch": 0.92, + "learning_rate": 7.782066241066477e-08, + "loss": 1.0999, + "step": 30631 + }, + { + "epoch": 0.92, + "learning_rate": 7.776028830070142e-08, + "loss": 1.0798, + "step": 30632 + }, + { + "epoch": 0.92, + "learning_rate": 7.769993724929398e-08, + "loss": 1.0998, + "step": 30633 + }, + { + "epoch": 0.92, + "learning_rate": 7.763960925701613e-08, + "loss": 1.1025, + "step": 30634 + }, + { + "epoch": 0.92, + "learning_rate": 7.757930432444244e-08, + "loss": 1.1008, + "step": 30635 + }, + { + "epoch": 0.92, + "learning_rate": 7.751902245214715e-08, + "loss": 1.1185, + "step": 30636 + }, + { + "epoch": 0.92, + "learning_rate": 7.745876364070399e-08, + "loss": 1.1906, + "step": 30637 + }, + { + "epoch": 0.92, + "learning_rate": 7.739852789068692e-08, + "loss": 0.9509, + "step": 30638 + }, + { + "epoch": 0.92, + "learning_rate": 7.733831520266882e-08, + "loss": 1.1423, + "step": 30639 + }, + { + "epoch": 0.92, + "learning_rate": 7.727812557722314e-08, + "loss": 1.0574, + "step": 30640 + }, + { + "epoch": 0.92, + "learning_rate": 7.72179590149233e-08, + "loss": 1.0655, + "step": 30641 + }, + { + "epoch": 0.92, + "learning_rate": 7.715781551634133e-08, + "loss": 1.0873, + "step": 30642 + }, + { + "epoch": 0.92, + "learning_rate": 7.709769508205012e-08, + "loss": 0.9855, + "step": 30643 + }, + { + "epoch": 0.92, + "learning_rate": 7.703759771262199e-08, + "loss": 1.1409, + "step": 30644 + }, + { + "epoch": 0.92, + "learning_rate": 7.697752340862896e-08, + "loss": 1.0752, + "step": 30645 + }, + { + "epoch": 0.92, + "learning_rate": 7.69174721706431e-08, + "loss": 1.1098, + "step": 30646 + }, + { + "epoch": 0.92, + "learning_rate": 7.685744399923589e-08, + "loss": 0.9827, + "step": 30647 + }, + { + "epoch": 0.92, + "learning_rate": 7.679743889497854e-08, + "loss": 1.1846, + "step": 30648 + }, + { + "epoch": 0.92, + "learning_rate": 7.673745685844253e-08, + "loss": 1.122, + "step": 30649 + }, + { + "epoch": 0.92, + "learning_rate": 7.667749789019907e-08, + "loss": 1.029, + "step": 30650 + }, + { + "epoch": 0.92, + "learning_rate": 7.661756199081855e-08, + "loss": 1.0733, + "step": 30651 + }, + { + "epoch": 0.92, + "learning_rate": 7.655764916087189e-08, + "loss": 1.1695, + "step": 30652 + }, + { + "epoch": 0.92, + "learning_rate": 7.649775940092891e-08, + "loss": 1.0843, + "step": 30653 + }, + { + "epoch": 0.92, + "learning_rate": 7.643789271156054e-08, + "loss": 1.0363, + "step": 30654 + }, + { + "epoch": 0.92, + "learning_rate": 7.63780490933358e-08, + "loss": 1.1336, + "step": 30655 + }, + { + "epoch": 0.92, + "learning_rate": 7.631822854682502e-08, + "loss": 1.1376, + "step": 30656 + }, + { + "epoch": 0.92, + "learning_rate": 7.625843107259723e-08, + "loss": 1.0814, + "step": 30657 + }, + { + "epoch": 0.92, + "learning_rate": 7.619865667122167e-08, + "loss": 1.1558, + "step": 30658 + }, + { + "epoch": 0.92, + "learning_rate": 7.613890534326818e-08, + "loss": 1.0652, + "step": 30659 + }, + { + "epoch": 0.92, + "learning_rate": 7.607917708930435e-08, + "loss": 1.0194, + "step": 30660 + }, + { + "epoch": 0.92, + "learning_rate": 7.601947190989972e-08, + "loss": 1.0654, + "step": 30661 + }, + { + "epoch": 0.92, + "learning_rate": 7.59597898056219e-08, + "loss": 1.0372, + "step": 30662 + }, + { + "epoch": 0.92, + "learning_rate": 7.590013077703962e-08, + "loss": 1.1396, + "step": 30663 + }, + { + "epoch": 0.92, + "learning_rate": 7.584049482472072e-08, + "loss": 1.0148, + "step": 30664 + }, + { + "epoch": 0.92, + "learning_rate": 7.578088194923256e-08, + "loss": 1.0956, + "step": 30665 + }, + { + "epoch": 0.92, + "learning_rate": 7.572129215114299e-08, + "loss": 1.1593, + "step": 30666 + }, + { + "epoch": 0.92, + "learning_rate": 7.566172543101935e-08, + "loss": 1.1046, + "step": 30667 + }, + { + "epoch": 0.92, + "learning_rate": 7.56021817894284e-08, + "loss": 1.1355, + "step": 30668 + }, + { + "epoch": 0.92, + "learning_rate": 7.554266122693693e-08, + "loss": 1.1516, + "step": 30669 + }, + { + "epoch": 0.92, + "learning_rate": 7.548316374411169e-08, + "loss": 1.1938, + "step": 30670 + }, + { + "epoch": 0.92, + "learning_rate": 7.542368934151889e-08, + "loss": 1.0941, + "step": 30671 + }, + { + "epoch": 0.92, + "learning_rate": 7.536423801972531e-08, + "loss": 1.0675, + "step": 30672 + }, + { + "epoch": 0.92, + "learning_rate": 7.530480977929605e-08, + "loss": 1.1665, + "step": 30673 + }, + { + "epoch": 0.92, + "learning_rate": 7.524540462079732e-08, + "loss": 1.1281, + "step": 30674 + }, + { + "epoch": 0.92, + "learning_rate": 7.518602254479451e-08, + "loss": 1.1456, + "step": 30675 + }, + { + "epoch": 0.92, + "learning_rate": 7.512666355185299e-08, + "loss": 1.0975, + "step": 30676 + }, + { + "epoch": 0.92, + "learning_rate": 7.506732764253787e-08, + "loss": 1.0509, + "step": 30677 + }, + { + "epoch": 0.92, + "learning_rate": 7.50080148174137e-08, + "loss": 1.0517, + "step": 30678 + }, + { + "epoch": 0.92, + "learning_rate": 7.494872507704531e-08, + "loss": 1.1227, + "step": 30679 + }, + { + "epoch": 0.92, + "learning_rate": 7.488945842199752e-08, + "loss": 1.0679, + "step": 30680 + }, + { + "epoch": 0.92, + "learning_rate": 7.483021485283376e-08, + "loss": 1.1375, + "step": 30681 + }, + { + "epoch": 0.92, + "learning_rate": 7.47709943701183e-08, + "loss": 1.1508, + "step": 30682 + }, + { + "epoch": 0.92, + "learning_rate": 7.471179697441489e-08, + "loss": 1.1603, + "step": 30683 + }, + { + "epoch": 0.92, + "learning_rate": 7.46526226662872e-08, + "loss": 1.0898, + "step": 30684 + }, + { + "epoch": 0.92, + "learning_rate": 7.45934714462987e-08, + "loss": 1.1282, + "step": 30685 + }, + { + "epoch": 0.92, + "learning_rate": 7.453434331501197e-08, + "loss": 1.022, + "step": 30686 + }, + { + "epoch": 0.92, + "learning_rate": 7.44752382729902e-08, + "loss": 1.2087, + "step": 30687 + }, + { + "epoch": 0.92, + "learning_rate": 7.441615632079596e-08, + "loss": 1.0925, + "step": 30688 + }, + { + "epoch": 0.92, + "learning_rate": 7.43570974589916e-08, + "loss": 1.1952, + "step": 30689 + }, + { + "epoch": 0.92, + "learning_rate": 7.429806168813975e-08, + "loss": 1.1181, + "step": 30690 + }, + { + "epoch": 0.92, + "learning_rate": 7.423904900880185e-08, + "loss": 1.0826, + "step": 30691 + }, + { + "epoch": 0.92, + "learning_rate": 7.418005942154e-08, + "loss": 1.1595, + "step": 30692 + }, + { + "epoch": 0.92, + "learning_rate": 7.412109292691567e-08, + "loss": 1.138, + "step": 30693 + }, + { + "epoch": 0.92, + "learning_rate": 7.406214952549035e-08, + "loss": 1.0889, + "step": 30694 + }, + { + "epoch": 0.92, + "learning_rate": 7.400322921782471e-08, + "loss": 1.1063, + "step": 30695 + }, + { + "epoch": 0.92, + "learning_rate": 7.394433200447997e-08, + "loss": 1.0376, + "step": 30696 + }, + { + "epoch": 0.92, + "learning_rate": 7.388545788601681e-08, + "loss": 0.9965, + "step": 30697 + }, + { + "epoch": 0.92, + "learning_rate": 7.382660686299587e-08, + "loss": 1.1772, + "step": 30698 + }, + { + "epoch": 0.92, + "learning_rate": 7.376777893597697e-08, + "loss": 1.0776, + "step": 30699 + }, + { + "epoch": 0.92, + "learning_rate": 7.370897410552025e-08, + "loss": 1.0886, + "step": 30700 + }, + { + "epoch": 0.92, + "learning_rate": 7.365019237218552e-08, + "loss": 1.163, + "step": 30701 + }, + { + "epoch": 0.92, + "learning_rate": 7.35914337365326e-08, + "loss": 1.0336, + "step": 30702 + }, + { + "epoch": 0.92, + "learning_rate": 7.353269819912051e-08, + "loss": 1.1246, + "step": 30703 + }, + { + "epoch": 0.92, + "learning_rate": 7.347398576050852e-08, + "loss": 1.1182, + "step": 30704 + }, + { + "epoch": 0.92, + "learning_rate": 7.341529642125533e-08, + "loss": 1.1709, + "step": 30705 + }, + { + "epoch": 0.93, + "learning_rate": 7.335663018192024e-08, + "loss": 1.21, + "step": 30706 + }, + { + "epoch": 0.93, + "learning_rate": 7.329798704306112e-08, + "loss": 1.075, + "step": 30707 + }, + { + "epoch": 0.93, + "learning_rate": 7.323936700523615e-08, + "loss": 1.06, + "step": 30708 + }, + { + "epoch": 0.93, + "learning_rate": 7.318077006900404e-08, + "loss": 1.1212, + "step": 30709 + }, + { + "epoch": 0.93, + "learning_rate": 7.312219623492184e-08, + "loss": 1.0229, + "step": 30710 + }, + { + "epoch": 0.93, + "learning_rate": 7.306364550354799e-08, + "loss": 1.0942, + "step": 30711 + }, + { + "epoch": 0.93, + "learning_rate": 7.300511787543902e-08, + "loss": 1.0807, + "step": 30712 + }, + { + "epoch": 0.93, + "learning_rate": 7.29466133511525e-08, + "loss": 1.1318, + "step": 30713 + }, + { + "epoch": 0.93, + "learning_rate": 7.288813193124522e-08, + "loss": 1.1026, + "step": 30714 + }, + { + "epoch": 0.93, + "learning_rate": 7.282967361627424e-08, + "loss": 1.1161, + "step": 30715 + }, + { + "epoch": 0.93, + "learning_rate": 7.277123840679579e-08, + "loss": 1.0812, + "step": 30716 + }, + { + "epoch": 0.93, + "learning_rate": 7.271282630336579e-08, + "loss": 1.1769, + "step": 30717 + }, + { + "epoch": 0.93, + "learning_rate": 7.265443730654103e-08, + "loss": 1.2069, + "step": 30718 + }, + { + "epoch": 0.93, + "learning_rate": 7.259607141687664e-08, + "loss": 1.1172, + "step": 30719 + }, + { + "epoch": 0.93, + "learning_rate": 7.253772863492881e-08, + "loss": 1.111, + "step": 30720 + }, + { + "epoch": 0.93, + "learning_rate": 7.247940896125266e-08, + "loss": 1.1535, + "step": 30721 + }, + { + "epoch": 0.93, + "learning_rate": 7.242111239640331e-08, + "loss": 1.1101, + "step": 30722 + }, + { + "epoch": 0.93, + "learning_rate": 7.236283894093615e-08, + "loss": 1.1687, + "step": 30723 + }, + { + "epoch": 0.93, + "learning_rate": 7.230458859540517e-08, + "loss": 0.971, + "step": 30724 + }, + { + "epoch": 0.93, + "learning_rate": 7.22463613603655e-08, + "loss": 1.0965, + "step": 30725 + }, + { + "epoch": 0.93, + "learning_rate": 7.218815723637112e-08, + "loss": 1.0715, + "step": 30726 + }, + { + "epoch": 0.93, + "learning_rate": 7.212997622397633e-08, + "loss": 1.0887, + "step": 30727 + }, + { + "epoch": 0.93, + "learning_rate": 7.207181832373483e-08, + "loss": 1.0558, + "step": 30728 + }, + { + "epoch": 0.93, + "learning_rate": 7.201368353620036e-08, + "loss": 1.0311, + "step": 30729 + }, + { + "epoch": 0.93, + "learning_rate": 7.19555718619261e-08, + "loss": 1.1321, + "step": 30730 + }, + { + "epoch": 0.93, + "learning_rate": 7.189748330146545e-08, + "loss": 1.0734, + "step": 30731 + }, + { + "epoch": 0.93, + "learning_rate": 7.183941785537163e-08, + "loss": 0.9744, + "step": 30732 + }, + { + "epoch": 0.93, + "learning_rate": 7.178137552419667e-08, + "loss": 1.0937, + "step": 30733 + }, + { + "epoch": 0.93, + "learning_rate": 7.172335630849375e-08, + "loss": 1.1313, + "step": 30734 + }, + { + "epoch": 0.93, + "learning_rate": 7.166536020881493e-08, + "loss": 1.1775, + "step": 30735 + }, + { + "epoch": 0.93, + "learning_rate": 7.160738722571254e-08, + "loss": 1.238, + "step": 30736 + }, + { + "epoch": 0.93, + "learning_rate": 7.154943735973807e-08, + "loss": 1.0865, + "step": 30737 + }, + { + "epoch": 0.93, + "learning_rate": 7.149151061144333e-08, + "loss": 1.1992, + "step": 30738 + }, + { + "epoch": 0.93, + "learning_rate": 7.14336069813798e-08, + "loss": 1.1265, + "step": 30739 + }, + { + "epoch": 0.93, + "learning_rate": 7.137572647009872e-08, + "loss": 1.0411, + "step": 30740 + }, + { + "epoch": 0.93, + "learning_rate": 7.13178690781513e-08, + "loss": 1.136, + "step": 30741 + }, + { + "epoch": 0.93, + "learning_rate": 7.126003480608795e-08, + "loss": 1.0416, + "step": 30742 + }, + { + "epoch": 0.93, + "learning_rate": 7.120222365445906e-08, + "loss": 1.1703, + "step": 30743 + }, + { + "epoch": 0.93, + "learning_rate": 7.114443562381557e-08, + "loss": 1.0835, + "step": 30744 + }, + { + "epoch": 0.93, + "learning_rate": 7.108667071470704e-08, + "loss": 1.0715, + "step": 30745 + }, + { + "epoch": 0.93, + "learning_rate": 7.10289289276836e-08, + "loss": 1.0442, + "step": 30746 + }, + { + "epoch": 0.93, + "learning_rate": 7.097121026329507e-08, + "loss": 1.0239, + "step": 30747 + }, + { + "epoch": 0.93, + "learning_rate": 7.091351472209074e-08, + "loss": 1.0775, + "step": 30748 + }, + { + "epoch": 0.93, + "learning_rate": 7.085584230462017e-08, + "loss": 1.0516, + "step": 30749 + }, + { + "epoch": 0.93, + "learning_rate": 7.079819301143154e-08, + "loss": 1.1494, + "step": 30750 + }, + { + "epoch": 0.93, + "learning_rate": 7.07405668430744e-08, + "loss": 1.0337, + "step": 30751 + }, + { + "epoch": 0.93, + "learning_rate": 7.068296380009721e-08, + "loss": 1.1262, + "step": 30752 + }, + { + "epoch": 0.93, + "learning_rate": 7.062538388304785e-08, + "loss": 1.0052, + "step": 30753 + }, + { + "epoch": 0.93, + "learning_rate": 7.056782709247533e-08, + "loss": 1.1575, + "step": 30754 + }, + { + "epoch": 0.93, + "learning_rate": 7.051029342892673e-08, + "loss": 1.1248, + "step": 30755 + }, + { + "epoch": 0.93, + "learning_rate": 7.045278289294993e-08, + "loss": 1.1708, + "step": 30756 + }, + { + "epoch": 0.93, + "learning_rate": 7.039529548509283e-08, + "loss": 1.1108, + "step": 30757 + }, + { + "epoch": 0.93, + "learning_rate": 7.033783120590221e-08, + "loss": 1.1567, + "step": 30758 + }, + { + "epoch": 0.93, + "learning_rate": 7.02803900559254e-08, + "loss": 1.198, + "step": 30759 + }, + { + "epoch": 0.93, + "learning_rate": 7.022297203570893e-08, + "loss": 1.0408, + "step": 30760 + }, + { + "epoch": 0.93, + "learning_rate": 7.016557714579958e-08, + "loss": 1.2306, + "step": 30761 + }, + { + "epoch": 0.93, + "learning_rate": 7.010820538674385e-08, + "loss": 1.1153, + "step": 30762 + }, + { + "epoch": 0.93, + "learning_rate": 7.00508567590874e-08, + "loss": 1.062, + "step": 30763 + }, + { + "epoch": 0.93, + "learning_rate": 6.999353126337677e-08, + "loss": 1.0692, + "step": 30764 + }, + { + "epoch": 0.93, + "learning_rate": 6.993622890015706e-08, + "loss": 1.0834, + "step": 30765 + }, + { + "epoch": 0.93, + "learning_rate": 6.987894966997422e-08, + "loss": 1.04, + "step": 30766 + }, + { + "epoch": 0.93, + "learning_rate": 6.982169357337393e-08, + "loss": 1.1181, + "step": 30767 + }, + { + "epoch": 0.93, + "learning_rate": 6.97644606109002e-08, + "loss": 1.1124, + "step": 30768 + }, + { + "epoch": 0.93, + "learning_rate": 6.970725078309814e-08, + "loss": 1.0764, + "step": 30769 + }, + { + "epoch": 0.93, + "learning_rate": 6.96500640905129e-08, + "loss": 1.0857, + "step": 30770 + }, + { + "epoch": 0.93, + "learning_rate": 6.959290053368845e-08, + "loss": 1.059, + "step": 30771 + }, + { + "epoch": 0.93, + "learning_rate": 6.953576011316909e-08, + "loss": 1.1082, + "step": 30772 + }, + { + "epoch": 0.93, + "learning_rate": 6.947864282949884e-08, + "loss": 1.1439, + "step": 30773 + }, + { + "epoch": 0.93, + "learning_rate": 6.942154868322116e-08, + "loss": 1.1569, + "step": 30774 + }, + { + "epoch": 0.93, + "learning_rate": 6.936447767488002e-08, + "loss": 1.0706, + "step": 30775 + }, + { + "epoch": 0.93, + "learning_rate": 6.930742980501836e-08, + "loss": 1.0485, + "step": 30776 + }, + { + "epoch": 0.93, + "learning_rate": 6.925040507417907e-08, + "loss": 1.0971, + "step": 30777 + }, + { + "epoch": 0.93, + "learning_rate": 6.919340348290532e-08, + "loss": 1.0084, + "step": 30778 + }, + { + "epoch": 0.93, + "learning_rate": 6.913642503173945e-08, + "loss": 1.1305, + "step": 30779 + }, + { + "epoch": 0.93, + "learning_rate": 6.907946972122464e-08, + "loss": 1.0756, + "step": 30780 + }, + { + "epoch": 0.93, + "learning_rate": 6.902253755190214e-08, + "loss": 1.1714, + "step": 30781 + }, + { + "epoch": 0.93, + "learning_rate": 6.896562852431427e-08, + "loss": 1.1064, + "step": 30782 + }, + { + "epoch": 0.93, + "learning_rate": 6.890874263900282e-08, + "loss": 1.0712, + "step": 30783 + }, + { + "epoch": 0.93, + "learning_rate": 6.88518798965096e-08, + "loss": 1.0967, + "step": 30784 + }, + { + "epoch": 0.93, + "learning_rate": 6.879504029737499e-08, + "loss": 1.1074, + "step": 30785 + }, + { + "epoch": 0.93, + "learning_rate": 6.873822384214107e-08, + "loss": 1.0457, + "step": 30786 + }, + { + "epoch": 0.93, + "learning_rate": 6.868143053134823e-08, + "loss": 1.0732, + "step": 30787 + }, + { + "epoch": 0.93, + "learning_rate": 6.862466036553744e-08, + "loss": 1.1296, + "step": 30788 + }, + { + "epoch": 0.93, + "learning_rate": 6.856791334524854e-08, + "loss": 0.9824, + "step": 30789 + }, + { + "epoch": 0.93, + "learning_rate": 6.85111894710222e-08, + "loss": 1.0837, + "step": 30790 + }, + { + "epoch": 0.93, + "learning_rate": 6.845448874339828e-08, + "loss": 1.1108, + "step": 30791 + }, + { + "epoch": 0.93, + "learning_rate": 6.83978111629166e-08, + "loss": 1.1322, + "step": 30792 + }, + { + "epoch": 0.93, + "learning_rate": 6.834115673011676e-08, + "loss": 1.0284, + "step": 30793 + }, + { + "epoch": 0.93, + "learning_rate": 6.828452544553804e-08, + "loss": 1.1453, + "step": 30794 + }, + { + "epoch": 0.93, + "learning_rate": 6.822791730971917e-08, + "loss": 1.0989, + "step": 30795 + }, + { + "epoch": 0.93, + "learning_rate": 6.817133232319945e-08, + "loss": 1.0936, + "step": 30796 + }, + { + "epoch": 0.93, + "learning_rate": 6.811477048651733e-08, + "loss": 1.0264, + "step": 30797 + }, + { + "epoch": 0.93, + "learning_rate": 6.805823180021182e-08, + "loss": 1.055, + "step": 30798 + }, + { + "epoch": 0.93, + "learning_rate": 6.800171626482028e-08, + "loss": 1.0484, + "step": 30799 + }, + { + "epoch": 0.93, + "learning_rate": 6.794522388088116e-08, + "loss": 1.1406, + "step": 30800 + }, + { + "epoch": 0.93, + "learning_rate": 6.788875464893235e-08, + "loss": 1.0436, + "step": 30801 + }, + { + "epoch": 0.93, + "learning_rate": 6.783230856951095e-08, + "loss": 1.1438, + "step": 30802 + }, + { + "epoch": 0.93, + "learning_rate": 6.777588564315485e-08, + "loss": 0.9891, + "step": 30803 + }, + { + "epoch": 0.93, + "learning_rate": 6.771948587040084e-08, + "loss": 1.1594, + "step": 30804 + }, + { + "epoch": 0.93, + "learning_rate": 6.76631092517857e-08, + "loss": 1.2147, + "step": 30805 + }, + { + "epoch": 0.93, + "learning_rate": 6.760675578784681e-08, + "loss": 1.1118, + "step": 30806 + }, + { + "epoch": 0.93, + "learning_rate": 6.755042547911983e-08, + "loss": 1.0166, + "step": 30807 + }, + { + "epoch": 0.93, + "learning_rate": 6.749411832614127e-08, + "loss": 1.1112, + "step": 30808 + }, + { + "epoch": 0.93, + "learning_rate": 6.743783432944712e-08, + "loss": 1.0369, + "step": 30809 + }, + { + "epoch": 0.93, + "learning_rate": 6.738157348957358e-08, + "loss": 1.0752, + "step": 30810 + }, + { + "epoch": 0.93, + "learning_rate": 6.732533580705552e-08, + "loss": 1.1857, + "step": 30811 + }, + { + "epoch": 0.93, + "learning_rate": 6.726912128242862e-08, + "loss": 1.1941, + "step": 30812 + }, + { + "epoch": 0.93, + "learning_rate": 6.721292991622802e-08, + "loss": 1.0972, + "step": 30813 + }, + { + "epoch": 0.93, + "learning_rate": 6.71567617089891e-08, + "loss": 1.1719, + "step": 30814 + }, + { + "epoch": 0.93, + "learning_rate": 6.710061666124562e-08, + "loss": 1.0741, + "step": 30815 + }, + { + "epoch": 0.93, + "learning_rate": 6.70444947735327e-08, + "loss": 0.9015, + "step": 30816 + }, + { + "epoch": 0.93, + "learning_rate": 6.698839604638436e-08, + "loss": 1.1161, + "step": 30817 + }, + { + "epoch": 0.93, + "learning_rate": 6.693232048033488e-08, + "loss": 1.0814, + "step": 30818 + }, + { + "epoch": 0.93, + "learning_rate": 6.687626807591802e-08, + "loss": 0.9781, + "step": 30819 + }, + { + "epoch": 0.93, + "learning_rate": 6.682023883366695e-08, + "loss": 1.1339, + "step": 30820 + }, + { + "epoch": 0.93, + "learning_rate": 6.676423275411543e-08, + "loss": 1.1399, + "step": 30821 + }, + { + "epoch": 0.93, + "learning_rate": 6.670824983779634e-08, + "loss": 1.2057, + "step": 30822 + }, + { + "epoch": 0.93, + "learning_rate": 6.665229008524344e-08, + "loss": 1.1254, + "step": 30823 + }, + { + "epoch": 0.93, + "learning_rate": 6.659635349698824e-08, + "loss": 1.1173, + "step": 30824 + }, + { + "epoch": 0.93, + "learning_rate": 6.654044007356392e-08, + "loss": 1.2308, + "step": 30825 + }, + { + "epoch": 0.93, + "learning_rate": 6.648454981550256e-08, + "loss": 1.0899, + "step": 30826 + }, + { + "epoch": 0.93, + "learning_rate": 6.642868272333624e-08, + "loss": 1.111, + "step": 30827 + }, + { + "epoch": 0.93, + "learning_rate": 6.637283879759676e-08, + "loss": 1.1253, + "step": 30828 + }, + { + "epoch": 0.93, + "learning_rate": 6.63170180388159e-08, + "loss": 1.1411, + "step": 30829 + }, + { + "epoch": 0.93, + "learning_rate": 6.626122044752493e-08, + "loss": 1.1605, + "step": 30830 + }, + { + "epoch": 0.93, + "learning_rate": 6.620544602425505e-08, + "loss": 1.1309, + "step": 30831 + }, + { + "epoch": 0.93, + "learning_rate": 6.614969476953725e-08, + "loss": 1.0281, + "step": 30832 + }, + { + "epoch": 0.93, + "learning_rate": 6.609396668390195e-08, + "loss": 1.055, + "step": 30833 + }, + { + "epoch": 0.93, + "learning_rate": 6.603826176788008e-08, + "loss": 1.0139, + "step": 30834 + }, + { + "epoch": 0.93, + "learning_rate": 6.598258002200154e-08, + "loss": 0.9702, + "step": 30835 + }, + { + "epoch": 0.93, + "learning_rate": 6.59269214467967e-08, + "loss": 1.1152, + "step": 30836 + }, + { + "epoch": 0.93, + "learning_rate": 6.587128604279541e-08, + "loss": 1.2303, + "step": 30837 + }, + { + "epoch": 0.93, + "learning_rate": 6.581567381052673e-08, + "loss": 1.077, + "step": 30838 + }, + { + "epoch": 0.93, + "learning_rate": 6.576008475052076e-08, + "loss": 1.0427, + "step": 30839 + }, + { + "epoch": 0.93, + "learning_rate": 6.570451886330681e-08, + "loss": 0.9981, + "step": 30840 + }, + { + "epoch": 0.93, + "learning_rate": 6.564897614941279e-08, + "loss": 0.9983, + "step": 30841 + }, + { + "epoch": 0.93, + "learning_rate": 6.559345660936828e-08, + "loss": 1.2135, + "step": 30842 + }, + { + "epoch": 0.93, + "learning_rate": 6.553796024370174e-08, + "loss": 1.1733, + "step": 30843 + }, + { + "epoch": 0.93, + "learning_rate": 6.548248705294108e-08, + "loss": 1.1406, + "step": 30844 + }, + { + "epoch": 0.93, + "learning_rate": 6.542703703761505e-08, + "loss": 0.9605, + "step": 30845 + }, + { + "epoch": 0.93, + "learning_rate": 6.5371610198251e-08, + "loss": 0.9961, + "step": 30846 + }, + { + "epoch": 0.93, + "learning_rate": 6.531620653537656e-08, + "loss": 1.1332, + "step": 30847 + }, + { + "epoch": 0.93, + "learning_rate": 6.526082604951912e-08, + "loss": 1.0925, + "step": 30848 + }, + { + "epoch": 0.93, + "learning_rate": 6.520546874120626e-08, + "loss": 1.1119, + "step": 30849 + }, + { + "epoch": 0.93, + "learning_rate": 6.515013461096453e-08, + "loss": 1.0815, + "step": 30850 + }, + { + "epoch": 0.93, + "learning_rate": 6.509482365932074e-08, + "loss": 1.0805, + "step": 30851 + }, + { + "epoch": 0.93, + "learning_rate": 6.503953588680167e-08, + "loss": 1.0201, + "step": 30852 + }, + { + "epoch": 0.93, + "learning_rate": 6.498427129393359e-08, + "loss": 1.0916, + "step": 30853 + }, + { + "epoch": 0.93, + "learning_rate": 6.492902988124245e-08, + "loss": 1.1446, + "step": 30854 + }, + { + "epoch": 0.93, + "learning_rate": 6.487381164925394e-08, + "loss": 1.1567, + "step": 30855 + }, + { + "epoch": 0.93, + "learning_rate": 6.48186165984943e-08, + "loss": 1.0458, + "step": 30856 + }, + { + "epoch": 0.93, + "learning_rate": 6.476344472948842e-08, + "loss": 0.9964, + "step": 30857 + }, + { + "epoch": 0.93, + "learning_rate": 6.470829604276197e-08, + "loss": 1.0895, + "step": 30858 + }, + { + "epoch": 0.93, + "learning_rate": 6.465317053883924e-08, + "loss": 1.1189, + "step": 30859 + }, + { + "epoch": 0.93, + "learning_rate": 6.459806821824565e-08, + "loss": 1.0782, + "step": 30860 + }, + { + "epoch": 0.93, + "learning_rate": 6.454298908150553e-08, + "loss": 1.1669, + "step": 30861 + }, + { + "epoch": 0.93, + "learning_rate": 6.448793312914314e-08, + "loss": 1.1698, + "step": 30862 + }, + { + "epoch": 0.93, + "learning_rate": 6.443290036168282e-08, + "loss": 1.1201, + "step": 30863 + }, + { + "epoch": 0.93, + "learning_rate": 6.437789077964802e-08, + "loss": 1.1348, + "step": 30864 + }, + { + "epoch": 0.93, + "learning_rate": 6.432290438356276e-08, + "loss": 1.0842, + "step": 30865 + }, + { + "epoch": 0.93, + "learning_rate": 6.426794117395053e-08, + "loss": 1.0463, + "step": 30866 + }, + { + "epoch": 0.93, + "learning_rate": 6.421300115133423e-08, + "loss": 1.1008, + "step": 30867 + }, + { + "epoch": 0.93, + "learning_rate": 6.415808431623705e-08, + "loss": 1.1053, + "step": 30868 + }, + { + "epoch": 0.93, + "learning_rate": 6.410319066918164e-08, + "loss": 1.1152, + "step": 30869 + }, + { + "epoch": 0.93, + "learning_rate": 6.404832021069091e-08, + "loss": 1.043, + "step": 30870 + }, + { + "epoch": 0.93, + "learning_rate": 6.399347294128721e-08, + "loss": 1.0164, + "step": 30871 + }, + { + "epoch": 0.93, + "learning_rate": 6.393864886149209e-08, + "loss": 0.9865, + "step": 30872 + }, + { + "epoch": 0.93, + "learning_rate": 6.388384797182761e-08, + "loss": 1.0197, + "step": 30873 + }, + { + "epoch": 0.93, + "learning_rate": 6.382907027281588e-08, + "loss": 1.1812, + "step": 30874 + }, + { + "epoch": 0.93, + "learning_rate": 6.37743157649784e-08, + "loss": 1.0669, + "step": 30875 + }, + { + "epoch": 0.93, + "learning_rate": 6.371958444883558e-08, + "loss": 1.1008, + "step": 30876 + }, + { + "epoch": 0.93, + "learning_rate": 6.366487632490925e-08, + "loss": 1.1152, + "step": 30877 + }, + { + "epoch": 0.93, + "learning_rate": 6.361019139371954e-08, + "loss": 0.9877, + "step": 30878 + }, + { + "epoch": 0.93, + "learning_rate": 6.35555296557877e-08, + "loss": 1.1229, + "step": 30879 + }, + { + "epoch": 0.93, + "learning_rate": 6.350089111163416e-08, + "loss": 1.0869, + "step": 30880 + }, + { + "epoch": 0.93, + "learning_rate": 6.34462757617782e-08, + "loss": 1.1405, + "step": 30881 + }, + { + "epoch": 0.93, + "learning_rate": 6.339168360674025e-08, + "loss": 1.1789, + "step": 30882 + }, + { + "epoch": 0.93, + "learning_rate": 6.33371146470399e-08, + "loss": 1.0963, + "step": 30883 + }, + { + "epoch": 0.93, + "learning_rate": 6.328256888319672e-08, + "loss": 1.0596, + "step": 30884 + }, + { + "epoch": 0.93, + "learning_rate": 6.322804631573005e-08, + "loss": 1.0942, + "step": 30885 + }, + { + "epoch": 0.93, + "learning_rate": 6.317354694515859e-08, + "loss": 1.0983, + "step": 30886 + }, + { + "epoch": 0.93, + "learning_rate": 6.31190707720014e-08, + "loss": 1.2254, + "step": 30887 + }, + { + "epoch": 0.93, + "learning_rate": 6.306461779677753e-08, + "loss": 1.032, + "step": 30888 + }, + { + "epoch": 0.93, + "learning_rate": 6.30101880200043e-08, + "loss": 1.1088, + "step": 30889 + }, + { + "epoch": 0.93, + "learning_rate": 6.29557814422005e-08, + "loss": 1.0834, + "step": 30890 + }, + { + "epoch": 0.93, + "learning_rate": 6.290139806388373e-08, + "loss": 0.9915, + "step": 30891 + }, + { + "epoch": 0.93, + "learning_rate": 6.284703788557223e-08, + "loss": 1.1487, + "step": 30892 + }, + { + "epoch": 0.93, + "learning_rate": 6.279270090778306e-08, + "loss": 1.0583, + "step": 30893 + }, + { + "epoch": 0.93, + "learning_rate": 6.273838713103358e-08, + "loss": 1.0944, + "step": 30894 + }, + { + "epoch": 0.93, + "learning_rate": 6.268409655584062e-08, + "loss": 1.0723, + "step": 30895 + }, + { + "epoch": 0.93, + "learning_rate": 6.262982918272182e-08, + "loss": 1.1932, + "step": 30896 + }, + { + "epoch": 0.93, + "learning_rate": 6.257558501219257e-08, + "loss": 1.2135, + "step": 30897 + }, + { + "epoch": 0.93, + "learning_rate": 6.252136404477e-08, + "loss": 1.0673, + "step": 30898 + }, + { + "epoch": 0.93, + "learning_rate": 6.246716628097005e-08, + "loss": 1.0764, + "step": 30899 + }, + { + "epoch": 0.93, + "learning_rate": 6.241299172130872e-08, + "loss": 1.1578, + "step": 30900 + }, + { + "epoch": 0.93, + "learning_rate": 6.235884036630196e-08, + "loss": 1.043, + "step": 30901 + }, + { + "epoch": 0.93, + "learning_rate": 6.230471221646495e-08, + "loss": 1.0322, + "step": 30902 + }, + { + "epoch": 0.93, + "learning_rate": 6.22506072723128e-08, + "loss": 0.9703, + "step": 30903 + }, + { + "epoch": 0.93, + "learning_rate": 6.219652553436095e-08, + "loss": 1.1196, + "step": 30904 + }, + { + "epoch": 0.93, + "learning_rate": 6.214246700312427e-08, + "loss": 1.1626, + "step": 30905 + }, + { + "epoch": 0.93, + "learning_rate": 6.208843167911705e-08, + "loss": 1.179, + "step": 30906 + }, + { + "epoch": 0.93, + "learning_rate": 6.203441956285389e-08, + "loss": 1.0377, + "step": 30907 + }, + { + "epoch": 0.93, + "learning_rate": 6.198043065484882e-08, + "loss": 1.1041, + "step": 30908 + }, + { + "epoch": 0.93, + "learning_rate": 6.192646495561561e-08, + "loss": 1.0102, + "step": 30909 + }, + { + "epoch": 0.93, + "learning_rate": 6.187252246566855e-08, + "loss": 1.1104, + "step": 30910 + }, + { + "epoch": 0.93, + "learning_rate": 6.181860318552058e-08, + "loss": 1.1157, + "step": 30911 + }, + { + "epoch": 0.93, + "learning_rate": 6.176470711568544e-08, + "loss": 1.1906, + "step": 30912 + }, + { + "epoch": 0.93, + "learning_rate": 6.171083425667607e-08, + "loss": 1.1226, + "step": 30913 + }, + { + "epoch": 0.93, + "learning_rate": 6.165698460900538e-08, + "loss": 1.0537, + "step": 30914 + }, + { + "epoch": 0.93, + "learning_rate": 6.160315817318546e-08, + "loss": 1.0817, + "step": 30915 + }, + { + "epoch": 0.93, + "learning_rate": 6.154935494972925e-08, + "loss": 1.1949, + "step": 30916 + }, + { + "epoch": 0.93, + "learning_rate": 6.149557493914881e-08, + "loss": 1.1405, + "step": 30917 + }, + { + "epoch": 0.93, + "learning_rate": 6.144181814195627e-08, + "loss": 1.0219, + "step": 30918 + }, + { + "epoch": 0.93, + "learning_rate": 6.138808455866285e-08, + "loss": 1.0428, + "step": 30919 + }, + { + "epoch": 0.93, + "learning_rate": 6.133437418978038e-08, + "loss": 1.1264, + "step": 30920 + }, + { + "epoch": 0.93, + "learning_rate": 6.128068703582013e-08, + "loss": 1.1533, + "step": 30921 + }, + { + "epoch": 0.93, + "learning_rate": 6.122702309729362e-08, + "loss": 1.038, + "step": 30922 + }, + { + "epoch": 0.93, + "learning_rate": 6.117338237471099e-08, + "loss": 1.1329, + "step": 30923 + }, + { + "epoch": 0.93, + "learning_rate": 6.111976486858324e-08, + "loss": 1.1113, + "step": 30924 + }, + { + "epoch": 0.93, + "learning_rate": 6.106617057942077e-08, + "loss": 1.0195, + "step": 30925 + }, + { + "epoch": 0.93, + "learning_rate": 6.101259950773347e-08, + "loss": 1.0983, + "step": 30926 + }, + { + "epoch": 0.93, + "learning_rate": 6.095905165403204e-08, + "loss": 0.9696, + "step": 30927 + }, + { + "epoch": 0.93, + "learning_rate": 6.090552701882551e-08, + "loss": 1.0118, + "step": 30928 + }, + { + "epoch": 0.93, + "learning_rate": 6.085202560262349e-08, + "loss": 1.1288, + "step": 30929 + }, + { + "epoch": 0.93, + "learning_rate": 6.079854740593555e-08, + "loss": 1.0632, + "step": 30930 + }, + { + "epoch": 0.93, + "learning_rate": 6.074509242927101e-08, + "loss": 1.0461, + "step": 30931 + }, + { + "epoch": 0.93, + "learning_rate": 6.069166067313808e-08, + "loss": 1.1617, + "step": 30932 + }, + { + "epoch": 0.93, + "learning_rate": 6.063825213804553e-08, + "loss": 1.0812, + "step": 30933 + }, + { + "epoch": 0.93, + "learning_rate": 6.05848668245021e-08, + "loss": 0.9465, + "step": 30934 + }, + { + "epoch": 0.93, + "learning_rate": 6.0531504733016e-08, + "loss": 0.9752, + "step": 30935 + }, + { + "epoch": 0.93, + "learning_rate": 6.047816586409517e-08, + "loss": 1.073, + "step": 30936 + }, + { + "epoch": 0.93, + "learning_rate": 6.042485021824696e-08, + "loss": 1.1833, + "step": 30937 + }, + { + "epoch": 0.93, + "learning_rate": 6.037155779597959e-08, + "loss": 1.0445, + "step": 30938 + }, + { + "epoch": 0.93, + "learning_rate": 6.031828859779987e-08, + "loss": 1.1072, + "step": 30939 + }, + { + "epoch": 0.93, + "learning_rate": 6.026504262421517e-08, + "loss": 1.0637, + "step": 30940 + }, + { + "epoch": 0.93, + "learning_rate": 6.021181987573205e-08, + "loss": 1.0046, + "step": 30941 + }, + { + "epoch": 0.93, + "learning_rate": 6.015862035285758e-08, + "loss": 1.0983, + "step": 30942 + }, + { + "epoch": 0.93, + "learning_rate": 6.010544405609775e-08, + "loss": 1.2784, + "step": 30943 + }, + { + "epoch": 0.93, + "learning_rate": 6.005229098595938e-08, + "loss": 1.0524, + "step": 30944 + }, + { + "epoch": 0.93, + "learning_rate": 5.999916114294763e-08, + "loss": 1.1776, + "step": 30945 + }, + { + "epoch": 0.93, + "learning_rate": 5.994605452756902e-08, + "loss": 1.0074, + "step": 30946 + }, + { + "epoch": 0.93, + "learning_rate": 5.989297114032871e-08, + "loss": 1.0896, + "step": 30947 + }, + { + "epoch": 0.93, + "learning_rate": 5.983991098173214e-08, + "loss": 1.1061, + "step": 30948 + }, + { + "epoch": 0.93, + "learning_rate": 5.978687405228444e-08, + "loss": 1.1756, + "step": 30949 + }, + { + "epoch": 0.93, + "learning_rate": 5.973386035249024e-08, + "loss": 1.164, + "step": 30950 + }, + { + "epoch": 0.93, + "learning_rate": 5.968086988285465e-08, + "loss": 1.0497, + "step": 30951 + }, + { + "epoch": 0.93, + "learning_rate": 5.962790264388174e-08, + "loss": 1.0189, + "step": 30952 + }, + { + "epoch": 0.93, + "learning_rate": 5.95749586360761e-08, + "loss": 1.1367, + "step": 30953 + }, + { + "epoch": 0.93, + "learning_rate": 5.9522037859941204e-08, + "loss": 1.0998, + "step": 30954 + }, + { + "epoch": 0.93, + "learning_rate": 5.946914031598111e-08, + "loss": 1.2452, + "step": 30955 + }, + { + "epoch": 0.93, + "learning_rate": 5.9416266004699577e-08, + "loss": 1.118, + "step": 30956 + }, + { + "epoch": 0.93, + "learning_rate": 5.936341492659981e-08, + "loss": 1.0687, + "step": 30957 + }, + { + "epoch": 0.93, + "learning_rate": 5.931058708218473e-08, + "loss": 1.0703, + "step": 30958 + }, + { + "epoch": 0.93, + "learning_rate": 5.925778247195757e-08, + "loss": 1.1603, + "step": 30959 + }, + { + "epoch": 0.93, + "learning_rate": 5.920500109642069e-08, + "loss": 1.1653, + "step": 30960 + }, + { + "epoch": 0.93, + "learning_rate": 5.9152242956076465e-08, + "loss": 1.0251, + "step": 30961 + }, + { + "epoch": 0.93, + "learning_rate": 5.909950805142783e-08, + "loss": 0.9598, + "step": 30962 + }, + { + "epoch": 0.93, + "learning_rate": 5.9046796382976054e-08, + "loss": 1.0497, + "step": 30963 + }, + { + "epoch": 0.93, + "learning_rate": 5.899410795122296e-08, + "loss": 1.0797, + "step": 30964 + }, + { + "epoch": 0.93, + "learning_rate": 5.8941442756670354e-08, + "loss": 1.09, + "step": 30965 + }, + { + "epoch": 0.93, + "learning_rate": 5.888880079981979e-08, + "loss": 1.1602, + "step": 30966 + }, + { + "epoch": 0.93, + "learning_rate": 5.883618208117198e-08, + "loss": 1.111, + "step": 30967 + }, + { + "epoch": 0.93, + "learning_rate": 5.878358660122818e-08, + "loss": 1.0403, + "step": 30968 + }, + { + "epoch": 0.93, + "learning_rate": 5.8731014360488834e-08, + "loss": 1.1771, + "step": 30969 + }, + { + "epoch": 0.93, + "learning_rate": 5.867846535945465e-08, + "loss": 1.1031, + "step": 30970 + }, + { + "epoch": 0.93, + "learning_rate": 5.86259395986255e-08, + "loss": 1.0783, + "step": 30971 + }, + { + "epoch": 0.93, + "learning_rate": 5.857343707850155e-08, + "loss": 1.1238, + "step": 30972 + }, + { + "epoch": 0.93, + "learning_rate": 5.8520957799582666e-08, + "loss": 1.1032, + "step": 30973 + }, + { + "epoch": 0.93, + "learning_rate": 5.846850176236874e-08, + "loss": 1.0682, + "step": 30974 + }, + { + "epoch": 0.93, + "learning_rate": 5.841606896735852e-08, + "loss": 1.1255, + "step": 30975 + }, + { + "epoch": 0.93, + "learning_rate": 5.8363659415051345e-08, + "loss": 1.0807, + "step": 30976 + }, + { + "epoch": 0.93, + "learning_rate": 5.8311273105946255e-08, + "loss": 1.0077, + "step": 30977 + }, + { + "epoch": 0.93, + "learning_rate": 5.825891004054174e-08, + "loss": 1.0784, + "step": 30978 + }, + { + "epoch": 0.93, + "learning_rate": 5.820657021933685e-08, + "loss": 1.0859, + "step": 30979 + }, + { + "epoch": 0.93, + "learning_rate": 5.815425364282895e-08, + "loss": 1.1349, + "step": 30980 + }, + { + "epoch": 0.93, + "learning_rate": 5.810196031151683e-08, + "loss": 0.9949, + "step": 30981 + }, + { + "epoch": 0.93, + "learning_rate": 5.8049690225897845e-08, + "loss": 1.0942, + "step": 30982 + }, + { + "epoch": 0.93, + "learning_rate": 5.799744338646995e-08, + "loss": 1.0535, + "step": 30983 + }, + { + "epoch": 0.93, + "learning_rate": 5.7945219793729965e-08, + "loss": 1.0581, + "step": 30984 + }, + { + "epoch": 0.93, + "learning_rate": 5.7893019448175545e-08, + "loss": 1.1306, + "step": 30985 + }, + { + "epoch": 0.93, + "learning_rate": 5.784084235030324e-08, + "loss": 1.0345, + "step": 30986 + }, + { + "epoch": 0.93, + "learning_rate": 5.7788688500610145e-08, + "loss": 1.1368, + "step": 30987 + }, + { + "epoch": 0.93, + "learning_rate": 5.7736557899592537e-08, + "loss": 1.0134, + "step": 30988 + }, + { + "epoch": 0.93, + "learning_rate": 5.768445054774641e-08, + "loss": 1.0534, + "step": 30989 + }, + { + "epoch": 0.93, + "learning_rate": 5.7632366445568024e-08, + "loss": 1.1521, + "step": 30990 + }, + { + "epoch": 0.93, + "learning_rate": 5.758030559355338e-08, + "loss": 1.1238, + "step": 30991 + }, + { + "epoch": 0.93, + "learning_rate": 5.7528267992197904e-08, + "loss": 1.1274, + "step": 30992 + }, + { + "epoch": 0.93, + "learning_rate": 5.747625364199705e-08, + "loss": 1.0156, + "step": 30993 + }, + { + "epoch": 0.93, + "learning_rate": 5.742426254344569e-08, + "loss": 1.0529, + "step": 30994 + }, + { + "epoch": 0.93, + "learning_rate": 5.7372294697039255e-08, + "loss": 1.0521, + "step": 30995 + }, + { + "epoch": 0.93, + "learning_rate": 5.732035010327208e-08, + "loss": 1.0987, + "step": 30996 + }, + { + "epoch": 0.93, + "learning_rate": 5.726842876263877e-08, + "loss": 1.1135, + "step": 30997 + }, + { + "epoch": 0.93, + "learning_rate": 5.721653067563337e-08, + "loss": 1.138, + "step": 30998 + }, + { + "epoch": 0.93, + "learning_rate": 5.716465584275022e-08, + "loss": 1.1522, + "step": 30999 + }, + { + "epoch": 0.93, + "learning_rate": 5.7112804264483345e-08, + "loss": 1.081, + "step": 31000 + }, + { + "epoch": 0.93, + "learning_rate": 5.70609759413257e-08, + "loss": 1.0541, + "step": 31001 + }, + { + "epoch": 0.93, + "learning_rate": 5.700917087377106e-08, + "loss": 1.1306, + "step": 31002 + }, + { + "epoch": 0.93, + "learning_rate": 5.695738906231235e-08, + "loss": 1.1525, + "step": 31003 + }, + { + "epoch": 0.93, + "learning_rate": 5.69056305074428e-08, + "loss": 1.1094, + "step": 31004 + }, + { + "epoch": 0.93, + "learning_rate": 5.685389520965534e-08, + "loss": 1.1109, + "step": 31005 + }, + { + "epoch": 0.93, + "learning_rate": 5.6802183169441804e-08, + "loss": 1.0854, + "step": 31006 + }, + { + "epoch": 0.93, + "learning_rate": 5.675049438729485e-08, + "loss": 1.0549, + "step": 31007 + }, + { + "epoch": 0.93, + "learning_rate": 5.669882886370631e-08, + "loss": 1.1214, + "step": 31008 + }, + { + "epoch": 0.93, + "learning_rate": 5.664718659916857e-08, + "loss": 1.0465, + "step": 31009 + }, + { + "epoch": 0.93, + "learning_rate": 5.659556759417262e-08, + "loss": 1.0067, + "step": 31010 + }, + { + "epoch": 0.93, + "learning_rate": 5.654397184921001e-08, + "loss": 1.0523, + "step": 31011 + }, + { + "epoch": 0.93, + "learning_rate": 5.6492399364772024e-08, + "loss": 1.0923, + "step": 31012 + }, + { + "epoch": 0.93, + "learning_rate": 5.644085014134992e-08, + "loss": 1.1244, + "step": 31013 + }, + { + "epoch": 0.93, + "learning_rate": 5.638932417943388e-08, + "loss": 1.0625, + "step": 31014 + }, + { + "epoch": 0.93, + "learning_rate": 5.6337821479514335e-08, + "loss": 1.0118, + "step": 31015 + }, + { + "epoch": 0.93, + "learning_rate": 5.6286342042082e-08, + "loss": 1.2158, + "step": 31016 + }, + { + "epoch": 0.93, + "learning_rate": 5.623488586762649e-08, + "loss": 1.1586, + "step": 31017 + }, + { + "epoch": 0.93, + "learning_rate": 5.618345295663824e-08, + "loss": 1.0418, + "step": 31018 + }, + { + "epoch": 0.93, + "learning_rate": 5.613204330960631e-08, + "loss": 1.005, + "step": 31019 + }, + { + "epoch": 0.93, + "learning_rate": 5.608065692702031e-08, + "loss": 1.1562, + "step": 31020 + }, + { + "epoch": 0.93, + "learning_rate": 5.602929380936956e-08, + "loss": 1.0735, + "step": 31021 + }, + { + "epoch": 0.93, + "learning_rate": 5.5977953957143116e-08, + "loss": 1.1331, + "step": 31022 + }, + { + "epoch": 0.93, + "learning_rate": 5.5926637370829206e-08, + "loss": 1.0203, + "step": 31023 + }, + { + "epoch": 0.93, + "learning_rate": 5.58753440509166e-08, + "loss": 1.1042, + "step": 31024 + }, + { + "epoch": 0.93, + "learning_rate": 5.582407399789352e-08, + "loss": 1.0464, + "step": 31025 + }, + { + "epoch": 0.93, + "learning_rate": 5.577282721224847e-08, + "loss": 1.1485, + "step": 31026 + }, + { + "epoch": 0.93, + "learning_rate": 5.572160369446855e-08, + "loss": 1.0877, + "step": 31027 + }, + { + "epoch": 0.93, + "learning_rate": 5.567040344504171e-08, + "loss": 1.0238, + "step": 31028 + }, + { + "epoch": 0.93, + "learning_rate": 5.561922646445561e-08, + "loss": 1.0778, + "step": 31029 + }, + { + "epoch": 0.93, + "learning_rate": 5.556807275319709e-08, + "loss": 1.0834, + "step": 31030 + }, + { + "epoch": 0.93, + "learning_rate": 5.551694231175353e-08, + "loss": 1.1578, + "step": 31031 + }, + { + "epoch": 0.93, + "learning_rate": 5.5465835140610936e-08, + "loss": 1.1484, + "step": 31032 + }, + { + "epoch": 0.93, + "learning_rate": 5.5414751240256416e-08, + "loss": 1.0652, + "step": 31033 + }, + { + "epoch": 0.93, + "learning_rate": 5.5363690611176245e-08, + "loss": 1.0815, + "step": 31034 + }, + { + "epoch": 0.93, + "learning_rate": 5.531265325385643e-08, + "loss": 1.2014, + "step": 31035 + }, + { + "epoch": 0.93, + "learning_rate": 5.5261639168782686e-08, + "loss": 1.0997, + "step": 31036 + }, + { + "epoch": 0.93, + "learning_rate": 5.521064835644047e-08, + "loss": 1.1891, + "step": 31037 + }, + { + "epoch": 0.94, + "learning_rate": 5.515968081731549e-08, + "loss": 1.1257, + "step": 31038 + }, + { + "epoch": 0.94, + "learning_rate": 5.5108736551893193e-08, + "loss": 1.1855, + "step": 31039 + }, + { + "epoch": 0.94, + "learning_rate": 5.50578155606582e-08, + "loss": 1.0293, + "step": 31040 + }, + { + "epoch": 0.94, + "learning_rate": 5.500691784409484e-08, + "loss": 1.0103, + "step": 31041 + }, + { + "epoch": 0.94, + "learning_rate": 5.495604340268829e-08, + "loss": 1.0809, + "step": 31042 + }, + { + "epoch": 0.94, + "learning_rate": 5.490519223692259e-08, + "loss": 0.9029, + "step": 31043 + }, + { + "epoch": 0.94, + "learning_rate": 5.4854364347282085e-08, + "loss": 1.1344, + "step": 31044 + }, + { + "epoch": 0.94, + "learning_rate": 5.480355973425028e-08, + "loss": 0.9663, + "step": 31045 + }, + { + "epoch": 0.94, + "learning_rate": 5.4752778398310946e-08, + "loss": 1.2206, + "step": 31046 + }, + { + "epoch": 0.94, + "learning_rate": 5.470202033994731e-08, + "loss": 1.0612, + "step": 31047 + }, + { + "epoch": 0.94, + "learning_rate": 5.4651285559642886e-08, + "loss": 0.8832, + "step": 31048 + }, + { + "epoch": 0.94, + "learning_rate": 5.4600574057880604e-08, + "loss": 1.1361, + "step": 31049 + }, + { + "epoch": 0.94, + "learning_rate": 5.454988583514287e-08, + "loss": 1.1545, + "step": 31050 + }, + { + "epoch": 0.94, + "learning_rate": 5.449922089191262e-08, + "loss": 1.0818, + "step": 31051 + }, + { + "epoch": 0.94, + "learning_rate": 5.444857922867225e-08, + "loss": 1.0177, + "step": 31052 + }, + { + "epoch": 0.94, + "learning_rate": 5.439796084590332e-08, + "loss": 1.0134, + "step": 31053 + }, + { + "epoch": 0.94, + "learning_rate": 5.434736574408794e-08, + "loss": 1.0406, + "step": 31054 + }, + { + "epoch": 0.94, + "learning_rate": 5.429679392370768e-08, + "loss": 1.0549, + "step": 31055 + }, + { + "epoch": 0.94, + "learning_rate": 5.424624538524409e-08, + "loss": 1.1595, + "step": 31056 + }, + { + "epoch": 0.94, + "learning_rate": 5.4195720129178455e-08, + "loss": 1.1266, + "step": 31057 + }, + { + "epoch": 0.94, + "learning_rate": 5.4145218155991774e-08, + "loss": 1.1585, + "step": 31058 + }, + { + "epoch": 0.94, + "learning_rate": 5.409473946616423e-08, + "loss": 1.1031, + "step": 31059 + }, + { + "epoch": 0.94, + "learning_rate": 5.404428406017709e-08, + "loss": 1.0515, + "step": 31060 + }, + { + "epoch": 0.94, + "learning_rate": 5.399385193851026e-08, + "loss": 1.2819, + "step": 31061 + }, + { + "epoch": 0.94, + "learning_rate": 5.39434431016439e-08, + "loss": 1.072, + "step": 31062 + }, + { + "epoch": 0.94, + "learning_rate": 5.3893057550057915e-08, + "loss": 1.0392, + "step": 31063 + }, + { + "epoch": 0.94, + "learning_rate": 5.384269528423192e-08, + "loss": 1.2041, + "step": 31064 + }, + { + "epoch": 0.94, + "learning_rate": 5.379235630464552e-08, + "loss": 1.1093, + "step": 31065 + }, + { + "epoch": 0.94, + "learning_rate": 5.374204061177751e-08, + "loss": 0.9891, + "step": 31066 + }, + { + "epoch": 0.94, + "learning_rate": 5.369174820610723e-08, + "loss": 1.1615, + "step": 31067 + }, + { + "epoch": 0.94, + "learning_rate": 5.364147908811346e-08, + "loss": 1.0382, + "step": 31068 + }, + { + "epoch": 0.94, + "learning_rate": 5.359123325827442e-08, + "loss": 1.0294, + "step": 31069 + }, + { + "epoch": 0.94, + "learning_rate": 5.354101071706863e-08, + "loss": 1.1403, + "step": 31070 + }, + { + "epoch": 0.94, + "learning_rate": 5.349081146497431e-08, + "loss": 1.0068, + "step": 31071 + }, + { + "epoch": 0.94, + "learning_rate": 5.3440635502468866e-08, + "loss": 1.1085, + "step": 31072 + }, + { + "epoch": 0.94, + "learning_rate": 5.339048283003051e-08, + "loss": 1.1243, + "step": 31073 + }, + { + "epoch": 0.94, + "learning_rate": 5.334035344813637e-08, + "loss": 1.0619, + "step": 31074 + }, + { + "epoch": 0.94, + "learning_rate": 5.329024735726357e-08, + "loss": 1.2241, + "step": 31075 + }, + { + "epoch": 0.94, + "learning_rate": 5.3240164557889494e-08, + "loss": 1.0836, + "step": 31076 + }, + { + "epoch": 0.94, + "learning_rate": 5.3190105050490435e-08, + "loss": 1.0591, + "step": 31077 + }, + { + "epoch": 0.94, + "learning_rate": 5.3140068835543514e-08, + "loss": 1.0876, + "step": 31078 + }, + { + "epoch": 0.94, + "learning_rate": 5.3090055913524175e-08, + "loss": 1.1411, + "step": 31079 + }, + { + "epoch": 0.94, + "learning_rate": 5.3040066284909264e-08, + "loss": 1.2538, + "step": 31080 + }, + { + "epoch": 0.94, + "learning_rate": 5.299009995017451e-08, + "loss": 1.2189, + "step": 31081 + }, + { + "epoch": 0.94, + "learning_rate": 5.2940156909795646e-08, + "loss": 1.0954, + "step": 31082 + }, + { + "epoch": 0.94, + "learning_rate": 5.289023716424757e-08, + "loss": 1.1189, + "step": 31083 + }, + { + "epoch": 0.94, + "learning_rate": 5.284034071400601e-08, + "loss": 1.0424, + "step": 31084 + }, + { + "epoch": 0.94, + "learning_rate": 5.279046755954587e-08, + "loss": 1.19, + "step": 31085 + }, + { + "epoch": 0.94, + "learning_rate": 5.2740617701341754e-08, + "loss": 1.0423, + "step": 31086 + }, + { + "epoch": 0.94, + "learning_rate": 5.269079113986858e-08, + "loss": 1.1532, + "step": 31087 + }, + { + "epoch": 0.94, + "learning_rate": 5.2640987875600127e-08, + "loss": 1.0822, + "step": 31088 + }, + { + "epoch": 0.94, + "learning_rate": 5.259120790901101e-08, + "loss": 0.9902, + "step": 31089 + }, + { + "epoch": 0.94, + "learning_rate": 5.254145124057447e-08, + "loss": 1.0452, + "step": 31090 + }, + { + "epoch": 0.94, + "learning_rate": 5.2491717870765127e-08, + "loss": 1.1678, + "step": 31091 + }, + { + "epoch": 0.94, + "learning_rate": 5.244200780005565e-08, + "loss": 1.1803, + "step": 31092 + }, + { + "epoch": 0.94, + "learning_rate": 5.2392321028919276e-08, + "loss": 1.2394, + "step": 31093 + }, + { + "epoch": 0.94, + "learning_rate": 5.2342657557829245e-08, + "loss": 1.3077, + "step": 31094 + }, + { + "epoch": 0.94, + "learning_rate": 5.2293017387258506e-08, + "loss": 1.0294, + "step": 31095 + }, + { + "epoch": 0.94, + "learning_rate": 5.2243400517679176e-08, + "loss": 1.0469, + "step": 31096 + }, + { + "epoch": 0.94, + "learning_rate": 5.219380694956394e-08, + "loss": 1.1168, + "step": 31097 + }, + { + "epoch": 0.94, + "learning_rate": 5.214423668338464e-08, + "loss": 1.1254, + "step": 31098 + }, + { + "epoch": 0.94, + "learning_rate": 5.20946897196134e-08, + "loss": 1.1139, + "step": 31099 + }, + { + "epoch": 0.94, + "learning_rate": 5.2045166058721506e-08, + "loss": 1.1007, + "step": 31100 + }, + { + "epoch": 0.94, + "learning_rate": 5.199566570118081e-08, + "loss": 1.1196, + "step": 31101 + }, + { + "epoch": 0.94, + "learning_rate": 5.194618864746231e-08, + "loss": 1.0652, + "step": 31102 + }, + { + "epoch": 0.94, + "learning_rate": 5.1896734898037313e-08, + "loss": 1.0381, + "step": 31103 + }, + { + "epoch": 0.94, + "learning_rate": 5.184730445337627e-08, + "loss": 1.0577, + "step": 31104 + }, + { + "epoch": 0.94, + "learning_rate": 5.179789731394963e-08, + "loss": 1.0853, + "step": 31105 + }, + { + "epoch": 0.94, + "learning_rate": 5.174851348022814e-08, + "loss": 1.1501, + "step": 31106 + }, + { + "epoch": 0.94, + "learning_rate": 5.169915295268141e-08, + "loss": 1.0825, + "step": 31107 + }, + { + "epoch": 0.94, + "learning_rate": 5.1649815731780185e-08, + "loss": 1.0579, + "step": 31108 + }, + { + "epoch": 0.94, + "learning_rate": 5.1600501817992975e-08, + "loss": 1.1053, + "step": 31109 + }, + { + "epoch": 0.94, + "learning_rate": 5.155121121178996e-08, + "loss": 1.1082, + "step": 31110 + }, + { + "epoch": 0.94, + "learning_rate": 5.1501943913640215e-08, + "loss": 1.215, + "step": 31111 + }, + { + "epoch": 0.94, + "learning_rate": 5.145269992401253e-08, + "loss": 1.1609, + "step": 31112 + }, + { + "epoch": 0.94, + "learning_rate": 5.140347924337624e-08, + "loss": 1.0209, + "step": 31113 + }, + { + "epoch": 0.94, + "learning_rate": 5.135428187219932e-08, + "loss": 1.1258, + "step": 31114 + }, + { + "epoch": 0.94, + "learning_rate": 5.130510781095027e-08, + "loss": 1.0991, + "step": 31115 + }, + { + "epoch": 0.94, + "learning_rate": 5.125595706009734e-08, + "loss": 1.1084, + "step": 31116 + }, + { + "epoch": 0.94, + "learning_rate": 5.1206829620108756e-08, + "loss": 1.0601, + "step": 31117 + }, + { + "epoch": 0.94, + "learning_rate": 5.115772549145109e-08, + "loss": 1.207, + "step": 31118 + }, + { + "epoch": 0.94, + "learning_rate": 5.1108644674592865e-08, + "loss": 1.1276, + "step": 31119 + }, + { + "epoch": 0.94, + "learning_rate": 5.1059587170000643e-08, + "loss": 1.0524, + "step": 31120 + }, + { + "epoch": 0.94, + "learning_rate": 5.1010552978142115e-08, + "loss": 1.022, + "step": 31121 + }, + { + "epoch": 0.94, + "learning_rate": 5.0961542099483566e-08, + "loss": 1.1374, + "step": 31122 + }, + { + "epoch": 0.94, + "learning_rate": 5.091255453449129e-08, + "loss": 1.0974, + "step": 31123 + }, + { + "epoch": 0.94, + "learning_rate": 5.086359028363214e-08, + "loss": 1.0881, + "step": 31124 + }, + { + "epoch": 0.94, + "learning_rate": 5.081464934737212e-08, + "loss": 1.0531, + "step": 31125 + }, + { + "epoch": 0.94, + "learning_rate": 5.076573172617699e-08, + "loss": 0.9929, + "step": 31126 + }, + { + "epoch": 0.94, + "learning_rate": 5.071683742051276e-08, + "loss": 1.0683, + "step": 31127 + }, + { + "epoch": 0.94, + "learning_rate": 5.066796643084432e-08, + "loss": 1.0262, + "step": 31128 + }, + { + "epoch": 0.94, + "learning_rate": 5.061911875763742e-08, + "loss": 1.0282, + "step": 31129 + }, + { + "epoch": 0.94, + "learning_rate": 5.057029440135669e-08, + "loss": 1.2625, + "step": 31130 + }, + { + "epoch": 0.94, + "learning_rate": 5.052149336246703e-08, + "loss": 1.3263, + "step": 31131 + }, + { + "epoch": 0.94, + "learning_rate": 5.047271564143308e-08, + "loss": 1.1345, + "step": 31132 + }, + { + "epoch": 0.94, + "learning_rate": 5.0423961238719176e-08, + "loss": 1.0199, + "step": 31133 + }, + { + "epoch": 0.94, + "learning_rate": 5.03752301547894e-08, + "loss": 1.0353, + "step": 31134 + }, + { + "epoch": 0.94, + "learning_rate": 5.0326522390107824e-08, + "loss": 1.0329, + "step": 31135 + }, + { + "epoch": 0.94, + "learning_rate": 5.0277837945137686e-08, + "loss": 1.1529, + "step": 31136 + }, + { + "epoch": 0.94, + "learning_rate": 5.022917682034278e-08, + "loss": 1.1545, + "step": 31137 + }, + { + "epoch": 0.94, + "learning_rate": 5.018053901618608e-08, + "loss": 1.0399, + "step": 31138 + }, + { + "epoch": 0.94, + "learning_rate": 5.013192453313137e-08, + "loss": 1.1963, + "step": 31139 + }, + { + "epoch": 0.94, + "learning_rate": 5.008333337164023e-08, + "loss": 1.1018, + "step": 31140 + }, + { + "epoch": 0.94, + "learning_rate": 5.0034765532176175e-08, + "loss": 1.1278, + "step": 31141 + }, + { + "epoch": 0.94, + "learning_rate": 4.998622101520106e-08, + "loss": 1.1154, + "step": 31142 + }, + { + "epoch": 0.94, + "learning_rate": 4.99376998211773e-08, + "loss": 1.0778, + "step": 31143 + }, + { + "epoch": 0.94, + "learning_rate": 4.988920195056646e-08, + "loss": 1.1832, + "step": 31144 + }, + { + "epoch": 0.94, + "learning_rate": 4.984072740383067e-08, + "loss": 1.0897, + "step": 31145 + }, + { + "epoch": 0.94, + "learning_rate": 4.9792276181430674e-08, + "loss": 1.0574, + "step": 31146 + }, + { + "epoch": 0.94, + "learning_rate": 4.9743848283828614e-08, + "loss": 1.0637, + "step": 31147 + }, + { + "epoch": 0.94, + "learning_rate": 4.969544371148494e-08, + "loss": 1.0944, + "step": 31148 + }, + { + "epoch": 0.94, + "learning_rate": 4.96470624648604e-08, + "loss": 1.1286, + "step": 31149 + }, + { + "epoch": 0.94, + "learning_rate": 4.9598704544415734e-08, + "loss": 1.158, + "step": 31150 + }, + { + "epoch": 0.94, + "learning_rate": 4.955036995061113e-08, + "loss": 1.0381, + "step": 31151 + }, + { + "epoch": 0.94, + "learning_rate": 4.950205868390706e-08, + "loss": 1.1075, + "step": 31152 + }, + { + "epoch": 0.94, + "learning_rate": 4.945377074476288e-08, + "loss": 1.1301, + "step": 31153 + }, + { + "epoch": 0.94, + "learning_rate": 4.940550613363876e-08, + "loss": 1.1122, + "step": 31154 + }, + { + "epoch": 0.94, + "learning_rate": 4.935726485099407e-08, + "loss": 1.0625, + "step": 31155 + }, + { + "epoch": 0.94, + "learning_rate": 4.9309046897287885e-08, + "loss": 1.0302, + "step": 31156 + }, + { + "epoch": 0.94, + "learning_rate": 4.9260852272979e-08, + "loss": 1.2113, + "step": 31157 + }, + { + "epoch": 0.94, + "learning_rate": 4.9212680978526775e-08, + "loss": 0.9841, + "step": 31158 + }, + { + "epoch": 0.94, + "learning_rate": 4.9164533014389446e-08, + "loss": 1.038, + "step": 31159 + }, + { + "epoch": 0.94, + "learning_rate": 4.911640838102555e-08, + "loss": 1.0846, + "step": 31160 + }, + { + "epoch": 0.94, + "learning_rate": 4.906830707889276e-08, + "loss": 1.1135, + "step": 31161 + }, + { + "epoch": 0.94, + "learning_rate": 4.9020229108449614e-08, + "loss": 1.2138, + "step": 31162 + }, + { + "epoch": 0.94, + "learning_rate": 4.8972174470153233e-08, + "loss": 1.069, + "step": 31163 + }, + { + "epoch": 0.94, + "learning_rate": 4.892414316446103e-08, + "loss": 1.0817, + "step": 31164 + }, + { + "epoch": 0.94, + "learning_rate": 4.8876135191830986e-08, + "loss": 1.1464, + "step": 31165 + }, + { + "epoch": 0.94, + "learning_rate": 4.8828150552719664e-08, + "loss": 1.0754, + "step": 31166 + }, + { + "epoch": 0.94, + "learning_rate": 4.878018924758338e-08, + "loss": 1.0453, + "step": 31167 + }, + { + "epoch": 0.94, + "learning_rate": 4.8732251276879526e-08, + "loss": 1.0893, + "step": 31168 + }, + { + "epoch": 0.94, + "learning_rate": 4.8684336641063865e-08, + "loss": 1.0421, + "step": 31169 + }, + { + "epoch": 0.94, + "learning_rate": 4.863644534059297e-08, + "loss": 1.0302, + "step": 31170 + }, + { + "epoch": 0.94, + "learning_rate": 4.858857737592204e-08, + "loss": 0.9835, + "step": 31171 + }, + { + "epoch": 0.94, + "learning_rate": 4.8540732747507646e-08, + "loss": 1.0737, + "step": 31172 + }, + { + "epoch": 0.94, + "learning_rate": 4.8492911455804705e-08, + "loss": 1.1385, + "step": 31173 + }, + { + "epoch": 0.94, + "learning_rate": 4.84451135012684e-08, + "loss": 1.1899, + "step": 31174 + }, + { + "epoch": 0.94, + "learning_rate": 4.839733888435422e-08, + "loss": 1.0612, + "step": 31175 + }, + { + "epoch": 0.94, + "learning_rate": 4.834958760551622e-08, + "loss": 1.0054, + "step": 31176 + }, + { + "epoch": 0.94, + "learning_rate": 4.830185966520962e-08, + "loss": 1.0959, + "step": 31177 + }, + { + "epoch": 0.94, + "learning_rate": 4.8254155063888753e-08, + "loss": 1.0029, + "step": 31178 + }, + { + "epoch": 0.94, + "learning_rate": 4.820647380200716e-08, + "loss": 1.0262, + "step": 31179 + }, + { + "epoch": 0.94, + "learning_rate": 4.8158815880019195e-08, + "loss": 1.1901, + "step": 31180 + }, + { + "epoch": 0.94, + "learning_rate": 4.811118129837838e-08, + "loss": 1.0861, + "step": 31181 + }, + { + "epoch": 0.94, + "learning_rate": 4.806357005753853e-08, + "loss": 1.1612, + "step": 31182 + }, + { + "epoch": 0.94, + "learning_rate": 4.8015982157952334e-08, + "loss": 1.0166, + "step": 31183 + }, + { + "epoch": 0.94, + "learning_rate": 4.7968417600073034e-08, + "loss": 1.0333, + "step": 31184 + }, + { + "epoch": 0.94, + "learning_rate": 4.792087638435361e-08, + "loss": 1.1288, + "step": 31185 + }, + { + "epoch": 0.94, + "learning_rate": 4.787335851124675e-08, + "loss": 1.0948, + "step": 31186 + }, + { + "epoch": 0.94, + "learning_rate": 4.782586398120431e-08, + "loss": 1.045, + "step": 31187 + }, + { + "epoch": 0.94, + "learning_rate": 4.777839279467844e-08, + "loss": 1.1372, + "step": 31188 + }, + { + "epoch": 0.94, + "learning_rate": 4.773094495212127e-08, + "loss": 1.084, + "step": 31189 + }, + { + "epoch": 0.94, + "learning_rate": 4.7683520453984664e-08, + "loss": 1.1261, + "step": 31190 + }, + { + "epoch": 0.94, + "learning_rate": 4.763611930071993e-08, + "loss": 1.1431, + "step": 31191 + }, + { + "epoch": 0.94, + "learning_rate": 4.758874149277809e-08, + "loss": 1.1619, + "step": 31192 + }, + { + "epoch": 0.94, + "learning_rate": 4.754138703061017e-08, + "loss": 1.0994, + "step": 31193 + }, + { + "epoch": 0.94, + "learning_rate": 4.7494055914667214e-08, + "loss": 1.1068, + "step": 31194 + }, + { + "epoch": 0.94, + "learning_rate": 4.7446748145399956e-08, + "loss": 1.0354, + "step": 31195 + }, + { + "epoch": 0.94, + "learning_rate": 4.7399463723258046e-08, + "loss": 0.9132, + "step": 31196 + }, + { + "epoch": 0.94, + "learning_rate": 4.7352202648692226e-08, + "loss": 1.0831, + "step": 31197 + }, + { + "epoch": 0.94, + "learning_rate": 4.7304964922152144e-08, + "loss": 1.0203, + "step": 31198 + }, + { + "epoch": 0.94, + "learning_rate": 4.725775054408771e-08, + "loss": 1.1816, + "step": 31199 + }, + { + "epoch": 0.94, + "learning_rate": 4.7210559514948016e-08, + "loss": 1.0368, + "step": 31200 + }, + { + "epoch": 0.94, + "learning_rate": 4.7163391835182426e-08, + "loss": 1.0764, + "step": 31201 + }, + { + "epoch": 0.94, + "learning_rate": 4.7116247505240296e-08, + "loss": 1.0812, + "step": 31202 + }, + { + "epoch": 0.94, + "learning_rate": 4.7069126525569885e-08, + "loss": 1.002, + "step": 31203 + }, + { + "epoch": 0.94, + "learning_rate": 4.702202889662027e-08, + "loss": 1.0255, + "step": 31204 + }, + { + "epoch": 0.94, + "learning_rate": 4.697495461883944e-08, + "loss": 1.1114, + "step": 31205 + }, + { + "epoch": 0.94, + "learning_rate": 4.692790369267536e-08, + "loss": 1.2127, + "step": 31206 + }, + { + "epoch": 0.94, + "learning_rate": 4.688087611857628e-08, + "loss": 1.1181, + "step": 31207 + }, + { + "epoch": 0.94, + "learning_rate": 4.68338718969899e-08, + "loss": 1.1325, + "step": 31208 + }, + { + "epoch": 0.94, + "learning_rate": 4.6786891028363926e-08, + "loss": 1.0658, + "step": 31209 + }, + { + "epoch": 0.94, + "learning_rate": 4.673993351314493e-08, + "loss": 1.0656, + "step": 31210 + }, + { + "epoch": 0.94, + "learning_rate": 4.6692999351780065e-08, + "loss": 1.1459, + "step": 31211 + }, + { + "epoch": 0.94, + "learning_rate": 4.6646088544716474e-08, + "loss": 1.1519, + "step": 31212 + }, + { + "epoch": 0.94, + "learning_rate": 4.659920109240046e-08, + "loss": 1.1703, + "step": 31213 + }, + { + "epoch": 0.94, + "learning_rate": 4.655233699527834e-08, + "loss": 1.1191, + "step": 31214 + }, + { + "epoch": 0.94, + "learning_rate": 4.650549625379669e-08, + "loss": 1.0963, + "step": 31215 + }, + { + "epoch": 0.94, + "learning_rate": 4.645867886840072e-08, + "loss": 1.1439, + "step": 31216 + }, + { + "epoch": 0.94, + "learning_rate": 4.6411884839536734e-08, + "loss": 1.2213, + "step": 31217 + }, + { + "epoch": 0.94, + "learning_rate": 4.636511416764994e-08, + "loss": 1.1409, + "step": 31218 + }, + { + "epoch": 0.94, + "learning_rate": 4.631836685318525e-08, + "loss": 1.0439, + "step": 31219 + }, + { + "epoch": 0.94, + "learning_rate": 4.6271642896588144e-08, + "loss": 1.0675, + "step": 31220 + }, + { + "epoch": 0.94, + "learning_rate": 4.6224942298303544e-08, + "loss": 1.068, + "step": 31221 + }, + { + "epoch": 0.94, + "learning_rate": 4.6178265058775266e-08, + "loss": 1.1178, + "step": 31222 + }, + { + "epoch": 0.94, + "learning_rate": 4.613161117844822e-08, + "loss": 1.0153, + "step": 31223 + }, + { + "epoch": 0.94, + "learning_rate": 4.608498065776651e-08, + "loss": 1.1355, + "step": 31224 + }, + { + "epoch": 0.94, + "learning_rate": 4.603837349717394e-08, + "loss": 1.2032, + "step": 31225 + }, + { + "epoch": 0.94, + "learning_rate": 4.599178969711404e-08, + "loss": 1.0381, + "step": 31226 + }, + { + "epoch": 0.94, + "learning_rate": 4.594522925803063e-08, + "loss": 1.0154, + "step": 31227 + }, + { + "epoch": 0.94, + "learning_rate": 4.589869218036641e-08, + "loss": 1.087, + "step": 31228 + }, + { + "epoch": 0.94, + "learning_rate": 4.585217846456491e-08, + "loss": 1.0026, + "step": 31229 + }, + { + "epoch": 0.94, + "learning_rate": 4.5805688111068836e-08, + "loss": 1.0728, + "step": 31230 + }, + { + "epoch": 0.94, + "learning_rate": 4.575922112032061e-08, + "loss": 1.1408, + "step": 31231 + }, + { + "epoch": 0.94, + "learning_rate": 4.5712777492762375e-08, + "loss": 1.103, + "step": 31232 + }, + { + "epoch": 0.94, + "learning_rate": 4.5666357228836557e-08, + "loss": 1.085, + "step": 31233 + }, + { + "epoch": 0.94, + "learning_rate": 4.5619960328985024e-08, + "loss": 1.0457, + "step": 31234 + }, + { + "epoch": 0.94, + "learning_rate": 4.557358679364937e-08, + "loss": 1.0696, + "step": 31235 + }, + { + "epoch": 0.94, + "learning_rate": 4.5527236623271185e-08, + "loss": 1.1129, + "step": 31236 + }, + { + "epoch": 0.94, + "learning_rate": 4.548090981829123e-08, + "loss": 1.2161, + "step": 31237 + }, + { + "epoch": 0.94, + "learning_rate": 4.5434606379151094e-08, + "loss": 1.1505, + "step": 31238 + }, + { + "epoch": 0.94, + "learning_rate": 4.538832630629125e-08, + "loss": 1.0149, + "step": 31239 + }, + { + "epoch": 0.94, + "learning_rate": 4.534206960015247e-08, + "loss": 1.1526, + "step": 31240 + }, + { + "epoch": 0.94, + "learning_rate": 4.529583626117495e-08, + "loss": 1.0917, + "step": 31241 + }, + { + "epoch": 0.94, + "learning_rate": 4.52496262897989e-08, + "loss": 1.0804, + "step": 31242 + }, + { + "epoch": 0.94, + "learning_rate": 4.5203439686464513e-08, + "loss": 1.2003, + "step": 31243 + }, + { + "epoch": 0.94, + "learning_rate": 4.515727645161061e-08, + "loss": 1.0996, + "step": 31244 + }, + { + "epoch": 0.94, + "learning_rate": 4.5111136585677116e-08, + "loss": 1.153, + "step": 31245 + }, + { + "epoch": 0.94, + "learning_rate": 4.5065020089103406e-08, + "loss": 1.1908, + "step": 31246 + }, + { + "epoch": 0.94, + "learning_rate": 4.501892696232857e-08, + "loss": 1.0649, + "step": 31247 + }, + { + "epoch": 0.94, + "learning_rate": 4.497285720579114e-08, + "loss": 1.0878, + "step": 31248 + }, + { + "epoch": 0.94, + "learning_rate": 4.492681081992939e-08, + "loss": 1.1492, + "step": 31249 + }, + { + "epoch": 0.94, + "learning_rate": 4.4880787805182404e-08, + "loss": 1.1584, + "step": 31250 + }, + { + "epoch": 0.94, + "learning_rate": 4.483478816198789e-08, + "loss": 0.9988, + "step": 31251 + }, + { + "epoch": 0.94, + "learning_rate": 4.478881189078354e-08, + "loss": 1.0186, + "step": 31252 + }, + { + "epoch": 0.94, + "learning_rate": 4.474285899200709e-08, + "loss": 1.1026, + "step": 31253 + }, + { + "epoch": 0.94, + "learning_rate": 4.469692946609622e-08, + "loss": 1.1024, + "step": 31254 + }, + { + "epoch": 0.94, + "learning_rate": 4.465102331348808e-08, + "loss": 1.1566, + "step": 31255 + }, + { + "epoch": 0.94, + "learning_rate": 4.460514053461984e-08, + "loss": 1.1828, + "step": 31256 + }, + { + "epoch": 0.94, + "learning_rate": 4.455928112992808e-08, + "loss": 1.0233, + "step": 31257 + }, + { + "epoch": 0.94, + "learning_rate": 4.451344509984912e-08, + "loss": 1.1398, + "step": 31258 + }, + { + "epoch": 0.94, + "learning_rate": 4.446763244481983e-08, + "loss": 1.1013, + "step": 31259 + }, + { + "epoch": 0.94, + "learning_rate": 4.442184316527598e-08, + "loss": 1.1811, + "step": 31260 + }, + { + "epoch": 0.94, + "learning_rate": 4.437607726165361e-08, + "loss": 1.1731, + "step": 31261 + }, + { + "epoch": 0.94, + "learning_rate": 4.4330334734388194e-08, + "loss": 1.0253, + "step": 31262 + }, + { + "epoch": 0.94, + "learning_rate": 4.428461558391523e-08, + "loss": 1.135, + "step": 31263 + }, + { + "epoch": 0.94, + "learning_rate": 4.423891981067019e-08, + "loss": 1.0122, + "step": 31264 + }, + { + "epoch": 0.94, + "learning_rate": 4.4193247415087735e-08, + "loss": 1.1509, + "step": 31265 + }, + { + "epoch": 0.94, + "learning_rate": 4.4147598397602795e-08, + "loss": 1.0813, + "step": 31266 + }, + { + "epoch": 0.94, + "learning_rate": 4.410197275865003e-08, + "loss": 1.0704, + "step": 31267 + }, + { + "epoch": 0.94, + "learning_rate": 4.4056370498663794e-08, + "loss": 1.1455, + "step": 31268 + }, + { + "epoch": 0.94, + "learning_rate": 4.401079161807792e-08, + "loss": 1.3256, + "step": 31269 + }, + { + "epoch": 0.94, + "learning_rate": 4.3965236117326503e-08, + "loss": 1.0936, + "step": 31270 + }, + { + "epoch": 0.94, + "learning_rate": 4.3919703996843086e-08, + "loss": 1.032, + "step": 31271 + }, + { + "epoch": 0.94, + "learning_rate": 4.387419525706122e-08, + "loss": 1.0857, + "step": 31272 + }, + { + "epoch": 0.94, + "learning_rate": 4.382870989841442e-08, + "loss": 1.1919, + "step": 31273 + }, + { + "epoch": 0.94, + "learning_rate": 4.3783247921335146e-08, + "loss": 1.1711, + "step": 31274 + }, + { + "epoch": 0.94, + "learning_rate": 4.373780932625638e-08, + "loss": 1.0175, + "step": 31275 + }, + { + "epoch": 0.94, + "learning_rate": 4.3692394113610536e-08, + "loss": 0.9756, + "step": 31276 + }, + { + "epoch": 0.94, + "learning_rate": 4.364700228383062e-08, + "loss": 0.9615, + "step": 31277 + }, + { + "epoch": 0.94, + "learning_rate": 4.360163383734767e-08, + "loss": 1.1184, + "step": 31278 + }, + { + "epoch": 0.94, + "learning_rate": 4.3556288774594394e-08, + "loss": 1.0754, + "step": 31279 + }, + { + "epoch": 0.94, + "learning_rate": 4.351096709600211e-08, + "loss": 1.1011, + "step": 31280 + }, + { + "epoch": 0.94, + "learning_rate": 4.3465668802002426e-08, + "loss": 1.2285, + "step": 31281 + }, + { + "epoch": 0.94, + "learning_rate": 4.342039389302638e-08, + "loss": 1.067, + "step": 31282 + }, + { + "epoch": 0.94, + "learning_rate": 4.3375142369505016e-08, + "loss": 1.0364, + "step": 31283 + }, + { + "epoch": 0.94, + "learning_rate": 4.3329914231869106e-08, + "loss": 1.0482, + "step": 31284 + }, + { + "epoch": 0.94, + "learning_rate": 4.328470948054914e-08, + "loss": 1.2277, + "step": 31285 + }, + { + "epoch": 0.94, + "learning_rate": 4.323952811597587e-08, + "loss": 1.2116, + "step": 31286 + }, + { + "epoch": 0.94, + "learning_rate": 4.3194370138578966e-08, + "loss": 1.2589, + "step": 31287 + }, + { + "epoch": 0.94, + "learning_rate": 4.314923554878836e-08, + "loss": 1.0568, + "step": 31288 + }, + { + "epoch": 0.94, + "learning_rate": 4.3104124347033706e-08, + "loss": 1.0913, + "step": 31289 + }, + { + "epoch": 0.94, + "learning_rate": 4.3059036533744656e-08, + "loss": 1.0635, + "step": 31290 + }, + { + "epoch": 0.94, + "learning_rate": 4.301397210935032e-08, + "loss": 1.0334, + "step": 31291 + }, + { + "epoch": 0.94, + "learning_rate": 4.2968931074279516e-08, + "loss": 1.0829, + "step": 31292 + }, + { + "epoch": 0.94, + "learning_rate": 4.292391342896107e-08, + "loss": 1.1835, + "step": 31293 + }, + { + "epoch": 0.94, + "learning_rate": 4.287891917382381e-08, + "loss": 1.0854, + "step": 31294 + }, + { + "epoch": 0.94, + "learning_rate": 4.283394830929544e-08, + "loss": 1.1602, + "step": 31295 + }, + { + "epoch": 0.94, + "learning_rate": 4.2789000835804785e-08, + "loss": 0.9744, + "step": 31296 + }, + { + "epoch": 0.94, + "learning_rate": 4.2744076753779285e-08, + "loss": 0.984, + "step": 31297 + }, + { + "epoch": 0.94, + "learning_rate": 4.269917606364693e-08, + "loss": 1.1662, + "step": 31298 + }, + { + "epoch": 0.94, + "learning_rate": 4.265429876583488e-08, + "loss": 1.1151, + "step": 31299 + }, + { + "epoch": 0.94, + "learning_rate": 4.260944486077029e-08, + "loss": 0.9758, + "step": 31300 + }, + { + "epoch": 0.94, + "learning_rate": 4.256461434888032e-08, + "loss": 1.0085, + "step": 31301 + }, + { + "epoch": 0.94, + "learning_rate": 4.251980723059185e-08, + "loss": 1.098, + "step": 31302 + }, + { + "epoch": 0.94, + "learning_rate": 4.24750235063312e-08, + "loss": 1.0565, + "step": 31303 + }, + { + "epoch": 0.94, + "learning_rate": 4.243026317652443e-08, + "loss": 1.0532, + "step": 31304 + }, + { + "epoch": 0.94, + "learning_rate": 4.238552624159814e-08, + "loss": 1.1089, + "step": 31305 + }, + { + "epoch": 0.94, + "learning_rate": 4.234081270197809e-08, + "loss": 1.0342, + "step": 31306 + }, + { + "epoch": 0.94, + "learning_rate": 4.229612255809007e-08, + "loss": 1.1265, + "step": 31307 + }, + { + "epoch": 0.94, + "learning_rate": 4.2251455810358997e-08, + "loss": 1.129, + "step": 31308 + }, + { + "epoch": 0.94, + "learning_rate": 4.22068124592101e-08, + "loss": 1.0989, + "step": 31309 + }, + { + "epoch": 0.94, + "learning_rate": 4.2162192505068864e-08, + "loss": 0.9583, + "step": 31310 + }, + { + "epoch": 0.94, + "learning_rate": 4.211759594835996e-08, + "loss": 1.1216, + "step": 31311 + }, + { + "epoch": 0.94, + "learning_rate": 4.207302278950775e-08, + "loss": 1.1327, + "step": 31312 + }, + { + "epoch": 0.94, + "learning_rate": 4.2028473028936643e-08, + "loss": 1.1193, + "step": 31313 + }, + { + "epoch": 0.94, + "learning_rate": 4.198394666707045e-08, + "loss": 1.0151, + "step": 31314 + }, + { + "epoch": 0.94, + "learning_rate": 4.193944370433328e-08, + "loss": 0.9839, + "step": 31315 + }, + { + "epoch": 0.94, + "learning_rate": 4.189496414114924e-08, + "loss": 1.1621, + "step": 31316 + }, + { + "epoch": 0.94, + "learning_rate": 4.185050797794077e-08, + "loss": 1.176, + "step": 31317 + }, + { + "epoch": 0.94, + "learning_rate": 4.180607521513169e-08, + "loss": 1.1147, + "step": 31318 + }, + { + "epoch": 0.94, + "learning_rate": 4.176166585314473e-08, + "loss": 1.215, + "step": 31319 + }, + { + "epoch": 0.94, + "learning_rate": 4.171727989240315e-08, + "loss": 1.1414, + "step": 31320 + }, + { + "epoch": 0.94, + "learning_rate": 4.167291733332884e-08, + "loss": 1.1193, + "step": 31321 + }, + { + "epoch": 0.94, + "learning_rate": 4.1628578176344245e-08, + "loss": 1.1041, + "step": 31322 + }, + { + "epoch": 0.94, + "learning_rate": 4.15842624218718e-08, + "loss": 1.1902, + "step": 31323 + }, + { + "epoch": 0.94, + "learning_rate": 4.153997007033311e-08, + "loss": 1.1364, + "step": 31324 + }, + { + "epoch": 0.94, + "learning_rate": 4.149570112215007e-08, + "loss": 1.1775, + "step": 31325 + }, + { + "epoch": 0.94, + "learning_rate": 4.145145557774372e-08, + "loss": 1.0377, + "step": 31326 + }, + { + "epoch": 0.94, + "learning_rate": 4.1407233437535385e-08, + "loss": 1.1279, + "step": 31327 + }, + { + "epoch": 0.94, + "learning_rate": 4.136303470194614e-08, + "loss": 1.0129, + "step": 31328 + }, + { + "epoch": 0.94, + "learning_rate": 4.1318859371397013e-08, + "loss": 1.0568, + "step": 31329 + }, + { + "epoch": 0.94, + "learning_rate": 4.127470744630796e-08, + "loss": 1.0911, + "step": 31330 + }, + { + "epoch": 0.94, + "learning_rate": 4.1230578927099476e-08, + "loss": 1.1592, + "step": 31331 + }, + { + "epoch": 0.94, + "learning_rate": 4.11864738141915e-08, + "loss": 1.0704, + "step": 31332 + }, + { + "epoch": 0.94, + "learning_rate": 4.114239210800453e-08, + "loss": 1.0629, + "step": 31333 + }, + { + "epoch": 0.94, + "learning_rate": 4.109833380895739e-08, + "loss": 0.9832, + "step": 31334 + }, + { + "epoch": 0.94, + "learning_rate": 4.105429891747004e-08, + "loss": 1.1495, + "step": 31335 + }, + { + "epoch": 0.94, + "learning_rate": 4.101028743396129e-08, + "loss": 1.0892, + "step": 31336 + }, + { + "epoch": 0.94, + "learning_rate": 4.096629935885055e-08, + "loss": 1.0971, + "step": 31337 + }, + { + "epoch": 0.94, + "learning_rate": 4.0922334692556354e-08, + "loss": 1.1543, + "step": 31338 + }, + { + "epoch": 0.94, + "learning_rate": 4.087839343549699e-08, + "loss": 1.072, + "step": 31339 + }, + { + "epoch": 0.94, + "learning_rate": 4.083447558809101e-08, + "loss": 1.0246, + "step": 31340 + }, + { + "epoch": 0.94, + "learning_rate": 4.079058115075668e-08, + "loss": 1.013, + "step": 31341 + }, + { + "epoch": 0.94, + "learning_rate": 4.074671012391146e-08, + "loss": 1.1265, + "step": 31342 + }, + { + "epoch": 0.94, + "learning_rate": 4.070286250797306e-08, + "loss": 1.1382, + "step": 31343 + }, + { + "epoch": 0.94, + "learning_rate": 4.065903830335921e-08, + "loss": 1.2777, + "step": 31344 + }, + { + "epoch": 0.94, + "learning_rate": 4.061523751048652e-08, + "loss": 1.0224, + "step": 31345 + }, + { + "epoch": 0.94, + "learning_rate": 4.057146012977242e-08, + "loss": 1.0649, + "step": 31346 + }, + { + "epoch": 0.94, + "learning_rate": 4.052770616163354e-08, + "loss": 1.0198, + "step": 31347 + }, + { + "epoch": 0.94, + "learning_rate": 4.048397560648648e-08, + "loss": 1.1261, + "step": 31348 + }, + { + "epoch": 0.94, + "learning_rate": 4.04402684647473e-08, + "loss": 1.0787, + "step": 31349 + }, + { + "epoch": 0.94, + "learning_rate": 4.0396584736832056e-08, + "loss": 1.1408, + "step": 31350 + }, + { + "epoch": 0.94, + "learning_rate": 4.035292442315708e-08, + "loss": 1.1876, + "step": 31351 + }, + { + "epoch": 0.94, + "learning_rate": 4.03092875241376e-08, + "loss": 1.0984, + "step": 31352 + }, + { + "epoch": 0.94, + "learning_rate": 4.026567404018883e-08, + "loss": 1.0383, + "step": 31353 + }, + { + "epoch": 0.94, + "learning_rate": 4.022208397172628e-08, + "loss": 1.0381, + "step": 31354 + }, + { + "epoch": 0.94, + "learning_rate": 4.0178517319165165e-08, + "loss": 1.1395, + "step": 31355 + }, + { + "epoch": 0.94, + "learning_rate": 4.013497408291961e-08, + "loss": 1.108, + "step": 31356 + }, + { + "epoch": 0.94, + "learning_rate": 4.0091454263404275e-08, + "loss": 1.0692, + "step": 31357 + }, + { + "epoch": 0.94, + "learning_rate": 4.004795786103355e-08, + "loss": 1.0345, + "step": 31358 + }, + { + "epoch": 0.94, + "learning_rate": 4.000448487622183e-08, + "loss": 1.0493, + "step": 31359 + }, + { + "epoch": 0.94, + "learning_rate": 3.996103530938239e-08, + "loss": 1.0765, + "step": 31360 + }, + { + "epoch": 0.94, + "learning_rate": 3.991760916092907e-08, + "loss": 1.0995, + "step": 31361 + }, + { + "epoch": 0.94, + "learning_rate": 3.987420643127543e-08, + "loss": 1.0628, + "step": 31362 + }, + { + "epoch": 0.94, + "learning_rate": 3.9830827120834195e-08, + "loss": 1.0678, + "step": 31363 + }, + { + "epoch": 0.94, + "learning_rate": 3.9787471230019194e-08, + "loss": 1.0503, + "step": 31364 + }, + { + "epoch": 0.94, + "learning_rate": 3.9744138759242045e-08, + "loss": 1.0739, + "step": 31365 + }, + { + "epoch": 0.94, + "learning_rate": 3.9700829708916034e-08, + "loss": 1.1252, + "step": 31366 + }, + { + "epoch": 0.94, + "learning_rate": 3.965754407945332e-08, + "loss": 1.0014, + "step": 31367 + }, + { + "epoch": 0.94, + "learning_rate": 3.961428187126581e-08, + "loss": 1.1695, + "step": 31368 + }, + { + "epoch": 0.94, + "learning_rate": 3.9571043084765116e-08, + "loss": 0.967, + "step": 31369 + }, + { + "epoch": 0.95, + "learning_rate": 3.95278277203634e-08, + "loss": 1.0688, + "step": 31370 + }, + { + "epoch": 0.95, + "learning_rate": 3.9484635778471446e-08, + "loss": 1.0146, + "step": 31371 + }, + { + "epoch": 0.95, + "learning_rate": 3.9441467259500874e-08, + "loss": 0.985, + "step": 31372 + }, + { + "epoch": 0.95, + "learning_rate": 3.939832216386247e-08, + "loss": 1.0582, + "step": 31373 + }, + { + "epoch": 0.95, + "learning_rate": 3.9355200491967286e-08, + "loss": 1.2156, + "step": 31374 + }, + { + "epoch": 0.95, + "learning_rate": 3.931210224422527e-08, + "loss": 1.0378, + "step": 31375 + }, + { + "epoch": 0.95, + "learning_rate": 3.9269027421046934e-08, + "loss": 1.0662, + "step": 31376 + }, + { + "epoch": 0.95, + "learning_rate": 3.9225976022842224e-08, + "loss": 1.0935, + "step": 31377 + }, + { + "epoch": 0.95, + "learning_rate": 3.91829480500211e-08, + "loss": 1.0378, + "step": 31378 + }, + { + "epoch": 0.95, + "learning_rate": 3.9139943502993215e-08, + "loss": 1.0526, + "step": 31379 + }, + { + "epoch": 0.95, + "learning_rate": 3.9096962382167704e-08, + "loss": 1.1819, + "step": 31380 + }, + { + "epoch": 0.95, + "learning_rate": 3.9054004687954225e-08, + "loss": 1.2688, + "step": 31381 + }, + { + "epoch": 0.95, + "learning_rate": 3.9011070420761076e-08, + "loss": 1.1224, + "step": 31382 + }, + { + "epoch": 0.95, + "learning_rate": 3.896815958099764e-08, + "loss": 1.0797, + "step": 31383 + }, + { + "epoch": 0.95, + "learning_rate": 3.892527216907166e-08, + "loss": 1.0425, + "step": 31384 + }, + { + "epoch": 0.95, + "learning_rate": 3.888240818539224e-08, + "loss": 1.0726, + "step": 31385 + }, + { + "epoch": 0.95, + "learning_rate": 3.883956763036656e-08, + "loss": 1.0914, + "step": 31386 + }, + { + "epoch": 0.95, + "learning_rate": 3.8796750504402905e-08, + "loss": 1.1438, + "step": 31387 + }, + { + "epoch": 0.95, + "learning_rate": 3.8753956807909e-08, + "loss": 1.0389, + "step": 31388 + }, + { + "epoch": 0.95, + "learning_rate": 3.8711186541292026e-08, + "loss": 1.1103, + "step": 31389 + }, + { + "epoch": 0.95, + "learning_rate": 3.866843970495915e-08, + "loss": 1.1515, + "step": 31390 + }, + { + "epoch": 0.95, + "learning_rate": 3.862571629931727e-08, + "loss": 1.0241, + "step": 31391 + }, + { + "epoch": 0.95, + "learning_rate": 3.858301632477329e-08, + "loss": 1.1274, + "step": 31392 + }, + { + "epoch": 0.95, + "learning_rate": 3.854033978173327e-08, + "loss": 0.9639, + "step": 31393 + }, + { + "epoch": 0.95, + "learning_rate": 3.849768667060411e-08, + "loss": 1.0943, + "step": 31394 + }, + { + "epoch": 0.95, + "learning_rate": 3.845505699179103e-08, + "loss": 1.1212, + "step": 31395 + }, + { + "epoch": 0.95, + "learning_rate": 3.841245074570038e-08, + "loss": 1.1123, + "step": 31396 + }, + { + "epoch": 0.95, + "learning_rate": 3.836986793273767e-08, + "loss": 1.1666, + "step": 31397 + }, + { + "epoch": 0.95, + "learning_rate": 3.8327308553308684e-08, + "loss": 1.0861, + "step": 31398 + }, + { + "epoch": 0.95, + "learning_rate": 3.8284772607817544e-08, + "loss": 1.1476, + "step": 31399 + }, + { + "epoch": 0.95, + "learning_rate": 3.8242260096670033e-08, + "loss": 1.129, + "step": 31400 + }, + { + "epoch": 0.95, + "learning_rate": 3.819977102027056e-08, + "loss": 0.9902, + "step": 31401 + }, + { + "epoch": 0.95, + "learning_rate": 3.815730537902351e-08, + "loss": 1.1179, + "step": 31402 + }, + { + "epoch": 0.95, + "learning_rate": 3.8114863173333573e-08, + "loss": 1.0357, + "step": 31403 + }, + { + "epoch": 0.95, + "learning_rate": 3.807244440360403e-08, + "loss": 1.1244, + "step": 31404 + }, + { + "epoch": 0.95, + "learning_rate": 3.803004907023927e-08, + "loss": 1.1122, + "step": 31405 + }, + { + "epoch": 0.95, + "learning_rate": 3.798767717364288e-08, + "loss": 1.0626, + "step": 31406 + }, + { + "epoch": 0.95, + "learning_rate": 3.7945328714218133e-08, + "loss": 1.1339, + "step": 31407 + }, + { + "epoch": 0.95, + "learning_rate": 3.7903003692367765e-08, + "loss": 1.1344, + "step": 31408 + }, + { + "epoch": 0.95, + "learning_rate": 3.7860702108495075e-08, + "loss": 1.1, + "step": 31409 + }, + { + "epoch": 0.95, + "learning_rate": 3.781842396300278e-08, + "loss": 1.1625, + "step": 31410 + }, + { + "epoch": 0.95, + "learning_rate": 3.777616925629335e-08, + "loss": 1.1097, + "step": 31411 + }, + { + "epoch": 0.95, + "learning_rate": 3.773393798876895e-08, + "loss": 1.2021, + "step": 31412 + }, + { + "epoch": 0.95, + "learning_rate": 3.76917301608315e-08, + "loss": 1.0907, + "step": 31413 + }, + { + "epoch": 0.95, + "learning_rate": 3.7649545772882876e-08, + "loss": 1.1416, + "step": 31414 + }, + { + "epoch": 0.95, + "learning_rate": 3.760738482532444e-08, + "loss": 1.1002, + "step": 31415 + }, + { + "epoch": 0.95, + "learning_rate": 3.756524731855837e-08, + "loss": 1.0687, + "step": 31416 + }, + { + "epoch": 0.95, + "learning_rate": 3.7523133252984625e-08, + "loss": 1.1426, + "step": 31417 + }, + { + "epoch": 0.95, + "learning_rate": 3.748104262900482e-08, + "loss": 1.0715, + "step": 31418 + }, + { + "epoch": 0.95, + "learning_rate": 3.743897544701974e-08, + "loss": 1.0733, + "step": 31419 + }, + { + "epoch": 0.95, + "learning_rate": 3.739693170742964e-08, + "loss": 0.9744, + "step": 31420 + }, + { + "epoch": 0.95, + "learning_rate": 3.7354911410634466e-08, + "loss": 1.1348, + "step": 31421 + }, + { + "epoch": 0.95, + "learning_rate": 3.731291455703445e-08, + "loss": 1.1467, + "step": 31422 + }, + { + "epoch": 0.95, + "learning_rate": 3.7270941147029284e-08, + "loss": 1.1621, + "step": 31423 + }, + { + "epoch": 0.95, + "learning_rate": 3.722899118101919e-08, + "loss": 1.0722, + "step": 31424 + }, + { + "epoch": 0.95, + "learning_rate": 3.718706465940247e-08, + "loss": 1.1227, + "step": 31425 + }, + { + "epoch": 0.95, + "learning_rate": 3.714516158257908e-08, + "loss": 1.0883, + "step": 31426 + }, + { + "epoch": 0.95, + "learning_rate": 3.710328195094731e-08, + "loss": 1.0999, + "step": 31427 + }, + { + "epoch": 0.95, + "learning_rate": 3.706142576490629e-08, + "loss": 1.0803, + "step": 31428 + }, + { + "epoch": 0.95, + "learning_rate": 3.7019593024854305e-08, + "loss": 1.1499, + "step": 31429 + }, + { + "epoch": 0.95, + "learning_rate": 3.697778373118965e-08, + "loss": 1.1291, + "step": 31430 + }, + { + "epoch": 0.95, + "learning_rate": 3.693599788431007e-08, + "loss": 1.0064, + "step": 31431 + }, + { + "epoch": 0.95, + "learning_rate": 3.689423548461385e-08, + "loss": 1.0197, + "step": 31432 + }, + { + "epoch": 0.95, + "learning_rate": 3.685249653249817e-08, + "loss": 1.0422, + "step": 31433 + }, + { + "epoch": 0.95, + "learning_rate": 3.681078102836022e-08, + "loss": 1.1389, + "step": 31434 + }, + { + "epoch": 0.95, + "learning_rate": 3.6769088972597454e-08, + "loss": 1.1537, + "step": 31435 + }, + { + "epoch": 0.95, + "learning_rate": 3.67274203656065e-08, + "loss": 1.1943, + "step": 31436 + }, + { + "epoch": 0.95, + "learning_rate": 3.6685775207784547e-08, + "loss": 1.0862, + "step": 31437 + }, + { + "epoch": 0.95, + "learning_rate": 3.66441534995271e-08, + "loss": 1.0281, + "step": 31438 + }, + { + "epoch": 0.95, + "learning_rate": 3.660255524123135e-08, + "loss": 1.0544, + "step": 31439 + }, + { + "epoch": 0.95, + "learning_rate": 3.6560980433292537e-08, + "loss": 1.0928, + "step": 31440 + }, + { + "epoch": 0.95, + "learning_rate": 3.651942907610701e-08, + "loss": 1.1208, + "step": 31441 + }, + { + "epoch": 0.95, + "learning_rate": 3.647790117007e-08, + "loss": 1.1169, + "step": 31442 + }, + { + "epoch": 0.95, + "learning_rate": 3.643639671557675e-08, + "loss": 1.1985, + "step": 31443 + }, + { + "epoch": 0.95, + "learning_rate": 3.639491571302251e-08, + "loss": 1.1608, + "step": 31444 + }, + { + "epoch": 0.95, + "learning_rate": 3.635345816280222e-08, + "loss": 1.1265, + "step": 31445 + }, + { + "epoch": 0.95, + "learning_rate": 3.631202406531087e-08, + "loss": 0.9989, + "step": 31446 + }, + { + "epoch": 0.95, + "learning_rate": 3.6270613420942016e-08, + "loss": 1.0878, + "step": 31447 + }, + { + "epoch": 0.95, + "learning_rate": 3.6229226230090345e-08, + "loss": 0.9052, + "step": 31448 + }, + { + "epoch": 0.95, + "learning_rate": 3.618786249314998e-08, + "loss": 1.1171, + "step": 31449 + }, + { + "epoch": 0.95, + "learning_rate": 3.614652221051479e-08, + "loss": 1.1998, + "step": 31450 + }, + { + "epoch": 0.95, + "learning_rate": 3.610520538257778e-08, + "loss": 1.0989, + "step": 31451 + }, + { + "epoch": 0.95, + "learning_rate": 3.6063912009732524e-08, + "loss": 1.0605, + "step": 31452 + }, + { + "epoch": 0.95, + "learning_rate": 3.602264209237233e-08, + "loss": 1.0717, + "step": 31453 + }, + { + "epoch": 0.95, + "learning_rate": 3.598139563088965e-08, + "loss": 1.0312, + "step": 31454 + }, + { + "epoch": 0.95, + "learning_rate": 3.594017262567751e-08, + "loss": 1.2422, + "step": 31455 + }, + { + "epoch": 0.95, + "learning_rate": 3.589897307712836e-08, + "loss": 1.1844, + "step": 31456 + }, + { + "epoch": 0.95, + "learning_rate": 3.585779698563413e-08, + "loss": 1.0809, + "step": 31457 + }, + { + "epoch": 0.95, + "learning_rate": 3.5816644351586715e-08, + "loss": 1.0884, + "step": 31458 + }, + { + "epoch": 0.95, + "learning_rate": 3.577551517537831e-08, + "loss": 1.0977, + "step": 31459 + }, + { + "epoch": 0.95, + "learning_rate": 3.573440945739998e-08, + "loss": 1.1385, + "step": 31460 + }, + { + "epoch": 0.95, + "learning_rate": 3.569332719804336e-08, + "loss": 1.1343, + "step": 31461 + }, + { + "epoch": 0.95, + "learning_rate": 3.5652268397699253e-08, + "loss": 1.0176, + "step": 31462 + }, + { + "epoch": 0.95, + "learning_rate": 3.561123305675901e-08, + "loss": 1.126, + "step": 31463 + }, + { + "epoch": 0.95, + "learning_rate": 3.5570221175612874e-08, + "loss": 1.1039, + "step": 31464 + }, + { + "epoch": 0.95, + "learning_rate": 3.552923275465109e-08, + "loss": 0.976, + "step": 31465 + }, + { + "epoch": 0.95, + "learning_rate": 3.5488267794264173e-08, + "loss": 1.1548, + "step": 31466 + }, + { + "epoch": 0.95, + "learning_rate": 3.54473262948421e-08, + "loss": 1.0455, + "step": 31467 + }, + { + "epoch": 0.95, + "learning_rate": 3.540640825677455e-08, + "loss": 1.1624, + "step": 31468 + }, + { + "epoch": 0.95, + "learning_rate": 3.536551368045066e-08, + "loss": 1.2686, + "step": 31469 + }, + { + "epoch": 0.95, + "learning_rate": 3.532464256626039e-08, + "loss": 0.9628, + "step": 31470 + }, + { + "epoch": 0.95, + "learning_rate": 3.528379491459233e-08, + "loss": 1.0821, + "step": 31471 + }, + { + "epoch": 0.95, + "learning_rate": 3.52429707258356e-08, + "loss": 1.0558, + "step": 31472 + }, + { + "epoch": 0.95, + "learning_rate": 3.520217000037879e-08, + "loss": 1.0612, + "step": 31473 + }, + { + "epoch": 0.95, + "learning_rate": 3.516139273860991e-08, + "loss": 1.1641, + "step": 31474 + }, + { + "epoch": 0.95, + "learning_rate": 3.5120638940917825e-08, + "loss": 1.1937, + "step": 31475 + }, + { + "epoch": 0.95, + "learning_rate": 3.507990860769001e-08, + "loss": 1.1295, + "step": 31476 + }, + { + "epoch": 0.95, + "learning_rate": 3.5039201739314465e-08, + "loss": 1.1244, + "step": 31477 + }, + { + "epoch": 0.95, + "learning_rate": 3.4998518336178125e-08, + "loss": 1.121, + "step": 31478 + }, + { + "epoch": 0.95, + "learning_rate": 3.4957858398668996e-08, + "loss": 1.1971, + "step": 31479 + }, + { + "epoch": 0.95, + "learning_rate": 3.4917221927174005e-08, + "loss": 1.1301, + "step": 31480 + }, + { + "epoch": 0.95, + "learning_rate": 3.48766089220795e-08, + "loss": 1.1052, + "step": 31481 + }, + { + "epoch": 0.95, + "learning_rate": 3.483601938377268e-08, + "loss": 1.0472, + "step": 31482 + }, + { + "epoch": 0.95, + "learning_rate": 3.479545331263961e-08, + "loss": 1.0968, + "step": 31483 + }, + { + "epoch": 0.95, + "learning_rate": 3.4754910709066395e-08, + "loss": 1.0298, + "step": 31484 + }, + { + "epoch": 0.95, + "learning_rate": 3.4714391573439364e-08, + "loss": 1.1024, + "step": 31485 + }, + { + "epoch": 0.95, + "learning_rate": 3.467389590614378e-08, + "loss": 1.0484, + "step": 31486 + }, + { + "epoch": 0.95, + "learning_rate": 3.463342370756545e-08, + "loss": 1.2637, + "step": 31487 + }, + { + "epoch": 0.95, + "learning_rate": 3.459297497808961e-08, + "loss": 1.1083, + "step": 31488 + }, + { + "epoch": 0.95, + "learning_rate": 3.4552549718101235e-08, + "loss": 1.1856, + "step": 31489 + }, + { + "epoch": 0.95, + "learning_rate": 3.45121479279853e-08, + "loss": 1.145, + "step": 31490 + }, + { + "epoch": 0.95, + "learning_rate": 3.44717696081262e-08, + "loss": 0.9855, + "step": 31491 + }, + { + "epoch": 0.95, + "learning_rate": 3.443141475890838e-08, + "loss": 1.1926, + "step": 31492 + }, + { + "epoch": 0.95, + "learning_rate": 3.4391083380716226e-08, + "loss": 1.1484, + "step": 31493 + }, + { + "epoch": 0.95, + "learning_rate": 3.435077547393334e-08, + "loss": 1.0171, + "step": 31494 + }, + { + "epoch": 0.95, + "learning_rate": 3.4310491038943295e-08, + "loss": 1.1702, + "step": 31495 + }, + { + "epoch": 0.95, + "learning_rate": 3.427023007613023e-08, + "loss": 1.0646, + "step": 31496 + }, + { + "epoch": 0.95, + "learning_rate": 3.4229992585876894e-08, + "loss": 1.0496, + "step": 31497 + }, + { + "epoch": 0.95, + "learning_rate": 3.418977856856659e-08, + "loss": 1.2072, + "step": 31498 + }, + { + "epoch": 0.95, + "learning_rate": 3.4149588024581795e-08, + "loss": 1.1514, + "step": 31499 + }, + { + "epoch": 0.95, + "learning_rate": 3.410942095430553e-08, + "loss": 1.1168, + "step": 31500 + }, + { + "epoch": 0.95, + "learning_rate": 3.406927735811999e-08, + "loss": 1.1107, + "step": 31501 + }, + { + "epoch": 0.95, + "learning_rate": 3.402915723640737e-08, + "loss": 1.0904, + "step": 31502 + }, + { + "epoch": 0.95, + "learning_rate": 3.398906058954932e-08, + "loss": 1.0551, + "step": 31503 + }, + { + "epoch": 0.95, + "learning_rate": 3.394898741792774e-08, + "loss": 1.1683, + "step": 31504 + }, + { + "epoch": 0.95, + "learning_rate": 3.3908937721923996e-08, + "loss": 1.0784, + "step": 31505 + }, + { + "epoch": 0.95, + "learning_rate": 3.3868911501919734e-08, + "loss": 1.1148, + "step": 31506 + }, + { + "epoch": 0.95, + "learning_rate": 3.382890875829575e-08, + "loss": 0.9568, + "step": 31507 + }, + { + "epoch": 0.95, + "learning_rate": 3.378892949143259e-08, + "loss": 1.1003, + "step": 31508 + }, + { + "epoch": 0.95, + "learning_rate": 3.374897370171104e-08, + "loss": 1.0888, + "step": 31509 + }, + { + "epoch": 0.95, + "learning_rate": 3.370904138951137e-08, + "loss": 1.0776, + "step": 31510 + }, + { + "epoch": 0.95, + "learning_rate": 3.366913255521409e-08, + "loss": 1.0456, + "step": 31511 + }, + { + "epoch": 0.95, + "learning_rate": 3.3629247199198636e-08, + "loss": 1.1575, + "step": 31512 + }, + { + "epoch": 0.95, + "learning_rate": 3.358938532184497e-08, + "loss": 1.0754, + "step": 31513 + }, + { + "epoch": 0.95, + "learning_rate": 3.3549546923532516e-08, + "loss": 1.129, + "step": 31514 + }, + { + "epoch": 0.95, + "learning_rate": 3.3509732004640696e-08, + "loss": 1.1734, + "step": 31515 + }, + { + "epoch": 0.95, + "learning_rate": 3.3469940565548085e-08, + "loss": 0.99, + "step": 31516 + }, + { + "epoch": 0.95, + "learning_rate": 3.343017260663356e-08, + "loss": 1.1145, + "step": 31517 + }, + { + "epoch": 0.95, + "learning_rate": 3.3390428128275974e-08, + "loss": 1.0988, + "step": 31518 + }, + { + "epoch": 0.95, + "learning_rate": 3.335070713085392e-08, + "loss": 1.0905, + "step": 31519 + }, + { + "epoch": 0.95, + "learning_rate": 3.3311009614744874e-08, + "loss": 1.0893, + "step": 31520 + }, + { + "epoch": 0.95, + "learning_rate": 3.327133558032686e-08, + "loss": 1.1277, + "step": 31521 + }, + { + "epoch": 0.95, + "learning_rate": 3.3231685027977913e-08, + "loss": 1.0746, + "step": 31522 + }, + { + "epoch": 0.95, + "learning_rate": 3.319205795807523e-08, + "loss": 1.0671, + "step": 31523 + }, + { + "epoch": 0.95, + "learning_rate": 3.315245437099629e-08, + "loss": 1.2902, + "step": 31524 + }, + { + "epoch": 0.95, + "learning_rate": 3.3112874267117736e-08, + "loss": 1.2043, + "step": 31525 + }, + { + "epoch": 0.95, + "learning_rate": 3.307331764681648e-08, + "loss": 1.1623, + "step": 31526 + }, + { + "epoch": 0.95, + "learning_rate": 3.303378451046918e-08, + "loss": 1.0027, + "step": 31527 + }, + { + "epoch": 0.95, + "learning_rate": 3.2994274858452194e-08, + "loss": 1.0967, + "step": 31528 + }, + { + "epoch": 0.95, + "learning_rate": 3.295478869114133e-08, + "loss": 1.072, + "step": 31529 + }, + { + "epoch": 0.95, + "learning_rate": 3.291532600891295e-08, + "loss": 1.0264, + "step": 31530 + }, + { + "epoch": 0.95, + "learning_rate": 3.287588681214232e-08, + "loss": 1.1513, + "step": 31531 + }, + { + "epoch": 0.95, + "learning_rate": 3.283647110120525e-08, + "loss": 1.0728, + "step": 31532 + }, + { + "epoch": 0.95, + "learning_rate": 3.279707887647643e-08, + "loss": 1.1151, + "step": 31533 + }, + { + "epoch": 0.95, + "learning_rate": 3.27577101383314e-08, + "loss": 1.1074, + "step": 31534 + }, + { + "epoch": 0.95, + "learning_rate": 3.271836488714458e-08, + "loss": 1.0071, + "step": 31535 + }, + { + "epoch": 0.95, + "learning_rate": 3.2679043123290676e-08, + "loss": 1.1661, + "step": 31536 + }, + { + "epoch": 0.95, + "learning_rate": 3.2639744847144105e-08, + "loss": 1.0304, + "step": 31537 + }, + { + "epoch": 0.95, + "learning_rate": 3.260047005907874e-08, + "loss": 1.144, + "step": 31538 + }, + { + "epoch": 0.95, + "learning_rate": 3.256121875946844e-08, + "loss": 1.188, + "step": 31539 + }, + { + "epoch": 0.95, + "learning_rate": 3.2521990948687074e-08, + "loss": 1.0489, + "step": 31540 + }, + { + "epoch": 0.95, + "learning_rate": 3.2482786627108246e-08, + "loss": 1.0306, + "step": 31541 + }, + { + "epoch": 0.95, + "learning_rate": 3.2443605795104414e-08, + "loss": 1.108, + "step": 31542 + }, + { + "epoch": 0.95, + "learning_rate": 3.2404448453049185e-08, + "loss": 1.0966, + "step": 31543 + }, + { + "epoch": 0.95, + "learning_rate": 3.236531460131531e-08, + "loss": 0.9435, + "step": 31544 + }, + { + "epoch": 0.95, + "learning_rate": 3.2326204240275275e-08, + "loss": 1.0588, + "step": 31545 + }, + { + "epoch": 0.95, + "learning_rate": 3.228711737030127e-08, + "loss": 1.0668, + "step": 31546 + }, + { + "epoch": 0.95, + "learning_rate": 3.224805399176523e-08, + "loss": 1.0993, + "step": 31547 + }, + { + "epoch": 0.95, + "learning_rate": 3.220901410503935e-08, + "loss": 1.1986, + "step": 31548 + }, + { + "epoch": 0.95, + "learning_rate": 3.2169997710495007e-08, + "loss": 1.0876, + "step": 31549 + }, + { + "epoch": 0.95, + "learning_rate": 3.213100480850384e-08, + "loss": 1.0823, + "step": 31550 + }, + { + "epoch": 0.95, + "learning_rate": 3.209203539943695e-08, + "loss": 1.1413, + "step": 31551 + }, + { + "epoch": 0.95, + "learning_rate": 3.2053089483665145e-08, + "loss": 1.1374, + "step": 31552 + }, + { + "epoch": 0.95, + "learning_rate": 3.201416706155952e-08, + "loss": 1.0918, + "step": 31553 + }, + { + "epoch": 0.95, + "learning_rate": 3.1975268133490334e-08, + "loss": 1.1027, + "step": 31554 + }, + { + "epoch": 0.95, + "learning_rate": 3.193639269982785e-08, + "loss": 1.1232, + "step": 31555 + }, + { + "epoch": 0.95, + "learning_rate": 3.1897540760942316e-08, + "loss": 1.1776, + "step": 31556 + }, + { + "epoch": 0.95, + "learning_rate": 3.1858712317203445e-08, + "loss": 1.0901, + "step": 31557 + }, + { + "epoch": 0.95, + "learning_rate": 3.181990736898122e-08, + "loss": 1.0369, + "step": 31558 + }, + { + "epoch": 0.95, + "learning_rate": 3.1781125916644506e-08, + "loss": 1.1297, + "step": 31559 + }, + { + "epoch": 0.95, + "learning_rate": 3.1742367960562734e-08, + "loss": 1.1437, + "step": 31560 + }, + { + "epoch": 0.95, + "learning_rate": 3.170363350110506e-08, + "loss": 1.1476, + "step": 31561 + }, + { + "epoch": 0.95, + "learning_rate": 3.1664922538639786e-08, + "loss": 1.1649, + "step": 31562 + }, + { + "epoch": 0.95, + "learning_rate": 3.1626235073535794e-08, + "loss": 1.1917, + "step": 31563 + }, + { + "epoch": 0.95, + "learning_rate": 3.158757110616112e-08, + "loss": 1.0338, + "step": 31564 + }, + { + "epoch": 0.95, + "learning_rate": 3.154893063688408e-08, + "loss": 1.0951, + "step": 31565 + }, + { + "epoch": 0.95, + "learning_rate": 3.151031366607243e-08, + "loss": 1.0902, + "step": 31566 + }, + { + "epoch": 0.95, + "learning_rate": 3.1471720194093393e-08, + "loss": 1.0631, + "step": 31567 + }, + { + "epoch": 0.95, + "learning_rate": 3.143315022131499e-08, + "loss": 1.1923, + "step": 31568 + }, + { + "epoch": 0.95, + "learning_rate": 3.139460374810388e-08, + "loss": 1.1141, + "step": 31569 + }, + { + "epoch": 0.95, + "learning_rate": 3.135608077482727e-08, + "loss": 1.0709, + "step": 31570 + }, + { + "epoch": 0.95, + "learning_rate": 3.131758130185209e-08, + "loss": 1.0577, + "step": 31571 + }, + { + "epoch": 0.95, + "learning_rate": 3.1279105329544424e-08, + "loss": 1.1088, + "step": 31572 + }, + { + "epoch": 0.95, + "learning_rate": 3.124065285827066e-08, + "loss": 1.0387, + "step": 31573 + }, + { + "epoch": 0.95, + "learning_rate": 3.120222388839689e-08, + "loss": 1.1251, + "step": 31574 + }, + { + "epoch": 0.95, + "learning_rate": 3.116381842028893e-08, + "loss": 1.1627, + "step": 31575 + }, + { + "epoch": 0.95, + "learning_rate": 3.1125436454312596e-08, + "loss": 1.0859, + "step": 31576 + }, + { + "epoch": 0.95, + "learning_rate": 3.1087077990832884e-08, + "loss": 1.0309, + "step": 31577 + }, + { + "epoch": 0.95, + "learning_rate": 3.1048743030215045e-08, + "loss": 1.0637, + "step": 31578 + }, + { + "epoch": 0.95, + "learning_rate": 3.1010431572824076e-08, + "loss": 1.172, + "step": 31579 + }, + { + "epoch": 0.95, + "learning_rate": 3.097214361902495e-08, + "loss": 0.9759, + "step": 31580 + }, + { + "epoch": 0.95, + "learning_rate": 3.093387916918156e-08, + "loss": 1.1745, + "step": 31581 + }, + { + "epoch": 0.95, + "learning_rate": 3.08956382236586e-08, + "loss": 1.0676, + "step": 31582 + }, + { + "epoch": 0.95, + "learning_rate": 3.0857420782819946e-08, + "loss": 1.0638, + "step": 31583 + }, + { + "epoch": 0.95, + "learning_rate": 3.0819226847029756e-08, + "loss": 1.1385, + "step": 31584 + }, + { + "epoch": 0.95, + "learning_rate": 3.078105641665108e-08, + "loss": 1.0262, + "step": 31585 + }, + { + "epoch": 0.95, + "learning_rate": 3.07429094920475e-08, + "loss": 1.0513, + "step": 31586 + }, + { + "epoch": 0.95, + "learning_rate": 3.070478607358235e-08, + "loss": 1.2334, + "step": 31587 + }, + { + "epoch": 0.95, + "learning_rate": 3.0666686161618385e-08, + "loss": 1.1061, + "step": 31588 + }, + { + "epoch": 0.95, + "learning_rate": 3.062860975651838e-08, + "loss": 1.0944, + "step": 31589 + }, + { + "epoch": 0.95, + "learning_rate": 3.0590556858644535e-08, + "loss": 0.9818, + "step": 31590 + }, + { + "epoch": 0.95, + "learning_rate": 3.055252746835907e-08, + "loss": 1.1486, + "step": 31591 + }, + { + "epoch": 0.95, + "learning_rate": 3.051452158602447e-08, + "loss": 1.2701, + "step": 31592 + }, + { + "epoch": 0.95, + "learning_rate": 3.047653921200211e-08, + "loss": 1.1021, + "step": 31593 + }, + { + "epoch": 0.95, + "learning_rate": 3.043858034665392e-08, + "loss": 1.0496, + "step": 31594 + }, + { + "epoch": 0.95, + "learning_rate": 3.040064499034101e-08, + "loss": 1.1465, + "step": 31595 + }, + { + "epoch": 0.95, + "learning_rate": 3.036273314342447e-08, + "loss": 1.1174, + "step": 31596 + }, + { + "epoch": 0.95, + "learning_rate": 3.032484480626569e-08, + "loss": 1.1791, + "step": 31597 + }, + { + "epoch": 0.95, + "learning_rate": 3.028697997922464e-08, + "loss": 1.063, + "step": 31598 + }, + { + "epoch": 0.95, + "learning_rate": 3.024913866266216e-08, + "loss": 1.1036, + "step": 31599 + }, + { + "epoch": 0.95, + "learning_rate": 3.021132085693823e-08, + "loss": 1.0618, + "step": 31600 + }, + { + "epoch": 0.95, + "learning_rate": 3.0173526562413125e-08, + "loss": 1.0566, + "step": 31601 + }, + { + "epoch": 0.95, + "learning_rate": 3.013575577944655e-08, + "loss": 1.1265, + "step": 31602 + }, + { + "epoch": 0.95, + "learning_rate": 3.0098008508398226e-08, + "loss": 1.1, + "step": 31603 + }, + { + "epoch": 0.95, + "learning_rate": 3.006028474962702e-08, + "loss": 1.1471, + "step": 31604 + }, + { + "epoch": 0.95, + "learning_rate": 3.002258450349238e-08, + "loss": 1.0576, + "step": 31605 + }, + { + "epoch": 0.95, + "learning_rate": 2.998490777035346e-08, + "loss": 1.1082, + "step": 31606 + }, + { + "epoch": 0.95, + "learning_rate": 2.99472545505683e-08, + "loss": 1.0843, + "step": 31607 + }, + { + "epoch": 0.95, + "learning_rate": 2.990962484449578e-08, + "loss": 1.1512, + "step": 31608 + }, + { + "epoch": 0.95, + "learning_rate": 2.987201865249395e-08, + "loss": 1.038, + "step": 31609 + }, + { + "epoch": 0.95, + "learning_rate": 2.9834435974921136e-08, + "loss": 1.1807, + "step": 31610 + }, + { + "epoch": 0.95, + "learning_rate": 2.9796876812134557e-08, + "loss": 1.089, + "step": 31611 + }, + { + "epoch": 0.95, + "learning_rate": 2.9759341164491973e-08, + "loss": 1.0756, + "step": 31612 + }, + { + "epoch": 0.95, + "learning_rate": 2.9721829032350602e-08, + "loss": 1.1522, + "step": 31613 + }, + { + "epoch": 0.95, + "learning_rate": 2.9684340416067936e-08, + "loss": 1.1628, + "step": 31614 + }, + { + "epoch": 0.95, + "learning_rate": 2.964687531600091e-08, + "loss": 1.0606, + "step": 31615 + }, + { + "epoch": 0.95, + "learning_rate": 2.9609433732505354e-08, + "loss": 1.0796, + "step": 31616 + }, + { + "epoch": 0.95, + "learning_rate": 2.957201566593848e-08, + "loss": 1.1301, + "step": 31617 + }, + { + "epoch": 0.95, + "learning_rate": 2.9534621116655837e-08, + "loss": 1.1014, + "step": 31618 + }, + { + "epoch": 0.95, + "learning_rate": 2.9497250085014083e-08, + "loss": 1.1918, + "step": 31619 + }, + { + "epoch": 0.95, + "learning_rate": 2.945990257136877e-08, + "loss": 1.2373, + "step": 31620 + }, + { + "epoch": 0.95, + "learning_rate": 2.9422578576075167e-08, + "loss": 1.1245, + "step": 31621 + }, + { + "epoch": 0.95, + "learning_rate": 2.9385278099488825e-08, + "loss": 1.0057, + "step": 31622 + }, + { + "epoch": 0.95, + "learning_rate": 2.9348001141964733e-08, + "loss": 1.0936, + "step": 31623 + }, + { + "epoch": 0.95, + "learning_rate": 2.931074770385761e-08, + "loss": 1.0774, + "step": 31624 + }, + { + "epoch": 0.95, + "learning_rate": 2.9273517785522453e-08, + "loss": 1.0558, + "step": 31625 + }, + { + "epoch": 0.95, + "learning_rate": 2.923631138731342e-08, + "loss": 1.1724, + "step": 31626 + }, + { + "epoch": 0.95, + "learning_rate": 2.9199128509584673e-08, + "loss": 1.1647, + "step": 31627 + }, + { + "epoch": 0.95, + "learning_rate": 2.916196915269037e-08, + "loss": 1.0874, + "step": 31628 + }, + { + "epoch": 0.95, + "learning_rate": 2.9124833316984125e-08, + "loss": 1.1579, + "step": 31629 + }, + { + "epoch": 0.95, + "learning_rate": 2.908772100281926e-08, + "loss": 1.1281, + "step": 31630 + }, + { + "epoch": 0.95, + "learning_rate": 2.905063221054938e-08, + "loss": 1.0004, + "step": 31631 + }, + { + "epoch": 0.95, + "learning_rate": 2.901356694052754e-08, + "loss": 1.0513, + "step": 31632 + }, + { + "epoch": 0.95, + "learning_rate": 2.897652519310623e-08, + "loss": 1.1047, + "step": 31633 + }, + { + "epoch": 0.95, + "learning_rate": 2.8939506968638507e-08, + "loss": 1.0131, + "step": 31634 + }, + { + "epoch": 0.95, + "learning_rate": 2.8902512267476313e-08, + "loss": 1.0767, + "step": 31635 + }, + { + "epoch": 0.95, + "learning_rate": 2.8865541089972416e-08, + "loss": 1.0568, + "step": 31636 + }, + { + "epoch": 0.95, + "learning_rate": 2.8828593436478204e-08, + "loss": 1.244, + "step": 31637 + }, + { + "epoch": 0.95, + "learning_rate": 2.8791669307345893e-08, + "loss": 1.1074, + "step": 31638 + }, + { + "epoch": 0.95, + "learning_rate": 2.8754768702926316e-08, + "loss": 1.0723, + "step": 31639 + }, + { + "epoch": 0.95, + "learning_rate": 2.8717891623571413e-08, + "loss": 1.1467, + "step": 31640 + }, + { + "epoch": 0.95, + "learning_rate": 2.8681038069632017e-08, + "loss": 1.0777, + "step": 31641 + }, + { + "epoch": 0.95, + "learning_rate": 2.8644208041458678e-08, + "loss": 1.0977, + "step": 31642 + }, + { + "epoch": 0.95, + "learning_rate": 2.86074015394025e-08, + "loss": 1.0938, + "step": 31643 + }, + { + "epoch": 0.95, + "learning_rate": 2.857061856381349e-08, + "loss": 1.2059, + "step": 31644 + }, + { + "epoch": 0.95, + "learning_rate": 2.8533859115041918e-08, + "loss": 1.1918, + "step": 31645 + }, + { + "epoch": 0.95, + "learning_rate": 2.8497123193437503e-08, + "loss": 1.0439, + "step": 31646 + }, + { + "epoch": 0.95, + "learning_rate": 2.8460410799350524e-08, + "loss": 1.0013, + "step": 31647 + }, + { + "epoch": 0.95, + "learning_rate": 2.8423721933129867e-08, + "loss": 1.059, + "step": 31648 + }, + { + "epoch": 0.95, + "learning_rate": 2.8387056595124974e-08, + "loss": 1.1011, + "step": 31649 + }, + { + "epoch": 0.95, + "learning_rate": 2.835041478568501e-08, + "loss": 1.1841, + "step": 31650 + }, + { + "epoch": 0.95, + "learning_rate": 2.8313796505158587e-08, + "loss": 1.0979, + "step": 31651 + }, + { + "epoch": 0.95, + "learning_rate": 2.827720175389459e-08, + "loss": 0.9609, + "step": 31652 + }, + { + "epoch": 0.95, + "learning_rate": 2.8240630532241354e-08, + "loss": 1.1073, + "step": 31653 + }, + { + "epoch": 0.95, + "learning_rate": 2.8204082840546655e-08, + "loss": 1.1108, + "step": 31654 + }, + { + "epoch": 0.95, + "learning_rate": 2.8167558679158547e-08, + "loss": 1.1296, + "step": 31655 + }, + { + "epoch": 0.95, + "learning_rate": 2.8131058048424808e-08, + "loss": 1.1682, + "step": 31656 + }, + { + "epoch": 0.95, + "learning_rate": 2.809458094869294e-08, + "loss": 1.1203, + "step": 31657 + }, + { + "epoch": 0.95, + "learning_rate": 2.805812738031044e-08, + "loss": 1.0108, + "step": 31658 + }, + { + "epoch": 0.95, + "learning_rate": 2.8021697343623976e-08, + "loss": 1.0049, + "step": 31659 + }, + { + "epoch": 0.95, + "learning_rate": 2.7985290838980217e-08, + "loss": 1.1871, + "step": 31660 + }, + { + "epoch": 0.95, + "learning_rate": 2.7948907866725826e-08, + "loss": 1.0908, + "step": 31661 + }, + { + "epoch": 0.95, + "learning_rate": 2.7912548427207474e-08, + "loss": 1.0544, + "step": 31662 + }, + { + "epoch": 0.95, + "learning_rate": 2.7876212520770996e-08, + "loss": 1.2231, + "step": 31663 + }, + { + "epoch": 0.95, + "learning_rate": 2.7839900147762222e-08, + "loss": 1.0737, + "step": 31664 + }, + { + "epoch": 0.95, + "learning_rate": 2.7803611308527268e-08, + "loss": 1.1772, + "step": 31665 + }, + { + "epoch": 0.95, + "learning_rate": 2.776734600341113e-08, + "loss": 1.0494, + "step": 31666 + }, + { + "epoch": 0.95, + "learning_rate": 2.7731104232759097e-08, + "loss": 1.1582, + "step": 31667 + }, + { + "epoch": 0.95, + "learning_rate": 2.7694885996916444e-08, + "loss": 1.1364, + "step": 31668 + }, + { + "epoch": 0.95, + "learning_rate": 2.7658691296227612e-08, + "loss": 1.0491, + "step": 31669 + }, + { + "epoch": 0.95, + "learning_rate": 2.7622520131037335e-08, + "loss": 1.0371, + "step": 31670 + }, + { + "epoch": 0.95, + "learning_rate": 2.758637250169005e-08, + "loss": 1.0009, + "step": 31671 + }, + { + "epoch": 0.95, + "learning_rate": 2.7550248408529656e-08, + "loss": 1.0231, + "step": 31672 + }, + { + "epoch": 0.95, + "learning_rate": 2.7514147851900043e-08, + "loss": 1.161, + "step": 31673 + }, + { + "epoch": 0.95, + "learning_rate": 2.7478070832145098e-08, + "loss": 1.1445, + "step": 31674 + }, + { + "epoch": 0.95, + "learning_rate": 2.7442017349607887e-08, + "loss": 1.0769, + "step": 31675 + }, + { + "epoch": 0.95, + "learning_rate": 2.7405987404632016e-08, + "loss": 1.0546, + "step": 31676 + }, + { + "epoch": 0.95, + "learning_rate": 2.7369980997560274e-08, + "loss": 1.0065, + "step": 31677 + }, + { + "epoch": 0.95, + "learning_rate": 2.733399812873544e-08, + "loss": 1.0503, + "step": 31678 + }, + { + "epoch": 0.95, + "learning_rate": 2.729803879850029e-08, + "loss": 1.0737, + "step": 31679 + }, + { + "epoch": 0.95, + "learning_rate": 2.7262103007196507e-08, + "loss": 1.1865, + "step": 31680 + }, + { + "epoch": 0.95, + "learning_rate": 2.722619075516686e-08, + "loss": 1.183, + "step": 31681 + }, + { + "epoch": 0.95, + "learning_rate": 2.7190302042753026e-08, + "loss": 1.0958, + "step": 31682 + }, + { + "epoch": 0.95, + "learning_rate": 2.7154436870296396e-08, + "loss": 1.0705, + "step": 31683 + }, + { + "epoch": 0.95, + "learning_rate": 2.7118595238138644e-08, + "loss": 1.2155, + "step": 31684 + }, + { + "epoch": 0.95, + "learning_rate": 2.7082777146620887e-08, + "loss": 1.0048, + "step": 31685 + }, + { + "epoch": 0.95, + "learning_rate": 2.704698259608396e-08, + "loss": 1.0698, + "step": 31686 + }, + { + "epoch": 0.95, + "learning_rate": 2.701121158686898e-08, + "loss": 1.2202, + "step": 31687 + }, + { + "epoch": 0.95, + "learning_rate": 2.697546411931623e-08, + "loss": 1.1172, + "step": 31688 + }, + { + "epoch": 0.95, + "learning_rate": 2.6939740193765717e-08, + "loss": 1.0899, + "step": 31689 + }, + { + "epoch": 0.95, + "learning_rate": 2.6904039810558e-08, + "loss": 1.1354, + "step": 31690 + }, + { + "epoch": 0.95, + "learning_rate": 2.6868362970032536e-08, + "loss": 1.0944, + "step": 31691 + }, + { + "epoch": 0.95, + "learning_rate": 2.68327096725296e-08, + "loss": 1.139, + "step": 31692 + }, + { + "epoch": 0.95, + "learning_rate": 2.6797079918387814e-08, + "loss": 1.0884, + "step": 31693 + }, + { + "epoch": 0.95, + "learning_rate": 2.676147370794663e-08, + "loss": 1.0737, + "step": 31694 + }, + { + "epoch": 0.95, + "learning_rate": 2.6725891041545215e-08, + "loss": 1.1564, + "step": 31695 + }, + { + "epoch": 0.95, + "learning_rate": 2.6690331919522195e-08, + "loss": 1.0555, + "step": 31696 + }, + { + "epoch": 0.95, + "learning_rate": 2.6654796342215906e-08, + "loss": 0.9927, + "step": 31697 + }, + { + "epoch": 0.95, + "learning_rate": 2.6619284309964967e-08, + "loss": 1.1092, + "step": 31698 + }, + { + "epoch": 0.95, + "learning_rate": 2.6583795823106883e-08, + "loss": 1.0738, + "step": 31699 + }, + { + "epoch": 0.95, + "learning_rate": 2.654833088198e-08, + "loss": 0.8464, + "step": 31700 + }, + { + "epoch": 0.95, + "learning_rate": 2.651288948692182e-08, + "loss": 1.0446, + "step": 31701 + }, + { + "epoch": 0.96, + "learning_rate": 2.647747163826958e-08, + "loss": 1.0563, + "step": 31702 + }, + { + "epoch": 0.96, + "learning_rate": 2.6442077336360507e-08, + "loss": 1.0753, + "step": 31703 + }, + { + "epoch": 0.96, + "learning_rate": 2.640670658153155e-08, + "loss": 1.025, + "step": 31704 + }, + { + "epoch": 0.96, + "learning_rate": 2.637135937411939e-08, + "loss": 1.0263, + "step": 31705 + }, + { + "epoch": 0.96, + "learning_rate": 2.6336035714460694e-08, + "loss": 1.2407, + "step": 31706 + }, + { + "epoch": 0.96, + "learning_rate": 2.6300735602891592e-08, + "loss": 1.0504, + "step": 31707 + }, + { + "epoch": 0.96, + "learning_rate": 2.626545903974792e-08, + "loss": 1.095, + "step": 31708 + }, + { + "epoch": 0.96, + "learning_rate": 2.62302060253658e-08, + "loss": 1.0777, + "step": 31709 + }, + { + "epoch": 0.96, + "learning_rate": 2.61949765600808e-08, + "loss": 1.0698, + "step": 31710 + }, + { + "epoch": 0.96, + "learning_rate": 2.615977064422792e-08, + "loss": 1.0461, + "step": 31711 + }, + { + "epoch": 0.96, + "learning_rate": 2.612458827814274e-08, + "loss": 1.0748, + "step": 31712 + }, + { + "epoch": 0.96, + "learning_rate": 2.6089429462159977e-08, + "loss": 1.1604, + "step": 31713 + }, + { + "epoch": 0.96, + "learning_rate": 2.6054294196614648e-08, + "loss": 0.982, + "step": 31714 + }, + { + "epoch": 0.96, + "learning_rate": 2.6019182481840656e-08, + "loss": 1.0074, + "step": 31715 + }, + { + "epoch": 0.96, + "learning_rate": 2.5984094318172726e-08, + "loss": 1.1023, + "step": 31716 + }, + { + "epoch": 0.96, + "learning_rate": 2.5949029705944485e-08, + "loss": 1.0792, + "step": 31717 + }, + { + "epoch": 0.96, + "learning_rate": 2.5913988645490106e-08, + "loss": 1.0964, + "step": 31718 + }, + { + "epoch": 0.96, + "learning_rate": 2.587897113714294e-08, + "loss": 1.1261, + "step": 31719 + }, + { + "epoch": 0.96, + "learning_rate": 2.5843977181236323e-08, + "loss": 1.061, + "step": 31720 + }, + { + "epoch": 0.96, + "learning_rate": 2.580900677810333e-08, + "loss": 1.0582, + "step": 31721 + }, + { + "epoch": 0.96, + "learning_rate": 2.5774059928077022e-08, + "loss": 0.9902, + "step": 31722 + }, + { + "epoch": 0.96, + "learning_rate": 2.573913663149047e-08, + "loss": 1.0526, + "step": 31723 + }, + { + "epoch": 0.96, + "learning_rate": 2.570423688867535e-08, + "loss": 1.2159, + "step": 31724 + }, + { + "epoch": 0.96, + "learning_rate": 2.5669360699964174e-08, + "loss": 1.1601, + "step": 31725 + }, + { + "epoch": 0.96, + "learning_rate": 2.56345080656889e-08, + "loss": 1.0591, + "step": 31726 + }, + { + "epoch": 0.96, + "learning_rate": 2.5599678986181764e-08, + "loss": 1.0803, + "step": 31727 + }, + { + "epoch": 0.96, + "learning_rate": 2.5564873461773888e-08, + "loss": 0.9761, + "step": 31728 + }, + { + "epoch": 0.96, + "learning_rate": 2.5530091492796672e-08, + "loss": 1.0788, + "step": 31729 + }, + { + "epoch": 0.96, + "learning_rate": 2.5495333079580963e-08, + "loss": 1.0491, + "step": 31730 + }, + { + "epoch": 0.96, + "learning_rate": 2.5460598222458165e-08, + "loss": 1.1404, + "step": 31731 + }, + { + "epoch": 0.96, + "learning_rate": 2.542588692175857e-08, + "loss": 1.1196, + "step": 31732 + }, + { + "epoch": 0.96, + "learning_rate": 2.539119917781302e-08, + "loss": 1.0057, + "step": 31733 + }, + { + "epoch": 0.96, + "learning_rate": 2.5356534990950976e-08, + "loss": 1.0253, + "step": 31734 + }, + { + "epoch": 0.96, + "learning_rate": 2.5321894361503285e-08, + "loss": 1.0493, + "step": 31735 + }, + { + "epoch": 0.96, + "learning_rate": 2.5287277289799405e-08, + "loss": 1.0596, + "step": 31736 + }, + { + "epoch": 0.96, + "learning_rate": 2.525268377616852e-08, + "loss": 1.1375, + "step": 31737 + }, + { + "epoch": 0.96, + "learning_rate": 2.521811382094008e-08, + "loss": 1.0651, + "step": 31738 + }, + { + "epoch": 0.96, + "learning_rate": 2.5183567424443554e-08, + "loss": 1.0018, + "step": 31739 + }, + { + "epoch": 0.96, + "learning_rate": 2.5149044587007564e-08, + "loss": 0.9858, + "step": 31740 + }, + { + "epoch": 0.96, + "learning_rate": 2.511454530896046e-08, + "loss": 1.0278, + "step": 31741 + }, + { + "epoch": 0.96, + "learning_rate": 2.508006959063114e-08, + "loss": 1.1755, + "step": 31742 + }, + { + "epoch": 0.96, + "learning_rate": 2.504561743234768e-08, + "loss": 1.0969, + "step": 31743 + }, + { + "epoch": 0.96, + "learning_rate": 2.501118883443787e-08, + "loss": 1.0486, + "step": 31744 + }, + { + "epoch": 0.96, + "learning_rate": 2.497678379722951e-08, + "loss": 1.09, + "step": 31745 + }, + { + "epoch": 0.96, + "learning_rate": 2.4942402321050384e-08, + "loss": 1.0377, + "step": 31746 + }, + { + "epoch": 0.96, + "learning_rate": 2.4908044406227182e-08, + "loss": 1.1124, + "step": 31747 + }, + { + "epoch": 0.96, + "learning_rate": 2.4873710053087418e-08, + "loss": 1.0762, + "step": 31748 + }, + { + "epoch": 0.96, + "learning_rate": 2.483939926195833e-08, + "loss": 1.0595, + "step": 31749 + }, + { + "epoch": 0.96, + "learning_rate": 2.480511203316577e-08, + "loss": 0.9999, + "step": 31750 + }, + { + "epoch": 0.96, + "learning_rate": 2.4770848367036136e-08, + "loss": 1.1481, + "step": 31751 + }, + { + "epoch": 0.96, + "learning_rate": 2.47366082638964e-08, + "loss": 1.0366, + "step": 31752 + }, + { + "epoch": 0.96, + "learning_rate": 2.4702391724071852e-08, + "loss": 1.0785, + "step": 31753 + }, + { + "epoch": 0.96, + "learning_rate": 2.466819874788834e-08, + "loss": 1.1629, + "step": 31754 + }, + { + "epoch": 0.96, + "learning_rate": 2.4634029335671438e-08, + "loss": 1.1249, + "step": 31755 + }, + { + "epoch": 0.96, + "learning_rate": 2.4599883487746447e-08, + "loss": 1.1742, + "step": 31756 + }, + { + "epoch": 0.96, + "learning_rate": 2.4565761204438098e-08, + "loss": 1.1256, + "step": 31757 + }, + { + "epoch": 0.96, + "learning_rate": 2.4531662486071695e-08, + "loss": 1.1662, + "step": 31758 + }, + { + "epoch": 0.96, + "learning_rate": 2.4497587332971695e-08, + "loss": 1.177, + "step": 31759 + }, + { + "epoch": 0.96, + "learning_rate": 2.4463535745462286e-08, + "loss": 1.1479, + "step": 31760 + }, + { + "epoch": 0.96, + "learning_rate": 2.442950772386793e-08, + "loss": 1.0605, + "step": 31761 + }, + { + "epoch": 0.96, + "learning_rate": 2.4395503268512534e-08, + "loss": 1.1359, + "step": 31762 + }, + { + "epoch": 0.96, + "learning_rate": 2.436152237971945e-08, + "loss": 1.1656, + "step": 31763 + }, + { + "epoch": 0.96, + "learning_rate": 2.4327565057812306e-08, + "loss": 1.0228, + "step": 31764 + }, + { + "epoch": 0.96, + "learning_rate": 2.4293631303114463e-08, + "loss": 1.0923, + "step": 31765 + }, + { + "epoch": 0.96, + "learning_rate": 2.4259721115948987e-08, + "loss": 1.0938, + "step": 31766 + }, + { + "epoch": 0.96, + "learning_rate": 2.42258344966384e-08, + "loss": 0.996, + "step": 31767 + }, + { + "epoch": 0.96, + "learning_rate": 2.4191971445505502e-08, + "loss": 1.1548, + "step": 31768 + }, + { + "epoch": 0.96, + "learning_rate": 2.415813196287281e-08, + "loss": 1.1227, + "step": 31769 + }, + { + "epoch": 0.96, + "learning_rate": 2.412431604906257e-08, + "loss": 0.9696, + "step": 31770 + }, + { + "epoch": 0.96, + "learning_rate": 2.4090523704395908e-08, + "loss": 1.1255, + "step": 31771 + }, + { + "epoch": 0.96, + "learning_rate": 2.4056754929195348e-08, + "loss": 1.1639, + "step": 31772 + }, + { + "epoch": 0.96, + "learning_rate": 2.402300972378174e-08, + "loss": 1.098, + "step": 31773 + }, + { + "epoch": 0.96, + "learning_rate": 2.398928808847678e-08, + "loss": 1.0319, + "step": 31774 + }, + { + "epoch": 0.96, + "learning_rate": 2.3955590023601317e-08, + "loss": 1.0366, + "step": 31775 + }, + { + "epoch": 0.96, + "learning_rate": 2.3921915529476203e-08, + "loss": 1.0184, + "step": 31776 + }, + { + "epoch": 0.96, + "learning_rate": 2.388826460642174e-08, + "loss": 1.0647, + "step": 31777 + }, + { + "epoch": 0.96, + "learning_rate": 2.3854637254758507e-08, + "loss": 1.0486, + "step": 31778 + }, + { + "epoch": 0.96, + "learning_rate": 2.38210334748068e-08, + "loss": 1.089, + "step": 31779 + }, + { + "epoch": 0.96, + "learning_rate": 2.3787453266886084e-08, + "loss": 1.1443, + "step": 31780 + }, + { + "epoch": 0.96, + "learning_rate": 2.375389663131611e-08, + "loss": 1.0604, + "step": 31781 + }, + { + "epoch": 0.96, + "learning_rate": 2.3720363568416616e-08, + "loss": 1.0558, + "step": 31782 + }, + { + "epoch": 0.96, + "learning_rate": 2.3686854078506516e-08, + "loss": 1.0303, + "step": 31783 + }, + { + "epoch": 0.96, + "learning_rate": 2.3653368161905e-08, + "loss": 1.0609, + "step": 31784 + }, + { + "epoch": 0.96, + "learning_rate": 2.3619905818930977e-08, + "loss": 1.0045, + "step": 31785 + }, + { + "epoch": 0.96, + "learning_rate": 2.358646704990253e-08, + "loss": 1.1207, + "step": 31786 + }, + { + "epoch": 0.96, + "learning_rate": 2.3553051855138287e-08, + "loss": 1.1042, + "step": 31787 + }, + { + "epoch": 0.96, + "learning_rate": 2.351966023495633e-08, + "loss": 1.1028, + "step": 31788 + }, + { + "epoch": 0.96, + "learning_rate": 2.3486292189674463e-08, + "loss": 1.119, + "step": 31789 + }, + { + "epoch": 0.96, + "learning_rate": 2.3452947719610487e-08, + "loss": 1.0527, + "step": 31790 + }, + { + "epoch": 0.96, + "learning_rate": 2.3419626825081642e-08, + "loss": 1.1265, + "step": 31791 + }, + { + "epoch": 0.96, + "learning_rate": 2.338632950640518e-08, + "loss": 1.0846, + "step": 31792 + }, + { + "epoch": 0.96, + "learning_rate": 2.3353055763898068e-08, + "loss": 1.1589, + "step": 31793 + }, + { + "epoch": 0.96, + "learning_rate": 2.3319805597877e-08, + "loss": 1.1172, + "step": 31794 + }, + { + "epoch": 0.96, + "learning_rate": 2.3286579008658662e-08, + "loss": 1.0708, + "step": 31795 + }, + { + "epoch": 0.96, + "learning_rate": 2.325337599655919e-08, + "loss": 0.9686, + "step": 31796 + }, + { + "epoch": 0.96, + "learning_rate": 2.3220196561894726e-08, + "loss": 1.137, + "step": 31797 + }, + { + "epoch": 0.96, + "learning_rate": 2.3187040704981122e-08, + "loss": 1.0631, + "step": 31798 + }, + { + "epoch": 0.96, + "learning_rate": 2.3153908426134243e-08, + "loss": 1.04, + "step": 31799 + }, + { + "epoch": 0.96, + "learning_rate": 2.3120799725669108e-08, + "loss": 1.014, + "step": 31800 + }, + { + "epoch": 0.96, + "learning_rate": 2.3087714603901023e-08, + "loss": 1.1254, + "step": 31801 + }, + { + "epoch": 0.96, + "learning_rate": 2.3054653061145014e-08, + "loss": 0.9883, + "step": 31802 + }, + { + "epoch": 0.96, + "learning_rate": 2.3021615097715556e-08, + "loss": 1.1813, + "step": 31803 + }, + { + "epoch": 0.96, + "learning_rate": 2.2988600713927665e-08, + "loss": 1.0179, + "step": 31804 + }, + { + "epoch": 0.96, + "learning_rate": 2.2955609910095267e-08, + "loss": 1.1458, + "step": 31805 + }, + { + "epoch": 0.96, + "learning_rate": 2.2922642686532546e-08, + "loss": 1.024, + "step": 31806 + }, + { + "epoch": 0.96, + "learning_rate": 2.288969904355315e-08, + "loss": 1.1123, + "step": 31807 + }, + { + "epoch": 0.96, + "learning_rate": 2.2856778981470707e-08, + "loss": 1.0854, + "step": 31808 + }, + { + "epoch": 0.96, + "learning_rate": 2.282388250059886e-08, + "loss": 1.0739, + "step": 31809 + }, + { + "epoch": 0.96, + "learning_rate": 2.2791009601250414e-08, + "loss": 1.1544, + "step": 31810 + }, + { + "epoch": 0.96, + "learning_rate": 2.275816028373873e-08, + "loss": 1.1934, + "step": 31811 + }, + { + "epoch": 0.96, + "learning_rate": 2.2725334548376056e-08, + "loss": 1.0723, + "step": 31812 + }, + { + "epoch": 0.96, + "learning_rate": 2.2692532395475196e-08, + "loss": 1.0875, + "step": 31813 + }, + { + "epoch": 0.96, + "learning_rate": 2.2659753825348407e-08, + "loss": 1.106, + "step": 31814 + }, + { + "epoch": 0.96, + "learning_rate": 2.262699883830738e-08, + "loss": 1.0778, + "step": 31815 + }, + { + "epoch": 0.96, + "learning_rate": 2.2594267434664363e-08, + "loss": 1.1612, + "step": 31816 + }, + { + "epoch": 0.96, + "learning_rate": 2.2561559614730775e-08, + "loss": 1.0935, + "step": 31817 + }, + { + "epoch": 0.96, + "learning_rate": 2.2528875378818038e-08, + "loss": 1.2379, + "step": 31818 + }, + { + "epoch": 0.96, + "learning_rate": 2.249621472723701e-08, + "loss": 1.1469, + "step": 31819 + }, + { + "epoch": 0.96, + "learning_rate": 2.2463577660299107e-08, + "loss": 1.114, + "step": 31820 + }, + { + "epoch": 0.96, + "learning_rate": 2.2430964178314364e-08, + "loss": 1.0223, + "step": 31821 + }, + { + "epoch": 0.96, + "learning_rate": 2.2398374281593916e-08, + "loss": 1.0864, + "step": 31822 + }, + { + "epoch": 0.96, + "learning_rate": 2.2365807970447518e-08, + "loss": 0.9598, + "step": 31823 + }, + { + "epoch": 0.96, + "learning_rate": 2.2333265245185476e-08, + "loss": 1.2079, + "step": 31824 + }, + { + "epoch": 0.96, + "learning_rate": 2.2300746106117264e-08, + "loss": 1.0983, + "step": 31825 + }, + { + "epoch": 0.96, + "learning_rate": 2.2268250553552917e-08, + "loss": 1.1781, + "step": 31826 + }, + { + "epoch": 0.96, + "learning_rate": 2.223577858780135e-08, + "loss": 1.1637, + "step": 31827 + }, + { + "epoch": 0.96, + "learning_rate": 2.220333020917176e-08, + "loss": 1.0553, + "step": 31828 + }, + { + "epoch": 0.96, + "learning_rate": 2.2170905417973066e-08, + "loss": 1.0928, + "step": 31829 + }, + { + "epoch": 0.96, + "learning_rate": 2.213850421451419e-08, + "loss": 1.0936, + "step": 31830 + }, + { + "epoch": 0.96, + "learning_rate": 2.2106126599103495e-08, + "loss": 1.2167, + "step": 31831 + }, + { + "epoch": 0.96, + "learning_rate": 2.207377257204879e-08, + "loss": 1.041, + "step": 31832 + }, + { + "epoch": 0.96, + "learning_rate": 2.204144213365844e-08, + "loss": 1.0895, + "step": 31833 + }, + { + "epoch": 0.96, + "learning_rate": 2.2009135284240258e-08, + "loss": 1.0339, + "step": 31834 + }, + { + "epoch": 0.96, + "learning_rate": 2.197685202410149e-08, + "loss": 1.1979, + "step": 31835 + }, + { + "epoch": 0.96, + "learning_rate": 2.1944592353549677e-08, + "loss": 1.1772, + "step": 31836 + }, + { + "epoch": 0.96, + "learning_rate": 2.1912356272892064e-08, + "loss": 1.1994, + "step": 31837 + }, + { + "epoch": 0.96, + "learning_rate": 2.1880143782435082e-08, + "loss": 1.0767, + "step": 31838 + }, + { + "epoch": 0.96, + "learning_rate": 2.18479548824857e-08, + "loss": 1.0537, + "step": 31839 + }, + { + "epoch": 0.96, + "learning_rate": 2.1815789573350342e-08, + "loss": 1.014, + "step": 31840 + }, + { + "epoch": 0.96, + "learning_rate": 2.1783647855334878e-08, + "loss": 1.0934, + "step": 31841 + }, + { + "epoch": 0.96, + "learning_rate": 2.1751529728745723e-08, + "loss": 1.0753, + "step": 31842 + }, + { + "epoch": 0.96, + "learning_rate": 2.1719435193888473e-08, + "loss": 1.0972, + "step": 31843 + }, + { + "epoch": 0.96, + "learning_rate": 2.168736425106871e-08, + "loss": 1.1929, + "step": 31844 + }, + { + "epoch": 0.96, + "learning_rate": 2.165531690059147e-08, + "loss": 1.0897, + "step": 31845 + }, + { + "epoch": 0.96, + "learning_rate": 2.1623293142762068e-08, + "loss": 1.0452, + "step": 31846 + }, + { + "epoch": 0.96, + "learning_rate": 2.159129297788526e-08, + "loss": 1.0808, + "step": 31847 + }, + { + "epoch": 0.96, + "learning_rate": 2.1559316406265797e-08, + "loss": 1.1884, + "step": 31848 + }, + { + "epoch": 0.96, + "learning_rate": 2.1527363428207883e-08, + "loss": 1.1063, + "step": 31849 + }, + { + "epoch": 0.96, + "learning_rate": 2.1495434044015717e-08, + "loss": 1.1074, + "step": 31850 + }, + { + "epoch": 0.96, + "learning_rate": 2.1463528253993504e-08, + "loss": 1.0664, + "step": 31851 + }, + { + "epoch": 0.96, + "learning_rate": 2.143164605844489e-08, + "loss": 1.0296, + "step": 31852 + }, + { + "epoch": 0.96, + "learning_rate": 2.1399787457673237e-08, + "loss": 1.0817, + "step": 31853 + }, + { + "epoch": 0.96, + "learning_rate": 2.1367952451981646e-08, + "loss": 1.1354, + "step": 31854 + }, + { + "epoch": 0.96, + "learning_rate": 2.1336141041673474e-08, + "loss": 1.0511, + "step": 31855 + }, + { + "epoch": 0.96, + "learning_rate": 2.1304353227051542e-08, + "loss": 1.1094, + "step": 31856 + }, + { + "epoch": 0.96, + "learning_rate": 2.127258900841839e-08, + "loss": 1.071, + "step": 31857 + }, + { + "epoch": 0.96, + "learning_rate": 2.1240848386076263e-08, + "loss": 1.0695, + "step": 31858 + }, + { + "epoch": 0.96, + "learning_rate": 2.1209131360327707e-08, + "loss": 1.0689, + "step": 31859 + }, + { + "epoch": 0.96, + "learning_rate": 2.1177437931474143e-08, + "loss": 1.0538, + "step": 31860 + }, + { + "epoch": 0.96, + "learning_rate": 2.1145768099817832e-08, + "loss": 1.0847, + "step": 31861 + }, + { + "epoch": 0.96, + "learning_rate": 2.1114121865659644e-08, + "loss": 1.1577, + "step": 31862 + }, + { + "epoch": 0.96, + "learning_rate": 2.108249922930128e-08, + "loss": 1.0826, + "step": 31863 + }, + { + "epoch": 0.96, + "learning_rate": 2.1050900191043334e-08, + "loss": 1.0432, + "step": 31864 + }, + { + "epoch": 0.96, + "learning_rate": 2.101932475118723e-08, + "loss": 1.0876, + "step": 31865 + }, + { + "epoch": 0.96, + "learning_rate": 2.098777291003329e-08, + "loss": 1.018, + "step": 31866 + }, + { + "epoch": 0.96, + "learning_rate": 2.0956244667881542e-08, + "loss": 1.0882, + "step": 31867 + }, + { + "epoch": 0.96, + "learning_rate": 2.0924740025032587e-08, + "loss": 1.1143, + "step": 31868 + }, + { + "epoch": 0.96, + "learning_rate": 2.0893258981786178e-08, + "loss": 1.1682, + "step": 31869 + }, + { + "epoch": 0.96, + "learning_rate": 2.0861801538441806e-08, + "loss": 1.0965, + "step": 31870 + }, + { + "epoch": 0.96, + "learning_rate": 2.0830367695299224e-08, + "loss": 1.0775, + "step": 31871 + }, + { + "epoch": 0.96, + "learning_rate": 2.0798957452657642e-08, + "loss": 1.1887, + "step": 31872 + }, + { + "epoch": 0.96, + "learning_rate": 2.0767570810815707e-08, + "loss": 1.1491, + "step": 31873 + }, + { + "epoch": 0.96, + "learning_rate": 2.0736207770072627e-08, + "loss": 1.231, + "step": 31874 + }, + { + "epoch": 0.96, + "learning_rate": 2.0704868330726767e-08, + "loss": 1.0624, + "step": 31875 + }, + { + "epoch": 0.96, + "learning_rate": 2.067355249307651e-08, + "loss": 1.0099, + "step": 31876 + }, + { + "epoch": 0.96, + "learning_rate": 2.0642260257419666e-08, + "loss": 1.1058, + "step": 31877 + }, + { + "epoch": 0.96, + "learning_rate": 2.0610991624054888e-08, + "loss": 1.0771, + "step": 31878 + }, + { + "epoch": 0.96, + "learning_rate": 2.057974659327916e-08, + "loss": 1.1519, + "step": 31879 + }, + { + "epoch": 0.96, + "learning_rate": 2.054852516539002e-08, + "loss": 1.0767, + "step": 31880 + }, + { + "epoch": 0.96, + "learning_rate": 2.0517327340684734e-08, + "loss": 1.1049, + "step": 31881 + }, + { + "epoch": 0.96, + "learning_rate": 2.0486153119460284e-08, + "loss": 1.1035, + "step": 31882 + }, + { + "epoch": 0.96, + "learning_rate": 2.0455002502013933e-08, + "loss": 1.0848, + "step": 31883 + }, + { + "epoch": 0.96, + "learning_rate": 2.0423875488641275e-08, + "loss": 1.0679, + "step": 31884 + }, + { + "epoch": 0.96, + "learning_rate": 2.03927720796393e-08, + "loss": 1.0948, + "step": 31885 + }, + { + "epoch": 0.96, + "learning_rate": 2.0361692275303878e-08, + "loss": 1.2048, + "step": 31886 + }, + { + "epoch": 0.96, + "learning_rate": 2.0330636075931165e-08, + "loss": 1.0214, + "step": 31887 + }, + { + "epoch": 0.96, + "learning_rate": 2.02996034818162e-08, + "loss": 1.0322, + "step": 31888 + }, + { + "epoch": 0.96, + "learning_rate": 2.0268594493254857e-08, + "loss": 1.0514, + "step": 31889 + }, + { + "epoch": 0.96, + "learning_rate": 2.0237609110542177e-08, + "loss": 1.1187, + "step": 31890 + }, + { + "epoch": 0.96, + "learning_rate": 2.0206647333973206e-08, + "loss": 1.079, + "step": 31891 + }, + { + "epoch": 0.96, + "learning_rate": 2.0175709163842706e-08, + "loss": 1.132, + "step": 31892 + }, + { + "epoch": 0.96, + "learning_rate": 2.0144794600445162e-08, + "loss": 1.1084, + "step": 31893 + }, + { + "epoch": 0.96, + "learning_rate": 2.0113903644074505e-08, + "loss": 1.0158, + "step": 31894 + }, + { + "epoch": 0.96, + "learning_rate": 2.0083036295025503e-08, + "loss": 1.1478, + "step": 31895 + }, + { + "epoch": 0.96, + "learning_rate": 2.0052192553591533e-08, + "loss": 1.038, + "step": 31896 + }, + { + "epoch": 0.96, + "learning_rate": 2.0021372420066244e-08, + "loss": 1.0844, + "step": 31897 + }, + { + "epoch": 0.96, + "learning_rate": 1.9990575894743015e-08, + "loss": 1.136, + "step": 31898 + }, + { + "epoch": 0.96, + "learning_rate": 1.9959802977915222e-08, + "loss": 1.332, + "step": 31899 + }, + { + "epoch": 0.96, + "learning_rate": 1.9929053669875685e-08, + "loss": 0.9763, + "step": 31900 + }, + { + "epoch": 0.96, + "learning_rate": 1.9898327970916954e-08, + "loss": 1.1094, + "step": 31901 + }, + { + "epoch": 0.96, + "learning_rate": 1.9867625881331842e-08, + "loss": 1.058, + "step": 31902 + }, + { + "epoch": 0.96, + "learning_rate": 1.9836947401412342e-08, + "loss": 1.0496, + "step": 31903 + }, + { + "epoch": 0.96, + "learning_rate": 1.980629253145072e-08, + "loss": 0.9893, + "step": 31904 + }, + { + "epoch": 0.96, + "learning_rate": 1.977566127173869e-08, + "loss": 1.0909, + "step": 31905 + }, + { + "epoch": 0.96, + "learning_rate": 1.9745053622567955e-08, + "loss": 1.0336, + "step": 31906 + }, + { + "epoch": 0.96, + "learning_rate": 1.9714469584229402e-08, + "loss": 1.08, + "step": 31907 + }, + { + "epoch": 0.96, + "learning_rate": 1.9683909157015014e-08, + "loss": 1.1104, + "step": 31908 + }, + { + "epoch": 0.96, + "learning_rate": 1.9653372341215116e-08, + "loss": 1.0386, + "step": 31909 + }, + { + "epoch": 0.96, + "learning_rate": 1.962285913712031e-08, + "loss": 1.0847, + "step": 31910 + }, + { + "epoch": 0.96, + "learning_rate": 1.9592369545021473e-08, + "loss": 1.0859, + "step": 31911 + }, + { + "epoch": 0.96, + "learning_rate": 1.956190356520865e-08, + "loss": 1.1769, + "step": 31912 + }, + { + "epoch": 0.96, + "learning_rate": 1.953146119797189e-08, + "loss": 1.0599, + "step": 31913 + }, + { + "epoch": 0.96, + "learning_rate": 1.950104244360096e-08, + "loss": 1.054, + "step": 31914 + }, + { + "epoch": 0.96, + "learning_rate": 1.947064730238535e-08, + "loss": 1.044, + "step": 31915 + }, + { + "epoch": 0.96, + "learning_rate": 1.9440275774614548e-08, + "loss": 1.1354, + "step": 31916 + }, + { + "epoch": 0.96, + "learning_rate": 1.940992786057805e-08, + "loss": 1.108, + "step": 31917 + }, + { + "epoch": 0.96, + "learning_rate": 1.9379603560563954e-08, + "loss": 1.2739, + "step": 31918 + }, + { + "epoch": 0.96, + "learning_rate": 1.93493028748612e-08, + "loss": 1.0206, + "step": 31919 + }, + { + "epoch": 0.96, + "learning_rate": 1.9319025803758716e-08, + "loss": 1.2145, + "step": 31920 + }, + { + "epoch": 0.96, + "learning_rate": 1.928877234754406e-08, + "loss": 1.0945, + "step": 31921 + }, + { + "epoch": 0.96, + "learning_rate": 1.9258542506505605e-08, + "loss": 1.1652, + "step": 31922 + }, + { + "epoch": 0.96, + "learning_rate": 1.9228336280931182e-08, + "loss": 1.1274, + "step": 31923 + }, + { + "epoch": 0.96, + "learning_rate": 1.9198153671108056e-08, + "loss": 1.255, + "step": 31924 + }, + { + "epoch": 0.96, + "learning_rate": 1.9167994677323777e-08, + "loss": 1.1488, + "step": 31925 + }, + { + "epoch": 0.96, + "learning_rate": 1.9137859299865612e-08, + "loss": 1.0657, + "step": 31926 + }, + { + "epoch": 0.96, + "learning_rate": 1.9107747539020004e-08, + "loss": 1.0454, + "step": 31927 + }, + { + "epoch": 0.96, + "learning_rate": 1.9077659395073667e-08, + "loss": 1.0453, + "step": 31928 + }, + { + "epoch": 0.96, + "learning_rate": 1.9047594868313313e-08, + "loss": 1.2059, + "step": 31929 + }, + { + "epoch": 0.96, + "learning_rate": 1.9017553959025104e-08, + "loss": 1.0659, + "step": 31930 + }, + { + "epoch": 0.96, + "learning_rate": 1.8987536667494645e-08, + "loss": 1.0958, + "step": 31931 + }, + { + "epoch": 0.96, + "learning_rate": 1.8957542994008092e-08, + "loss": 1.0786, + "step": 31932 + }, + { + "epoch": 0.96, + "learning_rate": 1.892757293885078e-08, + "loss": 1.077, + "step": 31933 + }, + { + "epoch": 0.96, + "learning_rate": 1.8897626502308032e-08, + "loss": 1.0532, + "step": 31934 + }, + { + "epoch": 0.96, + "learning_rate": 1.8867703684665174e-08, + "loss": 1.1161, + "step": 31935 + }, + { + "epoch": 0.96, + "learning_rate": 1.8837804486206702e-08, + "loss": 1.0974, + "step": 31936 + }, + { + "epoch": 0.96, + "learning_rate": 1.880792890721711e-08, + "loss": 1.243, + "step": 31937 + }, + { + "epoch": 0.96, + "learning_rate": 1.877807694798117e-08, + "loss": 1.1342, + "step": 31938 + }, + { + "epoch": 0.96, + "learning_rate": 1.8748248608783103e-08, + "loss": 1.2192, + "step": 31939 + }, + { + "epoch": 0.96, + "learning_rate": 1.8718443889906567e-08, + "loss": 1.0419, + "step": 31940 + }, + { + "epoch": 0.96, + "learning_rate": 1.8688662791635504e-08, + "loss": 0.9777, + "step": 31941 + }, + { + "epoch": 0.96, + "learning_rate": 1.8658905314253294e-08, + "loss": 1.1228, + "step": 31942 + }, + { + "epoch": 0.96, + "learning_rate": 1.8629171458043326e-08, + "loss": 1.1687, + "step": 31943 + }, + { + "epoch": 0.96, + "learning_rate": 1.8599461223288428e-08, + "loss": 1.144, + "step": 31944 + }, + { + "epoch": 0.96, + "learning_rate": 1.856977461027143e-08, + "loss": 1.0472, + "step": 31945 + }, + { + "epoch": 0.96, + "learning_rate": 1.8540111619275438e-08, + "loss": 1.1274, + "step": 31946 + }, + { + "epoch": 0.96, + "learning_rate": 1.8510472250582167e-08, + "loss": 1.1154, + "step": 31947 + }, + { + "epoch": 0.96, + "learning_rate": 1.8480856504474178e-08, + "loss": 1.1072, + "step": 31948 + }, + { + "epoch": 0.96, + "learning_rate": 1.845126438123318e-08, + "loss": 1.1812, + "step": 31949 + }, + { + "epoch": 0.96, + "learning_rate": 1.8421695881141455e-08, + "loss": 1.1703, + "step": 31950 + }, + { + "epoch": 0.96, + "learning_rate": 1.839215100447961e-08, + "loss": 1.0826, + "step": 31951 + }, + { + "epoch": 0.96, + "learning_rate": 1.8362629751529358e-08, + "loss": 0.9662, + "step": 31952 + }, + { + "epoch": 0.96, + "learning_rate": 1.8333132122571595e-08, + "loss": 0.9956, + "step": 31953 + }, + { + "epoch": 0.96, + "learning_rate": 1.8303658117887478e-08, + "loss": 1.1172, + "step": 31954 + }, + { + "epoch": 0.96, + "learning_rate": 1.8274207737757066e-08, + "loss": 1.1382, + "step": 31955 + }, + { + "epoch": 0.96, + "learning_rate": 1.8244780982460964e-08, + "loss": 1.2294, + "step": 31956 + }, + { + "epoch": 0.96, + "learning_rate": 1.8215377852279505e-08, + "loss": 0.9738, + "step": 31957 + }, + { + "epoch": 0.96, + "learning_rate": 1.8185998347492184e-08, + "loss": 1.0576, + "step": 31958 + }, + { + "epoch": 0.96, + "learning_rate": 1.8156642468378783e-08, + "loss": 1.0543, + "step": 31959 + }, + { + "epoch": 0.96, + "learning_rate": 1.8127310215219075e-08, + "loss": 1.0685, + "step": 31960 + }, + { + "epoch": 0.96, + "learning_rate": 1.8098001588292e-08, + "loss": 1.0787, + "step": 31961 + }, + { + "epoch": 0.96, + "learning_rate": 1.8068716587876788e-08, + "loss": 1.0883, + "step": 31962 + }, + { + "epoch": 0.96, + "learning_rate": 1.8039455214251822e-08, + "loss": 1.0016, + "step": 31963 + }, + { + "epoch": 0.96, + "learning_rate": 1.8010217467695767e-08, + "loss": 1.1055, + "step": 31964 + }, + { + "epoch": 0.96, + "learning_rate": 1.798100334848757e-08, + "loss": 1.0422, + "step": 31965 + }, + { + "epoch": 0.96, + "learning_rate": 1.7951812856904505e-08, + "loss": 1.1104, + "step": 31966 + }, + { + "epoch": 0.96, + "learning_rate": 1.7922645993224687e-08, + "loss": 1.0872, + "step": 31967 + }, + { + "epoch": 0.96, + "learning_rate": 1.7893502757725944e-08, + "loss": 1.1361, + "step": 31968 + }, + { + "epoch": 0.96, + "learning_rate": 1.7864383150685838e-08, + "loss": 1.1047, + "step": 31969 + }, + { + "epoch": 0.96, + "learning_rate": 1.7835287172381087e-08, + "loss": 1.1389, + "step": 31970 + }, + { + "epoch": 0.96, + "learning_rate": 1.7806214823088973e-08, + "loss": 1.172, + "step": 31971 + }, + { + "epoch": 0.96, + "learning_rate": 1.7777166103086495e-08, + "loss": 1.1572, + "step": 31972 + }, + { + "epoch": 0.96, + "learning_rate": 1.7748141012649544e-08, + "loss": 1.1295, + "step": 31973 + }, + { + "epoch": 0.96, + "learning_rate": 1.771913955205512e-08, + "loss": 1.2395, + "step": 31974 + }, + { + "epoch": 0.96, + "learning_rate": 1.7690161721578835e-08, + "loss": 1.119, + "step": 31975 + }, + { + "epoch": 0.96, + "learning_rate": 1.766120752149686e-08, + "loss": 1.1139, + "step": 31976 + }, + { + "epoch": 0.96, + "learning_rate": 1.7632276952084247e-08, + "loss": 1.042, + "step": 31977 + }, + { + "epoch": 0.96, + "learning_rate": 1.760337001361717e-08, + "loss": 1.0476, + "step": 31978 + }, + { + "epoch": 0.96, + "learning_rate": 1.757448670637041e-08, + "loss": 1.0922, + "step": 31979 + }, + { + "epoch": 0.96, + "learning_rate": 1.754562703061874e-08, + "loss": 1.1752, + "step": 31980 + }, + { + "epoch": 0.96, + "learning_rate": 1.751679098663722e-08, + "loss": 1.2185, + "step": 31981 + }, + { + "epoch": 0.96, + "learning_rate": 1.748797857470036e-08, + "loss": 1.0767, + "step": 31982 + }, + { + "epoch": 0.96, + "learning_rate": 1.7459189795082377e-08, + "loss": 1.0856, + "step": 31983 + }, + { + "epoch": 0.96, + "learning_rate": 1.743042464805694e-08, + "loss": 1.0602, + "step": 31984 + }, + { + "epoch": 0.96, + "learning_rate": 1.7401683133898562e-08, + "loss": 1.0485, + "step": 31985 + }, + { + "epoch": 0.96, + "learning_rate": 1.7372965252880348e-08, + "loss": 1.0984, + "step": 31986 + }, + { + "epoch": 0.96, + "learning_rate": 1.734427100527597e-08, + "loss": 1.0944, + "step": 31987 + }, + { + "epoch": 0.96, + "learning_rate": 1.7315600391358268e-08, + "loss": 1.1652, + "step": 31988 + }, + { + "epoch": 0.96, + "learning_rate": 1.7286953411400355e-08, + "loss": 1.0342, + "step": 31989 + }, + { + "epoch": 0.96, + "learning_rate": 1.725833006567479e-08, + "loss": 1.0493, + "step": 31990 + }, + { + "epoch": 0.96, + "learning_rate": 1.7229730354454687e-08, + "loss": 0.9794, + "step": 31991 + }, + { + "epoch": 0.96, + "learning_rate": 1.7201154278011502e-08, + "loss": 1.0703, + "step": 31992 + }, + { + "epoch": 0.96, + "learning_rate": 1.717260183661751e-08, + "loss": 1.0901, + "step": 31993 + }, + { + "epoch": 0.96, + "learning_rate": 1.714407303054444e-08, + "loss": 1.1056, + "step": 31994 + }, + { + "epoch": 0.96, + "learning_rate": 1.7115567860064298e-08, + "loss": 1.1573, + "step": 31995 + }, + { + "epoch": 0.96, + "learning_rate": 1.7087086325447975e-08, + "loss": 1.0023, + "step": 31996 + }, + { + "epoch": 0.96, + "learning_rate": 1.7058628426966926e-08, + "loss": 1.0665, + "step": 31997 + }, + { + "epoch": 0.96, + "learning_rate": 1.7030194164891768e-08, + "loss": 1.0176, + "step": 31998 + }, + { + "epoch": 0.96, + "learning_rate": 1.700178353949339e-08, + "loss": 1.1334, + "step": 31999 + }, + { + "epoch": 0.96, + "learning_rate": 1.697339655104241e-08, + "loss": 1.0538, + "step": 32000 + }, + { + "epoch": 0.96, + "learning_rate": 1.6945033199808615e-08, + "loss": 1.1263, + "step": 32001 + }, + { + "epoch": 0.96, + "learning_rate": 1.6916693486062065e-08, + "loss": 1.0593, + "step": 32002 + }, + { + "epoch": 0.96, + "learning_rate": 1.688837741007282e-08, + "loss": 1.1087, + "step": 32003 + }, + { + "epoch": 0.96, + "learning_rate": 1.6860084972110392e-08, + "loss": 0.963, + "step": 32004 + }, + { + "epoch": 0.96, + "learning_rate": 1.6831816172444006e-08, + "loss": 1.1, + "step": 32005 + }, + { + "epoch": 0.96, + "learning_rate": 1.6803571011342613e-08, + "loss": 1.0673, + "step": 32006 + }, + { + "epoch": 0.96, + "learning_rate": 1.6775349489075442e-08, + "loss": 1.1176, + "step": 32007 + }, + { + "epoch": 0.96, + "learning_rate": 1.674715160591117e-08, + "loss": 1.1547, + "step": 32008 + }, + { + "epoch": 0.96, + "learning_rate": 1.6718977362117916e-08, + "loss": 1.1432, + "step": 32009 + }, + { + "epoch": 0.96, + "learning_rate": 1.6690826757963798e-08, + "loss": 1.1175, + "step": 32010 + }, + { + "epoch": 0.96, + "learning_rate": 1.6662699793717208e-08, + "loss": 1.1069, + "step": 32011 + }, + { + "epoch": 0.96, + "learning_rate": 1.6634596469645713e-08, + "loss": 1.1921, + "step": 32012 + }, + { + "epoch": 0.96, + "learning_rate": 1.6606516786016604e-08, + "loss": 1.1487, + "step": 32013 + }, + { + "epoch": 0.96, + "learning_rate": 1.6578460743097712e-08, + "loss": 1.0002, + "step": 32014 + }, + { + "epoch": 0.96, + "learning_rate": 1.65504283411555e-08, + "loss": 1.0417, + "step": 32015 + }, + { + "epoch": 0.96, + "learning_rate": 1.6522419580457248e-08, + "loss": 1.1084, + "step": 32016 + }, + { + "epoch": 0.96, + "learning_rate": 1.6494434461269693e-08, + "loss": 1.1546, + "step": 32017 + }, + { + "epoch": 0.96, + "learning_rate": 1.6466472983858727e-08, + "loss": 1.2616, + "step": 32018 + }, + { + "epoch": 0.96, + "learning_rate": 1.6438535148491086e-08, + "loss": 1.1478, + "step": 32019 + }, + { + "epoch": 0.96, + "learning_rate": 1.6410620955432388e-08, + "loss": 1.0852, + "step": 32020 + }, + { + "epoch": 0.96, + "learning_rate": 1.6382730404948534e-08, + "loss": 1.082, + "step": 32021 + }, + { + "epoch": 0.96, + "learning_rate": 1.6354863497304583e-08, + "loss": 1.0094, + "step": 32022 + }, + { + "epoch": 0.96, + "learning_rate": 1.6327020232766445e-08, + "loss": 1.071, + "step": 32023 + }, + { + "epoch": 0.96, + "learning_rate": 1.62992006115989e-08, + "loss": 1.186, + "step": 32024 + }, + { + "epoch": 0.96, + "learning_rate": 1.6271404634066733e-08, + "loss": 1.0869, + "step": 32025 + }, + { + "epoch": 0.96, + "learning_rate": 1.6243632300434465e-08, + "loss": 1.1717, + "step": 32026 + }, + { + "epoch": 0.96, + "learning_rate": 1.6215883610966877e-08, + "loss": 1.0798, + "step": 32027 + }, + { + "epoch": 0.96, + "learning_rate": 1.6188158565927646e-08, + "loss": 1.0447, + "step": 32028 + }, + { + "epoch": 0.96, + "learning_rate": 1.6160457165580734e-08, + "loss": 1.1249, + "step": 32029 + }, + { + "epoch": 0.96, + "learning_rate": 1.6132779410190368e-08, + "loss": 1.1124, + "step": 32030 + }, + { + "epoch": 0.96, + "learning_rate": 1.61051253000194e-08, + "loss": 1.1762, + "step": 32031 + }, + { + "epoch": 0.96, + "learning_rate": 1.60774948353315e-08, + "loss": 1.0841, + "step": 32032 + }, + { + "epoch": 0.96, + "learning_rate": 1.6049888016389514e-08, + "loss": 1.1623, + "step": 32033 + }, + { + "epoch": 0.97, + "learning_rate": 1.6022304843456295e-08, + "loss": 1.1883, + "step": 32034 + }, + { + "epoch": 0.97, + "learning_rate": 1.5994745316794402e-08, + "loss": 1.1302, + "step": 32035 + }, + { + "epoch": 0.97, + "learning_rate": 1.596720943666613e-08, + "loss": 1.087, + "step": 32036 + }, + { + "epoch": 0.97, + "learning_rate": 1.593969720333377e-08, + "loss": 1.1425, + "step": 32037 + }, + { + "epoch": 0.97, + "learning_rate": 1.5912208617059056e-08, + "loss": 1.0977, + "step": 32038 + }, + { + "epoch": 0.97, + "learning_rate": 1.588474367810372e-08, + "loss": 1.0911, + "step": 32039 + }, + { + "epoch": 0.97, + "learning_rate": 1.5857302386729222e-08, + "loss": 1.0915, + "step": 32040 + }, + { + "epoch": 0.97, + "learning_rate": 1.582988474319702e-08, + "loss": 1.0597, + "step": 32041 + }, + { + "epoch": 0.97, + "learning_rate": 1.580249074776774e-08, + "loss": 1.1179, + "step": 32042 + }, + { + "epoch": 0.97, + "learning_rate": 1.5775120400702282e-08, + "loss": 1.1022, + "step": 32043 + }, + { + "epoch": 0.97, + "learning_rate": 1.5747773702261272e-08, + "loss": 1.0228, + "step": 32044 + }, + { + "epoch": 0.97, + "learning_rate": 1.5720450652705056e-08, + "loss": 1.1074, + "step": 32045 + }, + { + "epoch": 0.97, + "learning_rate": 1.5693151252293702e-08, + "loss": 1.0544, + "step": 32046 + }, + { + "epoch": 0.97, + "learning_rate": 1.5665875501287008e-08, + "loss": 1.0933, + "step": 32047 + }, + { + "epoch": 0.97, + "learning_rate": 1.5638623399944487e-08, + "loss": 1.0942, + "step": 32048 + }, + { + "epoch": 0.97, + "learning_rate": 1.5611394948525927e-08, + "loss": 1.1691, + "step": 32049 + }, + { + "epoch": 0.97, + "learning_rate": 1.558419014729057e-08, + "loss": 1.0988, + "step": 32050 + }, + { + "epoch": 0.97, + "learning_rate": 1.5557008996496815e-08, + "loss": 1.2502, + "step": 32051 + }, + { + "epoch": 0.97, + "learning_rate": 1.552985149640418e-08, + "loss": 1.1017, + "step": 32052 + }, + { + "epoch": 0.97, + "learning_rate": 1.5502717647270516e-08, + "loss": 1.05, + "step": 32053 + }, + { + "epoch": 0.97, + "learning_rate": 1.5475607449354502e-08, + "loss": 1.1097, + "step": 32054 + }, + { + "epoch": 0.97, + "learning_rate": 1.5448520902913988e-08, + "loss": 1.0856, + "step": 32055 + }, + { + "epoch": 0.97, + "learning_rate": 1.54214580082071e-08, + "loss": 1.1403, + "step": 32056 + }, + { + "epoch": 0.97, + "learning_rate": 1.5394418765491136e-08, + "loss": 1.1152, + "step": 32057 + }, + { + "epoch": 0.97, + "learning_rate": 1.5367403175023944e-08, + "loss": 1.0318, + "step": 32058 + }, + { + "epoch": 0.97, + "learning_rate": 1.5340411237062257e-08, + "loss": 1.0532, + "step": 32059 + }, + { + "epoch": 0.97, + "learning_rate": 1.53134429518631e-08, + "loss": 1.0895, + "step": 32060 + }, + { + "epoch": 0.97, + "learning_rate": 1.5286498319683484e-08, + "loss": 1.0398, + "step": 32061 + }, + { + "epoch": 0.97, + "learning_rate": 1.5259577340779595e-08, + "loss": 1.085, + "step": 32062 + }, + { + "epoch": 0.97, + "learning_rate": 1.5232680015407895e-08, + "loss": 1.1439, + "step": 32063 + }, + { + "epoch": 0.97, + "learning_rate": 1.5205806343824568e-08, + "loss": 1.1082, + "step": 32064 + }, + { + "epoch": 0.97, + "learning_rate": 1.5178956326284965e-08, + "loss": 1.094, + "step": 32065 + }, + { + "epoch": 0.97, + "learning_rate": 1.515212996304527e-08, + "loss": 1.1232, + "step": 32066 + }, + { + "epoch": 0.97, + "learning_rate": 1.5125327254360278e-08, + "loss": 1.0065, + "step": 32067 + }, + { + "epoch": 0.97, + "learning_rate": 1.509854820048534e-08, + "loss": 1.1743, + "step": 32068 + }, + { + "epoch": 0.97, + "learning_rate": 1.507179280167581e-08, + "loss": 1.1157, + "step": 32069 + }, + { + "epoch": 0.97, + "learning_rate": 1.504506105818593e-08, + "loss": 1.1152, + "step": 32070 + }, + { + "epoch": 0.97, + "learning_rate": 1.501835297027021e-08, + "loss": 1.0011, + "step": 32071 + }, + { + "epoch": 0.97, + "learning_rate": 1.4991668538182903e-08, + "loss": 1.0643, + "step": 32072 + }, + { + "epoch": 0.97, + "learning_rate": 1.496500776217824e-08, + "loss": 1.0869, + "step": 32073 + }, + { + "epoch": 0.97, + "learning_rate": 1.4938370642509636e-08, + "loss": 1.1469, + "step": 32074 + }, + { + "epoch": 0.97, + "learning_rate": 1.4911757179431052e-08, + "loss": 1.0876, + "step": 32075 + }, + { + "epoch": 0.97, + "learning_rate": 1.4885167373195619e-08, + "loss": 1.0998, + "step": 32076 + }, + { + "epoch": 0.97, + "learning_rate": 1.4858601224056468e-08, + "loss": 1.0242, + "step": 32077 + }, + { + "epoch": 0.97, + "learning_rate": 1.483205873226673e-08, + "loss": 1.0602, + "step": 32078 + }, + { + "epoch": 0.97, + "learning_rate": 1.4805539898078702e-08, + "loss": 1.0782, + "step": 32079 + }, + { + "epoch": 0.97, + "learning_rate": 1.4779044721745239e-08, + "loss": 1.1487, + "step": 32080 + }, + { + "epoch": 0.97, + "learning_rate": 1.4752573203518083e-08, + "loss": 1.0597, + "step": 32081 + }, + { + "epoch": 0.97, + "learning_rate": 1.472612534364981e-08, + "loss": 1.0057, + "step": 32082 + }, + { + "epoch": 0.97, + "learning_rate": 1.4699701142391608e-08, + "loss": 1.0619, + "step": 32083 + }, + { + "epoch": 0.97, + "learning_rate": 1.4673300599995222e-08, + "loss": 1.1573, + "step": 32084 + }, + { + "epoch": 0.97, + "learning_rate": 1.4646923716712391e-08, + "loss": 1.0385, + "step": 32085 + }, + { + "epoch": 0.97, + "learning_rate": 1.4620570492793473e-08, + "loss": 1.1613, + "step": 32086 + }, + { + "epoch": 0.97, + "learning_rate": 1.4594240928489934e-08, + "loss": 1.1075, + "step": 32087 + }, + { + "epoch": 0.97, + "learning_rate": 1.4567935024052127e-08, + "loss": 1.0654, + "step": 32088 + }, + { + "epoch": 0.97, + "learning_rate": 1.4541652779730686e-08, + "loss": 1.0614, + "step": 32089 + }, + { + "epoch": 0.97, + "learning_rate": 1.4515394195775689e-08, + "loss": 1.0916, + "step": 32090 + }, + { + "epoch": 0.97, + "learning_rate": 1.4489159272436937e-08, + "loss": 1.0786, + "step": 32091 + }, + { + "epoch": 0.97, + "learning_rate": 1.4462948009964228e-08, + "loss": 1.1717, + "step": 32092 + }, + { + "epoch": 0.97, + "learning_rate": 1.4436760408607364e-08, + "loss": 1.1342, + "step": 32093 + }, + { + "epoch": 0.97, + "learning_rate": 1.441059646861559e-08, + "loss": 1.0706, + "step": 32094 + }, + { + "epoch": 0.97, + "learning_rate": 1.4384456190237594e-08, + "loss": 1.0945, + "step": 32095 + }, + { + "epoch": 0.97, + "learning_rate": 1.4358339573722624e-08, + "loss": 1.097, + "step": 32096 + }, + { + "epoch": 0.97, + "learning_rate": 1.433224661931909e-08, + "loss": 1.0603, + "step": 32097 + }, + { + "epoch": 0.97, + "learning_rate": 1.4306177327275129e-08, + "loss": 1.2162, + "step": 32098 + }, + { + "epoch": 0.97, + "learning_rate": 1.4280131697839705e-08, + "loss": 1.1497, + "step": 32099 + }, + { + "epoch": 0.97, + "learning_rate": 1.4254109731260123e-08, + "loss": 1.1578, + "step": 32100 + }, + { + "epoch": 0.97, + "learning_rate": 1.4228111427783964e-08, + "loss": 1.1984, + "step": 32101 + }, + { + "epoch": 0.97, + "learning_rate": 1.4202136787659082e-08, + "loss": 1.1683, + "step": 32102 + }, + { + "epoch": 0.97, + "learning_rate": 1.4176185811133059e-08, + "loss": 1.0125, + "step": 32103 + }, + { + "epoch": 0.97, + "learning_rate": 1.4150258498452086e-08, + "loss": 1.0954, + "step": 32104 + }, + { + "epoch": 0.97, + "learning_rate": 1.4124354849863465e-08, + "loss": 1.1069, + "step": 32105 + }, + { + "epoch": 0.97, + "learning_rate": 1.4098474865613942e-08, + "loss": 1.1575, + "step": 32106 + }, + { + "epoch": 0.97, + "learning_rate": 1.4072618545949435e-08, + "loss": 0.9961, + "step": 32107 + }, + { + "epoch": 0.97, + "learning_rate": 1.4046785891116687e-08, + "loss": 1.1757, + "step": 32108 + }, + { + "epoch": 0.97, + "learning_rate": 1.402097690136106e-08, + "loss": 1.0636, + "step": 32109 + }, + { + "epoch": 0.97, + "learning_rate": 1.3995191576928469e-08, + "loss": 1.1542, + "step": 32110 + }, + { + "epoch": 0.97, + "learning_rate": 1.396942991806427e-08, + "loss": 1.1235, + "step": 32111 + }, + { + "epoch": 0.97, + "learning_rate": 1.3943691925013824e-08, + "loss": 1.1348, + "step": 32112 + }, + { + "epoch": 0.97, + "learning_rate": 1.3917977598022215e-08, + "loss": 1.0857, + "step": 32113 + }, + { + "epoch": 0.97, + "learning_rate": 1.3892286937333965e-08, + "loss": 1.0928, + "step": 32114 + }, + { + "epoch": 0.97, + "learning_rate": 1.3866619943193882e-08, + "loss": 1.0354, + "step": 32115 + }, + { + "epoch": 0.97, + "learning_rate": 1.3840976615846213e-08, + "loss": 0.9737, + "step": 32116 + }, + { + "epoch": 0.97, + "learning_rate": 1.381535695553493e-08, + "loss": 1.0978, + "step": 32117 + }, + { + "epoch": 0.97, + "learning_rate": 1.3789760962504285e-08, + "loss": 1.149, + "step": 32118 + }, + { + "epoch": 0.97, + "learning_rate": 1.3764188636997688e-08, + "loss": 1.0585, + "step": 32119 + }, + { + "epoch": 0.97, + "learning_rate": 1.3738639979258561e-08, + "loss": 1.0618, + "step": 32120 + }, + { + "epoch": 0.97, + "learning_rate": 1.3713114989530041e-08, + "loss": 1.1432, + "step": 32121 + }, + { + "epoch": 0.97, + "learning_rate": 1.3687613668055267e-08, + "loss": 1.1068, + "step": 32122 + }, + { + "epoch": 0.97, + "learning_rate": 1.36621360150771e-08, + "loss": 1.1393, + "step": 32123 + }, + { + "epoch": 0.97, + "learning_rate": 1.3636682030837845e-08, + "loss": 1.1648, + "step": 32124 + }, + { + "epoch": 0.97, + "learning_rate": 1.3611251715580087e-08, + "loss": 1.1105, + "step": 32125 + }, + { + "epoch": 0.97, + "learning_rate": 1.35858450695453e-08, + "loss": 1.0532, + "step": 32126 + }, + { + "epoch": 0.97, + "learning_rate": 1.3560462092976067e-08, + "loss": 1.0686, + "step": 32127 + }, + { + "epoch": 0.97, + "learning_rate": 1.3535102786113584e-08, + "loss": 1.0583, + "step": 32128 + }, + { + "epoch": 0.97, + "learning_rate": 1.3509767149199604e-08, + "loss": 1.0688, + "step": 32129 + }, + { + "epoch": 0.97, + "learning_rate": 1.3484455182475042e-08, + "loss": 1.0768, + "step": 32130 + }, + { + "epoch": 0.97, + "learning_rate": 1.3459166886180818e-08, + "loss": 1.1377, + "step": 32131 + }, + { + "epoch": 0.97, + "learning_rate": 1.3433902260557851e-08, + "loss": 1.0825, + "step": 32132 + }, + { + "epoch": 0.97, + "learning_rate": 1.3408661305846505e-08, + "loss": 1.0361, + "step": 32133 + }, + { + "epoch": 0.97, + "learning_rate": 1.338344402228714e-08, + "loss": 1.1267, + "step": 32134 + }, + { + "epoch": 0.97, + "learning_rate": 1.3358250410119843e-08, + "loss": 1.0638, + "step": 32135 + }, + { + "epoch": 0.97, + "learning_rate": 1.3333080469584425e-08, + "loss": 1.1736, + "step": 32136 + }, + { + "epoch": 0.97, + "learning_rate": 1.3307934200920413e-08, + "loss": 1.1288, + "step": 32137 + }, + { + "epoch": 0.97, + "learning_rate": 1.3282811604367064e-08, + "loss": 0.9785, + "step": 32138 + }, + { + "epoch": 0.97, + "learning_rate": 1.3257712680163903e-08, + "loss": 1.0768, + "step": 32139 + }, + { + "epoch": 0.97, + "learning_rate": 1.3232637428549633e-08, + "loss": 1.0818, + "step": 32140 + }, + { + "epoch": 0.97, + "learning_rate": 1.320758584976295e-08, + "loss": 1.0739, + "step": 32141 + }, + { + "epoch": 0.97, + "learning_rate": 1.3182557944042273e-08, + "loss": 1.1628, + "step": 32142 + }, + { + "epoch": 0.97, + "learning_rate": 1.3157553711626026e-08, + "loss": 1.0385, + "step": 32143 + }, + { + "epoch": 0.97, + "learning_rate": 1.3132573152752349e-08, + "loss": 1.1075, + "step": 32144 + }, + { + "epoch": 0.97, + "learning_rate": 1.3107616267658552e-08, + "loss": 1.1147, + "step": 32145 + }, + { + "epoch": 0.97, + "learning_rate": 1.3082683056582779e-08, + "loss": 1.041, + "step": 32146 + }, + { + "epoch": 0.97, + "learning_rate": 1.3057773519762062e-08, + "loss": 1.073, + "step": 32147 + }, + { + "epoch": 0.97, + "learning_rate": 1.3032887657433435e-08, + "loss": 1.1456, + "step": 32148 + }, + { + "epoch": 0.97, + "learning_rate": 1.3008025469834207e-08, + "loss": 1.1215, + "step": 32149 + }, + { + "epoch": 0.97, + "learning_rate": 1.2983186957200578e-08, + "loss": 1.1528, + "step": 32150 + }, + { + "epoch": 0.97, + "learning_rate": 1.2958372119769303e-08, + "loss": 1.0829, + "step": 32151 + }, + { + "epoch": 0.97, + "learning_rate": 1.2933580957776581e-08, + "loss": 1.1271, + "step": 32152 + }, + { + "epoch": 0.97, + "learning_rate": 1.2908813471458337e-08, + "loss": 1.1101, + "step": 32153 + }, + { + "epoch": 0.97, + "learning_rate": 1.2884069661050213e-08, + "loss": 1.1458, + "step": 32154 + }, + { + "epoch": 0.97, + "learning_rate": 1.2859349526788133e-08, + "loss": 1.1805, + "step": 32155 + }, + { + "epoch": 0.97, + "learning_rate": 1.283465306890691e-08, + "loss": 1.1041, + "step": 32156 + }, + { + "epoch": 0.97, + "learning_rate": 1.2809980287642187e-08, + "loss": 1.0511, + "step": 32157 + }, + { + "epoch": 0.97, + "learning_rate": 1.27853311832285e-08, + "loss": 0.9832, + "step": 32158 + }, + { + "epoch": 0.97, + "learning_rate": 1.276070575590066e-08, + "loss": 1.0811, + "step": 32159 + }, + { + "epoch": 0.97, + "learning_rate": 1.2736104005892925e-08, + "loss": 1.117, + "step": 32160 + }, + { + "epoch": 0.97, + "learning_rate": 1.271152593343955e-08, + "loss": 1.05, + "step": 32161 + }, + { + "epoch": 0.97, + "learning_rate": 1.2686971538774517e-08, + "loss": 1.0887, + "step": 32162 + }, + { + "epoch": 0.97, + "learning_rate": 1.2662440822131528e-08, + "loss": 1.0681, + "step": 32163 + }, + { + "epoch": 0.97, + "learning_rate": 1.2637933783744282e-08, + "loss": 1.1265, + "step": 32164 + }, + { + "epoch": 0.97, + "learning_rate": 1.261345042384593e-08, + "loss": 1.1147, + "step": 32165 + }, + { + "epoch": 0.97, + "learning_rate": 1.2588990742669615e-08, + "loss": 1.1238, + "step": 32166 + }, + { + "epoch": 0.97, + "learning_rate": 1.2564554740447932e-08, + "loss": 1.0611, + "step": 32167 + }, + { + "epoch": 0.97, + "learning_rate": 1.2540142417413748e-08, + "loss": 1.1816, + "step": 32168 + }, + { + "epoch": 0.97, + "learning_rate": 1.2515753773799655e-08, + "loss": 1.0182, + "step": 32169 + }, + { + "epoch": 0.97, + "learning_rate": 1.2491388809837413e-08, + "loss": 1.287, + "step": 32170 + }, + { + "epoch": 0.97, + "learning_rate": 1.2467047525759058e-08, + "loss": 1.1039, + "step": 32171 + }, + { + "epoch": 0.97, + "learning_rate": 1.2442729921796349e-08, + "loss": 1.1282, + "step": 32172 + }, + { + "epoch": 0.97, + "learning_rate": 1.2418435998181044e-08, + "loss": 1.0436, + "step": 32173 + }, + { + "epoch": 0.97, + "learning_rate": 1.2394165755143794e-08, + "loss": 0.9811, + "step": 32174 + }, + { + "epoch": 0.97, + "learning_rate": 1.2369919192916358e-08, + "loss": 1.0122, + "step": 32175 + }, + { + "epoch": 0.97, + "learning_rate": 1.2345696311729104e-08, + "loss": 1.0525, + "step": 32176 + }, + { + "epoch": 0.97, + "learning_rate": 1.2321497111812686e-08, + "loss": 1.1224, + "step": 32177 + }, + { + "epoch": 0.97, + "learning_rate": 1.2297321593397472e-08, + "loss": 1.0502, + "step": 32178 + }, + { + "epoch": 0.97, + "learning_rate": 1.2273169756713832e-08, + "loss": 0.9763, + "step": 32179 + }, + { + "epoch": 0.97, + "learning_rate": 1.2249041601991308e-08, + "loss": 1.2797, + "step": 32180 + }, + { + "epoch": 0.97, + "learning_rate": 1.2224937129459713e-08, + "loss": 0.9897, + "step": 32181 + }, + { + "epoch": 0.97, + "learning_rate": 1.2200856339348588e-08, + "loss": 1.0587, + "step": 32182 + }, + { + "epoch": 0.97, + "learning_rate": 1.2176799231887193e-08, + "loss": 1.1329, + "step": 32183 + }, + { + "epoch": 0.97, + "learning_rate": 1.2152765807304512e-08, + "loss": 1.0825, + "step": 32184 + }, + { + "epoch": 0.97, + "learning_rate": 1.2128756065829529e-08, + "loss": 1.1367, + "step": 32185 + }, + { + "epoch": 0.97, + "learning_rate": 1.2104770007690392e-08, + "loss": 1.1483, + "step": 32186 + }, + { + "epoch": 0.97, + "learning_rate": 1.2080807633115533e-08, + "loss": 1.1967, + "step": 32187 + }, + { + "epoch": 0.97, + "learning_rate": 1.20568689423331e-08, + "loss": 0.9671, + "step": 32188 + }, + { + "epoch": 0.97, + "learning_rate": 1.2032953935571246e-08, + "loss": 1.0582, + "step": 32189 + }, + { + "epoch": 0.97, + "learning_rate": 1.2009062613057288e-08, + "loss": 0.9991, + "step": 32190 + }, + { + "epoch": 0.97, + "learning_rate": 1.19851949750191e-08, + "loss": 1.2148, + "step": 32191 + }, + { + "epoch": 0.97, + "learning_rate": 1.1961351021683165e-08, + "loss": 1.1936, + "step": 32192 + }, + { + "epoch": 0.97, + "learning_rate": 1.1937530753277082e-08, + "loss": 1.1337, + "step": 32193 + }, + { + "epoch": 0.97, + "learning_rate": 1.1913734170027335e-08, + "loss": 1.0468, + "step": 32194 + }, + { + "epoch": 0.97, + "learning_rate": 1.1889961272160689e-08, + "loss": 1.1503, + "step": 32195 + }, + { + "epoch": 0.97, + "learning_rate": 1.186621205990307e-08, + "loss": 1.035, + "step": 32196 + }, + { + "epoch": 0.97, + "learning_rate": 1.1842486533480968e-08, + "loss": 1.037, + "step": 32197 + }, + { + "epoch": 0.97, + "learning_rate": 1.1818784693120033e-08, + "loss": 1.1866, + "step": 32198 + }, + { + "epoch": 0.97, + "learning_rate": 1.179510653904592e-08, + "loss": 1.1359, + "step": 32199 + }, + { + "epoch": 0.97, + "learning_rate": 1.1771452071484002e-08, + "loss": 0.9769, + "step": 32200 + }, + { + "epoch": 0.97, + "learning_rate": 1.1747821290659379e-08, + "loss": 1.0373, + "step": 32201 + }, + { + "epoch": 0.97, + "learning_rate": 1.1724214196797423e-08, + "loss": 1.0988, + "step": 32202 + }, + { + "epoch": 0.97, + "learning_rate": 1.1700630790122403e-08, + "loss": 1.0587, + "step": 32203 + }, + { + "epoch": 0.97, + "learning_rate": 1.167707107085886e-08, + "loss": 1.0597, + "step": 32204 + }, + { + "epoch": 0.97, + "learning_rate": 1.1653535039231334e-08, + "loss": 1.1393, + "step": 32205 + }, + { + "epoch": 0.97, + "learning_rate": 1.163002269546354e-08, + "loss": 1.3167, + "step": 32206 + }, + { + "epoch": 0.97, + "learning_rate": 1.1606534039779737e-08, + "loss": 0.9854, + "step": 32207 + }, + { + "epoch": 0.97, + "learning_rate": 1.1583069072403087e-08, + "loss": 0.9651, + "step": 32208 + }, + { + "epoch": 0.97, + "learning_rate": 1.1559627793557293e-08, + "loss": 1.0236, + "step": 32209 + }, + { + "epoch": 0.97, + "learning_rate": 1.1536210203465237e-08, + "loss": 1.0598, + "step": 32210 + }, + { + "epoch": 0.97, + "learning_rate": 1.1512816302350071e-08, + "loss": 0.9752, + "step": 32211 + }, + { + "epoch": 0.97, + "learning_rate": 1.1489446090434397e-08, + "loss": 1.1187, + "step": 32212 + }, + { + "epoch": 0.97, + "learning_rate": 1.1466099567940536e-08, + "loss": 1.0753, + "step": 32213 + }, + { + "epoch": 0.97, + "learning_rate": 1.1442776735091088e-08, + "loss": 1.1328, + "step": 32214 + }, + { + "epoch": 0.97, + "learning_rate": 1.1419477592107542e-08, + "loss": 0.9756, + "step": 32215 + }, + { + "epoch": 0.97, + "learning_rate": 1.1396202139212498e-08, + "loss": 1.0298, + "step": 32216 + }, + { + "epoch": 0.97, + "learning_rate": 1.137295037662689e-08, + "loss": 1.0875, + "step": 32217 + }, + { + "epoch": 0.97, + "learning_rate": 1.1349722304571931e-08, + "loss": 1.0973, + "step": 32218 + }, + { + "epoch": 0.97, + "learning_rate": 1.1326517923269386e-08, + "loss": 1.1131, + "step": 32219 + }, + { + "epoch": 0.97, + "learning_rate": 1.1303337232939638e-08, + "loss": 1.1969, + "step": 32220 + }, + { + "epoch": 0.97, + "learning_rate": 1.1280180233803618e-08, + "loss": 1.1216, + "step": 32221 + }, + { + "epoch": 0.97, + "learning_rate": 1.1257046926081706e-08, + "loss": 1.0804, + "step": 32222 + }, + { + "epoch": 0.97, + "learning_rate": 1.1233937309994003e-08, + "loss": 1.0836, + "step": 32223 + }, + { + "epoch": 0.97, + "learning_rate": 1.1210851385760613e-08, + "loss": 1.1144, + "step": 32224 + }, + { + "epoch": 0.97, + "learning_rate": 1.118778915360108e-08, + "loss": 1.1361, + "step": 32225 + }, + { + "epoch": 0.97, + "learning_rate": 1.116475061373523e-08, + "loss": 1.1412, + "step": 32226 + }, + { + "epoch": 0.97, + "learning_rate": 1.114173576638261e-08, + "loss": 1.0588, + "step": 32227 + }, + { + "epoch": 0.97, + "learning_rate": 1.1118744611761656e-08, + "loss": 1.0907, + "step": 32228 + }, + { + "epoch": 0.97, + "learning_rate": 1.1095777150091635e-08, + "loss": 1.1606, + "step": 32229 + }, + { + "epoch": 0.97, + "learning_rate": 1.1072833381591263e-08, + "loss": 1.0048, + "step": 32230 + }, + { + "epoch": 0.97, + "learning_rate": 1.1049913306478699e-08, + "loss": 1.1354, + "step": 32231 + }, + { + "epoch": 0.97, + "learning_rate": 1.10270169249721e-08, + "loss": 1.0746, + "step": 32232 + }, + { + "epoch": 0.97, + "learning_rate": 1.1004144237289904e-08, + "loss": 1.0688, + "step": 32233 + }, + { + "epoch": 0.97, + "learning_rate": 1.0981295243649159e-08, + "loss": 1.0792, + "step": 32234 + }, + { + "epoch": 0.97, + "learning_rate": 1.0958469944268023e-08, + "loss": 1.1178, + "step": 32235 + }, + { + "epoch": 0.97, + "learning_rate": 1.093566833936327e-08, + "loss": 1.0888, + "step": 32236 + }, + { + "epoch": 0.97, + "learning_rate": 1.0912890429152501e-08, + "loss": 1.1741, + "step": 32237 + }, + { + "epoch": 0.97, + "learning_rate": 1.0890136213851932e-08, + "loss": 1.1832, + "step": 32238 + }, + { + "epoch": 0.97, + "learning_rate": 1.0867405693678334e-08, + "loss": 1.1032, + "step": 32239 + }, + { + "epoch": 0.97, + "learning_rate": 1.084469886884848e-08, + "loss": 1.0233, + "step": 32240 + }, + { + "epoch": 0.97, + "learning_rate": 1.0822015739578307e-08, + "loss": 1.1513, + "step": 32241 + }, + { + "epoch": 0.97, + "learning_rate": 1.0799356306083752e-08, + "loss": 1.1025, + "step": 32242 + }, + { + "epoch": 0.97, + "learning_rate": 1.0776720568580201e-08, + "loss": 1.0541, + "step": 32243 + }, + { + "epoch": 0.97, + "learning_rate": 1.0754108527283591e-08, + "loss": 1.0687, + "step": 32244 + }, + { + "epoch": 0.97, + "learning_rate": 1.0731520182409027e-08, + "loss": 1.1423, + "step": 32245 + }, + { + "epoch": 0.97, + "learning_rate": 1.0708955534171616e-08, + "loss": 1.1401, + "step": 32246 + }, + { + "epoch": 0.97, + "learning_rate": 1.0686414582785909e-08, + "loss": 1.0541, + "step": 32247 + }, + { + "epoch": 0.97, + "learning_rate": 1.0663897328466455e-08, + "loss": 1.1791, + "step": 32248 + }, + { + "epoch": 0.97, + "learning_rate": 1.0641403771428082e-08, + "loss": 1.0779, + "step": 32249 + }, + { + "epoch": 0.97, + "learning_rate": 1.061893391188451e-08, + "loss": 1.0324, + "step": 32250 + }, + { + "epoch": 0.97, + "learning_rate": 1.0596487750049734e-08, + "loss": 1.0801, + "step": 32251 + }, + { + "epoch": 0.97, + "learning_rate": 1.0574065286137747e-08, + "loss": 1.0723, + "step": 32252 + }, + { + "epoch": 0.97, + "learning_rate": 1.0551666520361437e-08, + "loss": 1.0315, + "step": 32253 + }, + { + "epoch": 0.97, + "learning_rate": 1.0529291452934244e-08, + "loss": 1.1265, + "step": 32254 + }, + { + "epoch": 0.97, + "learning_rate": 1.0506940084069329e-08, + "loss": 0.9989, + "step": 32255 + }, + { + "epoch": 0.97, + "learning_rate": 1.0484612413979301e-08, + "loss": 1.2179, + "step": 32256 + }, + { + "epoch": 0.97, + "learning_rate": 1.0462308442877045e-08, + "loss": 1.0564, + "step": 32257 + }, + { + "epoch": 0.97, + "learning_rate": 1.0440028170974337e-08, + "loss": 1.0771, + "step": 32258 + }, + { + "epoch": 0.97, + "learning_rate": 1.0417771598483784e-08, + "loss": 1.0723, + "step": 32259 + }, + { + "epoch": 0.97, + "learning_rate": 1.0395538725616605e-08, + "loss": 0.9776, + "step": 32260 + }, + { + "epoch": 0.97, + "learning_rate": 1.0373329552585133e-08, + "loss": 1.1885, + "step": 32261 + }, + { + "epoch": 0.97, + "learning_rate": 1.0351144079600584e-08, + "loss": 1.2202, + "step": 32262 + }, + { + "epoch": 0.97, + "learning_rate": 1.032898230687418e-08, + "loss": 1.1183, + "step": 32263 + }, + { + "epoch": 0.97, + "learning_rate": 1.0306844234616586e-08, + "loss": 1.1022, + "step": 32264 + }, + { + "epoch": 0.97, + "learning_rate": 1.0284729863038745e-08, + "loss": 1.0422, + "step": 32265 + }, + { + "epoch": 0.97, + "learning_rate": 1.0262639192351042e-08, + "loss": 1.0303, + "step": 32266 + }, + { + "epoch": 0.97, + "learning_rate": 1.0240572222764144e-08, + "loss": 0.9656, + "step": 32267 + }, + { + "epoch": 0.97, + "learning_rate": 1.0218528954487883e-08, + "loss": 1.1469, + "step": 32268 + }, + { + "epoch": 0.97, + "learning_rate": 1.019650938773209e-08, + "loss": 1.1701, + "step": 32269 + }, + { + "epoch": 0.97, + "learning_rate": 1.017451352270632e-08, + "loss": 1.0115, + "step": 32270 + }, + { + "epoch": 0.97, + "learning_rate": 1.0152541359620127e-08, + "loss": 1.1409, + "step": 32271 + }, + { + "epoch": 0.97, + "learning_rate": 1.013059289868279e-08, + "loss": 1.073, + "step": 32272 + }, + { + "epoch": 0.97, + "learning_rate": 1.0108668140102752e-08, + "loss": 1.1491, + "step": 32273 + }, + { + "epoch": 0.97, + "learning_rate": 1.008676708408901e-08, + "loss": 1.2151, + "step": 32274 + }, + { + "epoch": 0.97, + "learning_rate": 1.0064889730850014e-08, + "loss": 1.0823, + "step": 32275 + }, + { + "epoch": 0.97, + "learning_rate": 1.0043036080594205e-08, + "loss": 1.0081, + "step": 32276 + }, + { + "epoch": 0.97, + "learning_rate": 1.002120613352947e-08, + "loss": 1.0418, + "step": 32277 + }, + { + "epoch": 0.97, + "learning_rate": 9.999399889863703e-09, + "loss": 1.0154, + "step": 32278 + }, + { + "epoch": 0.97, + "learning_rate": 9.977617349804514e-09, + "loss": 1.0721, + "step": 32279 + }, + { + "epoch": 0.97, + "learning_rate": 9.955858513558959e-09, + "loss": 1.0013, + "step": 32280 + }, + { + "epoch": 0.97, + "learning_rate": 9.934123381334371e-09, + "loss": 1.0646, + "step": 32281 + }, + { + "epoch": 0.97, + "learning_rate": 9.912411953337809e-09, + "loss": 1.2466, + "step": 32282 + }, + { + "epoch": 0.97, + "learning_rate": 9.890724229775773e-09, + "loss": 1.0565, + "step": 32283 + }, + { + "epoch": 0.97, + "learning_rate": 9.869060210854764e-09, + "loss": 1.1318, + "step": 32284 + }, + { + "epoch": 0.97, + "learning_rate": 9.847419896781007e-09, + "loss": 1.0599, + "step": 32285 + }, + { + "epoch": 0.97, + "learning_rate": 9.82580328776045e-09, + "loss": 1.1633, + "step": 32286 + }, + { + "epoch": 0.97, + "learning_rate": 9.804210383999035e-09, + "loss": 1.085, + "step": 32287 + }, + { + "epoch": 0.97, + "learning_rate": 9.782641185702157e-09, + "loss": 1.1171, + "step": 32288 + }, + { + "epoch": 0.97, + "learning_rate": 9.761095693075206e-09, + "loss": 1.0875, + "step": 32289 + }, + { + "epoch": 0.97, + "learning_rate": 9.739573906323296e-09, + "loss": 1.0843, + "step": 32290 + }, + { + "epoch": 0.97, + "learning_rate": 9.718075825651264e-09, + "loss": 1.0919, + "step": 32291 + }, + { + "epoch": 0.97, + "learning_rate": 9.696601451263942e-09, + "loss": 1.1373, + "step": 32292 + }, + { + "epoch": 0.97, + "learning_rate": 9.675150783365339e-09, + "loss": 1.1404, + "step": 32293 + }, + { + "epoch": 0.97, + "learning_rate": 9.653723822160287e-09, + "loss": 1.1466, + "step": 32294 + }, + { + "epoch": 0.97, + "learning_rate": 9.632320567852239e-09, + "loss": 1.1821, + "step": 32295 + }, + { + "epoch": 0.97, + "learning_rate": 9.610941020644915e-09, + "loss": 1.0825, + "step": 32296 + }, + { + "epoch": 0.97, + "learning_rate": 9.589585180742044e-09, + "loss": 1.098, + "step": 32297 + }, + { + "epoch": 0.97, + "learning_rate": 9.568253048347075e-09, + "loss": 1.2363, + "step": 32298 + }, + { + "epoch": 0.97, + "learning_rate": 9.546944623662901e-09, + "loss": 1.1172, + "step": 32299 + }, + { + "epoch": 0.97, + "learning_rate": 9.525659906892138e-09, + "loss": 0.9097, + "step": 32300 + }, + { + "epoch": 0.97, + "learning_rate": 9.504398898237955e-09, + "loss": 1.0856, + "step": 32301 + }, + { + "epoch": 0.97, + "learning_rate": 9.483161597902412e-09, + "loss": 1.0341, + "step": 32302 + }, + { + "epoch": 0.97, + "learning_rate": 9.461948006087296e-09, + "loss": 0.9861, + "step": 32303 + }, + { + "epoch": 0.97, + "learning_rate": 9.44075812299522e-09, + "loss": 0.9123, + "step": 32304 + }, + { + "epoch": 0.97, + "learning_rate": 9.419591948827689e-09, + "loss": 1.1392, + "step": 32305 + }, + { + "epoch": 0.97, + "learning_rate": 9.398449483785932e-09, + "loss": 0.9457, + "step": 32306 + }, + { + "epoch": 0.97, + "learning_rate": 9.377330728071732e-09, + "loss": 1.0699, + "step": 32307 + }, + { + "epoch": 0.97, + "learning_rate": 9.356235681885484e-09, + "loss": 1.0717, + "step": 32308 + }, + { + "epoch": 0.97, + "learning_rate": 9.335164345428415e-09, + "loss": 1.1133, + "step": 32309 + }, + { + "epoch": 0.97, + "learning_rate": 9.3141167189012e-09, + "loss": 1.0747, + "step": 32310 + }, + { + "epoch": 0.97, + "learning_rate": 9.293092802503956e-09, + "loss": 1.1505, + "step": 32311 + }, + { + "epoch": 0.97, + "learning_rate": 9.272092596437077e-09, + "loss": 1.0567, + "step": 32312 + }, + { + "epoch": 0.97, + "learning_rate": 9.251116100900127e-09, + "loss": 0.9261, + "step": 32313 + }, + { + "epoch": 0.97, + "learning_rate": 9.230163316092944e-09, + "loss": 1.0665, + "step": 32314 + }, + { + "epoch": 0.97, + "learning_rate": 9.209234242215093e-09, + "loss": 0.9871, + "step": 32315 + }, + { + "epoch": 0.97, + "learning_rate": 9.18832887946558e-09, + "loss": 1.0899, + "step": 32316 + }, + { + "epoch": 0.97, + "learning_rate": 9.167447228043691e-09, + "loss": 1.0623, + "step": 32317 + }, + { + "epoch": 0.97, + "learning_rate": 9.146589288147877e-09, + "loss": 1.0087, + "step": 32318 + }, + { + "epoch": 0.97, + "learning_rate": 9.125755059977149e-09, + "loss": 1.2467, + "step": 32319 + }, + { + "epoch": 0.97, + "learning_rate": 9.1049445437294e-09, + "loss": 1.1689, + "step": 32320 + }, + { + "epoch": 0.97, + "learning_rate": 9.084157739603083e-09, + "loss": 0.9968, + "step": 32321 + }, + { + "epoch": 0.97, + "learning_rate": 9.06339464779582e-09, + "loss": 1.1396, + "step": 32322 + }, + { + "epoch": 0.97, + "learning_rate": 9.042655268505506e-09, + "loss": 1.0665, + "step": 32323 + }, + { + "epoch": 0.97, + "learning_rate": 9.021939601929209e-09, + "loss": 1.2098, + "step": 32324 + }, + { + "epoch": 0.97, + "learning_rate": 9.001247648264545e-09, + "loss": 1.062, + "step": 32325 + }, + { + "epoch": 0.97, + "learning_rate": 8.9805794077083e-09, + "loss": 0.9898, + "step": 32326 + }, + { + "epoch": 0.97, + "learning_rate": 8.959934880456989e-09, + "loss": 1.1451, + "step": 32327 + }, + { + "epoch": 0.97, + "learning_rate": 8.939314066707672e-09, + "loss": 1.0358, + "step": 32328 + }, + { + "epoch": 0.97, + "learning_rate": 8.918716966656026e-09, + "loss": 1.0682, + "step": 32329 + }, + { + "epoch": 0.97, + "learning_rate": 8.898143580498564e-09, + "loss": 1.0883, + "step": 32330 + }, + { + "epoch": 0.97, + "learning_rate": 8.877593908431237e-09, + "loss": 1.0489, + "step": 32331 + }, + { + "epoch": 0.97, + "learning_rate": 8.857067950649167e-09, + "loss": 1.058, + "step": 32332 + }, + { + "epoch": 0.97, + "learning_rate": 8.836565707348033e-09, + "loss": 1.0659, + "step": 32333 + }, + { + "epoch": 0.97, + "learning_rate": 8.816087178723231e-09, + "loss": 1.1172, + "step": 32334 + }, + { + "epoch": 0.97, + "learning_rate": 8.795632364969331e-09, + "loss": 1.0728, + "step": 32335 + }, + { + "epoch": 0.97, + "learning_rate": 8.775201266281174e-09, + "loss": 1.0164, + "step": 32336 + }, + { + "epoch": 0.97, + "learning_rate": 8.754793882853606e-09, + "loss": 1.1564, + "step": 32337 + }, + { + "epoch": 0.97, + "learning_rate": 8.734410214880363e-09, + "loss": 1.0857, + "step": 32338 + }, + { + "epoch": 0.97, + "learning_rate": 8.714050262555452e-09, + "loss": 1.1276, + "step": 32339 + }, + { + "epoch": 0.97, + "learning_rate": 8.693714026073163e-09, + "loss": 1.0186, + "step": 32340 + }, + { + "epoch": 0.97, + "learning_rate": 8.673401505626956e-09, + "loss": 1.0894, + "step": 32341 + }, + { + "epoch": 0.97, + "learning_rate": 8.653112701410005e-09, + "loss": 1.0152, + "step": 32342 + }, + { + "epoch": 0.97, + "learning_rate": 8.632847613615492e-09, + "loss": 1.3068, + "step": 32343 + }, + { + "epoch": 0.97, + "learning_rate": 8.612606242436317e-09, + "loss": 1.0107, + "step": 32344 + }, + { + "epoch": 0.97, + "learning_rate": 8.592388588065382e-09, + "loss": 1.0499, + "step": 32345 + }, + { + "epoch": 0.97, + "learning_rate": 8.572194650695031e-09, + "loss": 1.0676, + "step": 32346 + }, + { + "epoch": 0.97, + "learning_rate": 8.552024430517613e-09, + "loss": 1.0692, + "step": 32347 + }, + { + "epoch": 0.97, + "learning_rate": 8.531877927724641e-09, + "loss": 1.0576, + "step": 32348 + }, + { + "epoch": 0.97, + "learning_rate": 8.51175514250846e-09, + "loss": 1.2061, + "step": 32349 + }, + { + "epoch": 0.97, + "learning_rate": 8.491656075060584e-09, + "loss": 1.062, + "step": 32350 + }, + { + "epoch": 0.97, + "learning_rate": 8.471580725571971e-09, + "loss": 1.1083, + "step": 32351 + }, + { + "epoch": 0.97, + "learning_rate": 8.451529094233857e-09, + "loss": 1.077, + "step": 32352 + }, + { + "epoch": 0.97, + "learning_rate": 8.431501181237478e-09, + "loss": 1.0482, + "step": 32353 + }, + { + "epoch": 0.97, + "learning_rate": 8.41149698677296e-09, + "loss": 1.1935, + "step": 32354 + }, + { + "epoch": 0.97, + "learning_rate": 8.39151651103126e-09, + "loss": 1.1384, + "step": 32355 + }, + { + "epoch": 0.97, + "learning_rate": 8.37155975420223e-09, + "loss": 1.0097, + "step": 32356 + }, + { + "epoch": 0.97, + "learning_rate": 8.351626716475713e-09, + "loss": 1.0839, + "step": 32357 + }, + { + "epoch": 0.97, + "learning_rate": 8.331717398041839e-09, + "loss": 1.0058, + "step": 32358 + }, + { + "epoch": 0.97, + "learning_rate": 8.311831799090175e-09, + "loss": 1.0312, + "step": 32359 + }, + { + "epoch": 0.97, + "learning_rate": 8.291969919809461e-09, + "loss": 0.9178, + "step": 32360 + }, + { + "epoch": 0.97, + "learning_rate": 8.272131760389545e-09, + "loss": 1.1338, + "step": 32361 + }, + { + "epoch": 0.97, + "learning_rate": 8.25231732101861e-09, + "loss": 1.2524, + "step": 32362 + }, + { + "epoch": 0.97, + "learning_rate": 8.23252660188567e-09, + "loss": 1.071, + "step": 32363 + }, + { + "epoch": 0.97, + "learning_rate": 8.21275960317891e-09, + "loss": 1.1588, + "step": 32364 + }, + { + "epoch": 0.97, + "learning_rate": 8.19301632508679e-09, + "loss": 1.1115, + "step": 32365 + }, + { + "epoch": 0.98, + "learning_rate": 8.173296767796934e-09, + "loss": 1.1391, + "step": 32366 + }, + { + "epoch": 0.98, + "learning_rate": 8.153600931497253e-09, + "loss": 1.0914, + "step": 32367 + }, + { + "epoch": 0.98, + "learning_rate": 8.133928816375091e-09, + "loss": 1.1705, + "step": 32368 + }, + { + "epoch": 0.98, + "learning_rate": 8.114280422617804e-09, + "loss": 1.0513, + "step": 32369 + }, + { + "epoch": 0.98, + "learning_rate": 8.094655750412461e-09, + "loss": 1.078, + "step": 32370 + }, + { + "epoch": 0.98, + "learning_rate": 8.075054799945858e-09, + "loss": 1.1055, + "step": 32371 + }, + { + "epoch": 0.98, + "learning_rate": 8.055477571404514e-09, + "loss": 1.114, + "step": 32372 + }, + { + "epoch": 0.98, + "learning_rate": 8.035924064974943e-09, + "loss": 1.0952, + "step": 32373 + }, + { + "epoch": 0.98, + "learning_rate": 8.01639428084311e-09, + "loss": 1.0546, + "step": 32374 + }, + { + "epoch": 0.98, + "learning_rate": 7.996888219194975e-09, + "loss": 1.0975, + "step": 32375 + }, + { + "epoch": 0.98, + "learning_rate": 7.977405880216505e-09, + "loss": 1.104, + "step": 32376 + }, + { + "epoch": 0.98, + "learning_rate": 7.957947264092825e-09, + "loss": 1.0142, + "step": 32377 + }, + { + "epoch": 0.98, + "learning_rate": 7.938512371009066e-09, + "loss": 1.0611, + "step": 32378 + }, + { + "epoch": 0.98, + "learning_rate": 7.919101201150637e-09, + "loss": 1.1364, + "step": 32379 + }, + { + "epoch": 0.98, + "learning_rate": 7.899713754702388e-09, + "loss": 1.1249, + "step": 32380 + }, + { + "epoch": 0.98, + "learning_rate": 7.880350031848339e-09, + "loss": 1.2734, + "step": 32381 + }, + { + "epoch": 0.98, + "learning_rate": 7.861010032773065e-09, + "loss": 0.9941, + "step": 32382 + }, + { + "epoch": 0.98, + "learning_rate": 7.841693757660861e-09, + "loss": 1.0834, + "step": 32383 + }, + { + "epoch": 0.98, + "learning_rate": 7.822401206695474e-09, + "loss": 1.1321, + "step": 32384 + }, + { + "epoch": 0.98, + "learning_rate": 7.803132380060363e-09, + "loss": 1.045, + "step": 32385 + }, + { + "epoch": 0.98, + "learning_rate": 7.783887277939273e-09, + "loss": 1.0479, + "step": 32386 + }, + { + "epoch": 0.98, + "learning_rate": 7.76466590051539e-09, + "loss": 1.1682, + "step": 32387 + }, + { + "epoch": 0.98, + "learning_rate": 7.745468247971343e-09, + "loss": 1.1753, + "step": 32388 + }, + { + "epoch": 0.98, + "learning_rate": 7.726294320490325e-09, + "loss": 1.0698, + "step": 32389 + }, + { + "epoch": 0.98, + "learning_rate": 7.707144118254684e-09, + "loss": 1.1418, + "step": 32390 + }, + { + "epoch": 0.98, + "learning_rate": 7.6880176414465e-09, + "loss": 1.1094, + "step": 32391 + }, + { + "epoch": 0.98, + "learning_rate": 7.668914890248403e-09, + "loss": 1.1028, + "step": 32392 + }, + { + "epoch": 0.98, + "learning_rate": 7.649835864841637e-09, + "loss": 1.0488, + "step": 32393 + }, + { + "epoch": 0.98, + "learning_rate": 7.630780565408002e-09, + "loss": 1.0711, + "step": 32394 + }, + { + "epoch": 0.98, + "learning_rate": 7.61174899212902e-09, + "loss": 1.0685, + "step": 32395 + }, + { + "epoch": 0.98, + "learning_rate": 7.592741145185933e-09, + "loss": 1.1194, + "step": 32396 + }, + { + "epoch": 0.98, + "learning_rate": 7.573757024759709e-09, + "loss": 1.0906, + "step": 32397 + }, + { + "epoch": 0.98, + "learning_rate": 7.554796631030481e-09, + "loss": 1.0951, + "step": 32398 + }, + { + "epoch": 0.98, + "learning_rate": 7.535859964179493e-09, + "loss": 1.1421, + "step": 32399 + }, + { + "epoch": 0.98, + "learning_rate": 7.5169470243866e-09, + "loss": 1.1073, + "step": 32400 + }, + { + "epoch": 0.98, + "learning_rate": 7.498057811831937e-09, + "loss": 1.0613, + "step": 32401 + }, + { + "epoch": 0.98, + "learning_rate": 7.479192326695638e-09, + "loss": 1.0477, + "step": 32402 + }, + { + "epoch": 0.98, + "learning_rate": 7.46035056915645e-09, + "loss": 1.1135, + "step": 32403 + }, + { + "epoch": 0.98, + "learning_rate": 7.44153253939478e-09, + "loss": 1.1343, + "step": 32404 + }, + { + "epoch": 0.98, + "learning_rate": 7.422738237588822e-09, + "loss": 1.2129, + "step": 32405 + }, + { + "epoch": 0.98, + "learning_rate": 7.403967663918432e-09, + "loss": 1.1201, + "step": 32406 + }, + { + "epoch": 0.98, + "learning_rate": 7.385220818561245e-09, + "loss": 1.0242, + "step": 32407 + }, + { + "epoch": 0.98, + "learning_rate": 7.3664977016965626e-09, + "loss": 1.0931, + "step": 32408 + }, + { + "epoch": 0.98, + "learning_rate": 7.347798313502297e-09, + "loss": 1.1352, + "step": 32409 + }, + { + "epoch": 0.98, + "learning_rate": 7.32912265415664e-09, + "loss": 1.1661, + "step": 32410 + }, + { + "epoch": 0.98, + "learning_rate": 7.310470723836949e-09, + "loss": 1.0197, + "step": 32411 + }, + { + "epoch": 0.98, + "learning_rate": 7.291842522721415e-09, + "loss": 1.079, + "step": 32412 + }, + { + "epoch": 0.98, + "learning_rate": 7.273238050986564e-09, + "loss": 1.1975, + "step": 32413 + }, + { + "epoch": 0.98, + "learning_rate": 7.254657308810309e-09, + "loss": 1.1544, + "step": 32414 + }, + { + "epoch": 0.98, + "learning_rate": 7.236100296368898e-09, + "loss": 1.0768, + "step": 32415 + }, + { + "epoch": 0.98, + "learning_rate": 7.2175670138394106e-09, + "loss": 1.1495, + "step": 32416 + }, + { + "epoch": 0.98, + "learning_rate": 7.199057461398095e-09, + "loss": 1.124, + "step": 32417 + }, + { + "epoch": 0.98, + "learning_rate": 7.180571639221201e-09, + "loss": 1.0035, + "step": 32418 + }, + { + "epoch": 0.98, + "learning_rate": 7.162109547484697e-09, + "loss": 1.0455, + "step": 32419 + }, + { + "epoch": 0.98, + "learning_rate": 7.143671186364276e-09, + "loss": 1.0928, + "step": 32420 + }, + { + "epoch": 0.98, + "learning_rate": 7.125256556035354e-09, + "loss": 1.1298, + "step": 32421 + }, + { + "epoch": 0.98, + "learning_rate": 7.106865656673623e-09, + "loss": 1.1865, + "step": 32422 + }, + { + "epoch": 0.98, + "learning_rate": 7.088498488453943e-09, + "loss": 1.1432, + "step": 32423 + }, + { + "epoch": 0.98, + "learning_rate": 7.070155051550898e-09, + "loss": 1.0673, + "step": 32424 + }, + { + "epoch": 0.98, + "learning_rate": 7.051835346139346e-09, + "loss": 1.1373, + "step": 32425 + }, + { + "epoch": 0.98, + "learning_rate": 7.033539372393872e-09, + "loss": 1.0493, + "step": 32426 + }, + { + "epoch": 0.98, + "learning_rate": 7.015267130488223e-09, + "loss": 1.0778, + "step": 32427 + }, + { + "epoch": 0.98, + "learning_rate": 6.997018620596985e-09, + "loss": 1.1292, + "step": 32428 + }, + { + "epoch": 0.98, + "learning_rate": 6.978793842893072e-09, + "loss": 1.1078, + "step": 32429 + }, + { + "epoch": 0.98, + "learning_rate": 6.960592797550514e-09, + "loss": 1.1899, + "step": 32430 + }, + { + "epoch": 0.98, + "learning_rate": 6.942415484742226e-09, + "loss": 1.04, + "step": 32431 + }, + { + "epoch": 0.98, + "learning_rate": 6.924261904641682e-09, + "loss": 1.0472, + "step": 32432 + }, + { + "epoch": 0.98, + "learning_rate": 6.906132057421522e-09, + "loss": 1.1293, + "step": 32433 + }, + { + "epoch": 0.98, + "learning_rate": 6.8880259432541066e-09, + "loss": 0.9515, + "step": 32434 + }, + { + "epoch": 0.98, + "learning_rate": 6.869943562311798e-09, + "loss": 1.0689, + "step": 32435 + }, + { + "epoch": 0.98, + "learning_rate": 6.851884914767237e-09, + "loss": 1.2748, + "step": 32436 + }, + { + "epoch": 0.98, + "learning_rate": 6.833850000791675e-09, + "loss": 1.1932, + "step": 32437 + }, + { + "epoch": 0.98, + "learning_rate": 6.815838820557474e-09, + "loss": 1.0554, + "step": 32438 + }, + { + "epoch": 0.98, + "learning_rate": 6.797851374235331e-09, + "loss": 1.0097, + "step": 32439 + }, + { + "epoch": 0.98, + "learning_rate": 6.779887661997054e-09, + "loss": 1.1466, + "step": 32440 + }, + { + "epoch": 0.98, + "learning_rate": 6.761947684013614e-09, + "loss": 1.1191, + "step": 32441 + }, + { + "epoch": 0.98, + "learning_rate": 6.744031440455434e-09, + "loss": 1.1445, + "step": 32442 + }, + { + "epoch": 0.98, + "learning_rate": 6.726138931493209e-09, + "loss": 1.2711, + "step": 32443 + }, + { + "epoch": 0.98, + "learning_rate": 6.708270157297636e-09, + "loss": 1.0488, + "step": 32444 + }, + { + "epoch": 0.98, + "learning_rate": 6.690425118038302e-09, + "loss": 1.0294, + "step": 32445 + }, + { + "epoch": 0.98, + "learning_rate": 6.672603813885348e-09, + "loss": 1.0305, + "step": 32446 + }, + { + "epoch": 0.98, + "learning_rate": 6.6548062450083605e-09, + "loss": 1.0813, + "step": 32447 + }, + { + "epoch": 0.98, + "learning_rate": 6.637032411576927e-09, + "loss": 1.0101, + "step": 32448 + }, + { + "epoch": 0.98, + "learning_rate": 6.619282313760078e-09, + "loss": 0.9954, + "step": 32449 + }, + { + "epoch": 0.98, + "learning_rate": 6.601555951726568e-09, + "loss": 1.1716, + "step": 32450 + }, + { + "epoch": 0.98, + "learning_rate": 6.583853325645706e-09, + "loss": 1.1389, + "step": 32451 + }, + { + "epoch": 0.98, + "learning_rate": 6.566174435685413e-09, + "loss": 1.018, + "step": 32452 + }, + { + "epoch": 0.98, + "learning_rate": 6.548519282014443e-09, + "loss": 1.0961, + "step": 32453 + }, + { + "epoch": 0.98, + "learning_rate": 6.530887864800717e-09, + "loss": 1.0795, + "step": 32454 + }, + { + "epoch": 0.98, + "learning_rate": 6.513280184211878e-09, + "loss": 1.03, + "step": 32455 + }, + { + "epoch": 0.98, + "learning_rate": 6.495696240415572e-09, + "loss": 1.1017, + "step": 32456 + }, + { + "epoch": 0.98, + "learning_rate": 6.4781360335797184e-09, + "loss": 1.0852, + "step": 32457 + }, + { + "epoch": 0.98, + "learning_rate": 6.460599563870851e-09, + "loss": 1.1778, + "step": 32458 + }, + { + "epoch": 0.98, + "learning_rate": 6.443086831456058e-09, + "loss": 1.0931, + "step": 32459 + }, + { + "epoch": 0.98, + "learning_rate": 6.425597836502428e-09, + "loss": 1.098, + "step": 32460 + }, + { + "epoch": 0.98, + "learning_rate": 6.408132579175941e-09, + "loss": 1.113, + "step": 32461 + }, + { + "epoch": 0.98, + "learning_rate": 6.390691059643128e-09, + "loss": 1.029, + "step": 32462 + }, + { + "epoch": 0.98, + "learning_rate": 6.373273278069969e-09, + "loss": 1.084, + "step": 32463 + }, + { + "epoch": 0.98, + "learning_rate": 6.355879234622164e-09, + "loss": 1.0249, + "step": 32464 + }, + { + "epoch": 0.98, + "learning_rate": 6.3385089294656925e-09, + "loss": 1.1052, + "step": 32465 + }, + { + "epoch": 0.98, + "learning_rate": 6.321162362765421e-09, + "loss": 0.9319, + "step": 32466 + }, + { + "epoch": 0.98, + "learning_rate": 6.303839534686773e-09, + "loss": 1.1909, + "step": 32467 + }, + { + "epoch": 0.98, + "learning_rate": 6.2865404453946176e-09, + "loss": 1.2425, + "step": 32468 + }, + { + "epoch": 0.98, + "learning_rate": 6.269265095053267e-09, + "loss": 1.022, + "step": 32469 + }, + { + "epoch": 0.98, + "learning_rate": 6.252013483827868e-09, + "loss": 1.1049, + "step": 32470 + }, + { + "epoch": 0.98, + "learning_rate": 6.234785611882177e-09, + "loss": 1.0953, + "step": 32471 + }, + { + "epoch": 0.98, + "learning_rate": 6.217581479379953e-09, + "loss": 1.0559, + "step": 32472 + }, + { + "epoch": 0.98, + "learning_rate": 6.200401086485786e-09, + "loss": 0.9772, + "step": 32473 + }, + { + "epoch": 0.98, + "learning_rate": 6.183244433362323e-09, + "loss": 1.1921, + "step": 32474 + }, + { + "epoch": 0.98, + "learning_rate": 6.166111520173601e-09, + "loss": 1.0353, + "step": 32475 + }, + { + "epoch": 0.98, + "learning_rate": 6.149002347082544e-09, + "loss": 1.0784, + "step": 32476 + }, + { + "epoch": 0.98, + "learning_rate": 6.131916914251524e-09, + "loss": 1.0784, + "step": 32477 + }, + { + "epoch": 0.98, + "learning_rate": 6.1148552218437404e-09, + "loss": 1.0605, + "step": 32478 + }, + { + "epoch": 0.98, + "learning_rate": 6.097817270021567e-09, + "loss": 1.0583, + "step": 32479 + }, + { + "epoch": 0.98, + "learning_rate": 6.080803058947093e-09, + "loss": 1.0915, + "step": 32480 + }, + { + "epoch": 0.98, + "learning_rate": 6.063812588781859e-09, + "loss": 1.0917, + "step": 32481 + }, + { + "epoch": 0.98, + "learning_rate": 6.04684585968851e-09, + "loss": 1.0431, + "step": 32482 + }, + { + "epoch": 0.98, + "learning_rate": 6.029902871827753e-09, + "loss": 1.0805, + "step": 32483 + }, + { + "epoch": 0.98, + "learning_rate": 6.012983625361124e-09, + "loss": 1.0807, + "step": 32484 + }, + { + "epoch": 0.98, + "learning_rate": 5.996088120449884e-09, + "loss": 1.103, + "step": 32485 + }, + { + "epoch": 0.98, + "learning_rate": 5.979216357254736e-09, + "loss": 1.0273, + "step": 32486 + }, + { + "epoch": 0.98, + "learning_rate": 5.962368335936386e-09, + "loss": 1.0938, + "step": 32487 + }, + { + "epoch": 0.98, + "learning_rate": 5.945544056654984e-09, + "loss": 1.0557, + "step": 32488 + }, + { + "epoch": 0.98, + "learning_rate": 5.928743519570957e-09, + "loss": 1.0009, + "step": 32489 + }, + { + "epoch": 0.98, + "learning_rate": 5.911966724843899e-09, + "loss": 1.0597, + "step": 32490 + }, + { + "epoch": 0.98, + "learning_rate": 5.895213672633682e-09, + "loss": 1.0495, + "step": 32491 + }, + { + "epoch": 0.98, + "learning_rate": 5.878484363100179e-09, + "loss": 1.213, + "step": 32492 + }, + { + "epoch": 0.98, + "learning_rate": 5.861778796402151e-09, + "loss": 1.2117, + "step": 32493 + }, + { + "epoch": 0.98, + "learning_rate": 5.845096972698638e-09, + "loss": 1.1191, + "step": 32494 + }, + { + "epoch": 0.98, + "learning_rate": 5.82843889214868e-09, + "loss": 1.2012, + "step": 32495 + }, + { + "epoch": 0.98, + "learning_rate": 5.811804554910483e-09, + "loss": 1.0813, + "step": 32496 + }, + { + "epoch": 0.98, + "learning_rate": 5.795193961143086e-09, + "loss": 1.0425, + "step": 32497 + }, + { + "epoch": 0.98, + "learning_rate": 5.778607111003864e-09, + "loss": 1.0366, + "step": 32498 + }, + { + "epoch": 0.98, + "learning_rate": 5.762044004651302e-09, + "loss": 1.1232, + "step": 32499 + }, + { + "epoch": 0.98, + "learning_rate": 5.745504642242494e-09, + "loss": 1.1447, + "step": 32500 + }, + { + "epoch": 0.98, + "learning_rate": 5.728989023935649e-09, + "loss": 1.1318, + "step": 32501 + }, + { + "epoch": 0.98, + "learning_rate": 5.712497149887308e-09, + "loss": 1.0199, + "step": 32502 + }, + { + "epoch": 0.98, + "learning_rate": 5.696029020254567e-09, + "loss": 1.1353, + "step": 32503 + }, + { + "epoch": 0.98, + "learning_rate": 5.6795846351945235e-09, + "loss": 1.0341, + "step": 32504 + }, + { + "epoch": 0.98, + "learning_rate": 5.663163994863441e-09, + "loss": 1.155, + "step": 32505 + }, + { + "epoch": 0.98, + "learning_rate": 5.64676709941786e-09, + "loss": 1.0893, + "step": 32506 + }, + { + "epoch": 0.98, + "learning_rate": 5.630393949013491e-09, + "loss": 1.0992, + "step": 32507 + }, + { + "epoch": 0.98, + "learning_rate": 5.614044543806596e-09, + "loss": 1.1069, + "step": 32508 + }, + { + "epoch": 0.98, + "learning_rate": 5.597718883952607e-09, + "loss": 1.0738, + "step": 32509 + }, + { + "epoch": 0.98, + "learning_rate": 5.581416969606957e-09, + "loss": 1.1644, + "step": 32510 + }, + { + "epoch": 0.98, + "learning_rate": 5.565138800925074e-09, + "loss": 1.0945, + "step": 32511 + }, + { + "epoch": 0.98, + "learning_rate": 5.548884378061559e-09, + "loss": 1.0604, + "step": 32512 + }, + { + "epoch": 0.98, + "learning_rate": 5.532653701171286e-09, + "loss": 1.2464, + "step": 32513 + }, + { + "epoch": 0.98, + "learning_rate": 5.5164467704088566e-09, + "loss": 1.093, + "step": 32514 + }, + { + "epoch": 0.98, + "learning_rate": 5.500263585928311e-09, + "loss": 1.0667, + "step": 32515 + }, + { + "epoch": 0.98, + "learning_rate": 5.484104147883973e-09, + "loss": 1.1332, + "step": 32516 + }, + { + "epoch": 0.98, + "learning_rate": 5.467968456429607e-09, + "loss": 1.0869, + "step": 32517 + }, + { + "epoch": 0.98, + "learning_rate": 5.4518565117187e-09, + "loss": 1.1408, + "step": 32518 + }, + { + "epoch": 0.98, + "learning_rate": 5.4357683139047436e-09, + "loss": 1.0555, + "step": 32519 + }, + { + "epoch": 0.98, + "learning_rate": 5.419703863140669e-09, + "loss": 1.0792, + "step": 32520 + }, + { + "epoch": 0.98, + "learning_rate": 5.403663159579686e-09, + "loss": 1.1612, + "step": 32521 + }, + { + "epoch": 0.98, + "learning_rate": 5.3876462033744524e-09, + "loss": 0.9602, + "step": 32522 + }, + { + "epoch": 0.98, + "learning_rate": 5.371652994677345e-09, + "loss": 1.1098, + "step": 32523 + }, + { + "epoch": 0.98, + "learning_rate": 5.355683533640743e-09, + "loss": 1.1166, + "step": 32524 + }, + { + "epoch": 0.98, + "learning_rate": 5.339737820416469e-09, + "loss": 1.0582, + "step": 32525 + }, + { + "epoch": 0.98, + "learning_rate": 5.323815855156622e-09, + "loss": 0.9882, + "step": 32526 + }, + { + "epoch": 0.98, + "learning_rate": 5.307917638012195e-09, + "loss": 1.0654, + "step": 32527 + }, + { + "epoch": 0.98, + "learning_rate": 5.292043169135286e-09, + "loss": 1.028, + "step": 32528 + }, + { + "epoch": 0.98, + "learning_rate": 5.276192448676331e-09, + "loss": 1.0421, + "step": 32529 + }, + { + "epoch": 0.98, + "learning_rate": 5.2603654767866e-09, + "loss": 1.0629, + "step": 32530 + }, + { + "epoch": 0.98, + "learning_rate": 5.244562253616803e-09, + "loss": 1.0819, + "step": 32531 + }, + { + "epoch": 0.98, + "learning_rate": 5.2287827793170985e-09, + "loss": 1.0402, + "step": 32532 + }, + { + "epoch": 0.98, + "learning_rate": 5.213027054037922e-09, + "loss": 1.0789, + "step": 32533 + }, + { + "epoch": 0.98, + "learning_rate": 5.1972950779294315e-09, + "loss": 1.1253, + "step": 32534 + }, + { + "epoch": 0.98, + "learning_rate": 5.181586851140952e-09, + "loss": 1.053, + "step": 32535 + }, + { + "epoch": 0.98, + "learning_rate": 5.1659023738220845e-09, + "loss": 1.0714, + "step": 32536 + }, + { + "epoch": 0.98, + "learning_rate": 5.150241646122434e-09, + "loss": 1.2047, + "step": 32537 + }, + { + "epoch": 0.98, + "learning_rate": 5.134604668191046e-09, + "loss": 0.9828, + "step": 32538 + }, + { + "epoch": 0.98, + "learning_rate": 5.118991440176413e-09, + "loss": 1.0327, + "step": 32539 + }, + { + "epoch": 0.98, + "learning_rate": 5.103401962227583e-09, + "loss": 0.976, + "step": 32540 + }, + { + "epoch": 0.98, + "learning_rate": 5.087836234492494e-09, + "loss": 1.0768, + "step": 32541 + }, + { + "epoch": 0.98, + "learning_rate": 5.072294257119914e-09, + "loss": 0.9483, + "step": 32542 + }, + { + "epoch": 0.98, + "learning_rate": 5.056776030257227e-09, + "loss": 1.1124, + "step": 32543 + }, + { + "epoch": 0.98, + "learning_rate": 5.041281554052646e-09, + "loss": 1.0861, + "step": 32544 + }, + { + "epoch": 0.98, + "learning_rate": 5.0258108286535545e-09, + "loss": 1.0483, + "step": 32545 + }, + { + "epoch": 0.98, + "learning_rate": 5.010363854206779e-09, + "loss": 1.0048, + "step": 32546 + }, + { + "epoch": 0.98, + "learning_rate": 4.994940630859979e-09, + "loss": 1.0233, + "step": 32547 + }, + { + "epoch": 0.98, + "learning_rate": 4.9795411587597045e-09, + "loss": 1.0973, + "step": 32548 + }, + { + "epoch": 0.98, + "learning_rate": 4.964165438052504e-09, + "loss": 1.0595, + "step": 32549 + }, + { + "epoch": 0.98, + "learning_rate": 4.94881346888465e-09, + "loss": 1.1553, + "step": 32550 + }, + { + "epoch": 0.98, + "learning_rate": 4.933485251402692e-09, + "loss": 1.1311, + "step": 32551 + }, + { + "epoch": 0.98, + "learning_rate": 4.918180785752069e-09, + "loss": 1.0249, + "step": 32552 + }, + { + "epoch": 0.98, + "learning_rate": 4.902900072078775e-09, + "loss": 1.1226, + "step": 32553 + }, + { + "epoch": 0.98, + "learning_rate": 4.887643110528251e-09, + "loss": 1.1137, + "step": 32554 + }, + { + "epoch": 0.98, + "learning_rate": 4.872409901245379e-09, + "loss": 1.1719, + "step": 32555 + }, + { + "epoch": 0.98, + "learning_rate": 4.857200444375876e-09, + "loss": 1.1305, + "step": 32556 + }, + { + "epoch": 0.98, + "learning_rate": 4.842014740063794e-09, + "loss": 1.033, + "step": 32557 + }, + { + "epoch": 0.98, + "learning_rate": 4.826852788454295e-09, + "loss": 1.0668, + "step": 32558 + }, + { + "epoch": 0.98, + "learning_rate": 4.81171458969143e-09, + "loss": 1.1264, + "step": 32559 + }, + { + "epoch": 0.98, + "learning_rate": 4.7966001439189724e-09, + "loss": 1.0706, + "step": 32560 + }, + { + "epoch": 0.98, + "learning_rate": 4.78150945128153e-09, + "loss": 1.1646, + "step": 32561 + }, + { + "epoch": 0.98, + "learning_rate": 4.76644251192232e-09, + "loss": 1.1857, + "step": 32562 + }, + { + "epoch": 0.98, + "learning_rate": 4.751399325984563e-09, + "loss": 0.9002, + "step": 32563 + }, + { + "epoch": 0.98, + "learning_rate": 4.736379893612031e-09, + "loss": 1.0148, + "step": 32564 + }, + { + "epoch": 0.98, + "learning_rate": 4.721384214947388e-09, + "loss": 1.0192, + "step": 32565 + }, + { + "epoch": 0.98, + "learning_rate": 4.7064122901332995e-09, + "loss": 1.0419, + "step": 32566 + }, + { + "epoch": 0.98, + "learning_rate": 4.691464119312428e-09, + "loss": 1.0366, + "step": 32567 + }, + { + "epoch": 0.98, + "learning_rate": 4.676539702626881e-09, + "loss": 1.0931, + "step": 32568 + }, + { + "epoch": 0.98, + "learning_rate": 4.661639040219046e-09, + "loss": 1.139, + "step": 32569 + }, + { + "epoch": 0.98, + "learning_rate": 4.646762132230753e-09, + "loss": 1.0704, + "step": 32570 + }, + { + "epoch": 0.98, + "learning_rate": 4.631908978803279e-09, + "loss": 1.0095, + "step": 32571 + }, + { + "epoch": 0.98, + "learning_rate": 4.617079580078176e-09, + "loss": 1.0514, + "step": 32572 + }, + { + "epoch": 0.98, + "learning_rate": 4.602273936196721e-09, + "loss": 1.1299, + "step": 32573 + }, + { + "epoch": 0.98, + "learning_rate": 4.5874920472996355e-09, + "loss": 1.1273, + "step": 32574 + }, + { + "epoch": 0.98, + "learning_rate": 4.572733913528193e-09, + "loss": 1.0112, + "step": 32575 + }, + { + "epoch": 0.98, + "learning_rate": 4.557999535022284e-09, + "loss": 1.0216, + "step": 32576 + }, + { + "epoch": 0.98, + "learning_rate": 4.543288911922072e-09, + "loss": 1.0455, + "step": 32577 + }, + { + "epoch": 0.98, + "learning_rate": 4.52860204436828e-09, + "loss": 1.1057, + "step": 32578 + }, + { + "epoch": 0.98, + "learning_rate": 4.513938932500239e-09, + "loss": 0.9619, + "step": 32579 + }, + { + "epoch": 0.98, + "learning_rate": 4.499299576457561e-09, + "loss": 1.0167, + "step": 32580 + }, + { + "epoch": 0.98, + "learning_rate": 4.4846839763798554e-09, + "loss": 1.1088, + "step": 32581 + }, + { + "epoch": 0.98, + "learning_rate": 4.470092132405901e-09, + "loss": 1.1568, + "step": 32582 + }, + { + "epoch": 0.98, + "learning_rate": 4.455524044674753e-09, + "loss": 1.1051, + "step": 32583 + }, + { + "epoch": 0.98, + "learning_rate": 4.440979713325189e-09, + "loss": 1.0437, + "step": 32584 + }, + { + "epoch": 0.98, + "learning_rate": 4.426459138495709e-09, + "loss": 1.1271, + "step": 32585 + }, + { + "epoch": 0.98, + "learning_rate": 4.411962320324259e-09, + "loss": 1.0916, + "step": 32586 + }, + { + "epoch": 0.98, + "learning_rate": 4.397489258949061e-09, + "loss": 0.9971, + "step": 32587 + }, + { + "epoch": 0.98, + "learning_rate": 4.383039954507784e-09, + "loss": 1.0444, + "step": 32588 + }, + { + "epoch": 0.98, + "learning_rate": 4.368614407138094e-09, + "loss": 1.0005, + "step": 32589 + }, + { + "epoch": 0.98, + "learning_rate": 4.354212616977382e-09, + "loss": 1.1541, + "step": 32590 + }, + { + "epoch": 0.98, + "learning_rate": 4.339834584162484e-09, + "loss": 1.0985, + "step": 32591 + }, + { + "epoch": 0.98, + "learning_rate": 4.3254803088305095e-09, + "loss": 1.0259, + "step": 32592 + }, + { + "epoch": 0.98, + "learning_rate": 4.311149791118019e-09, + "loss": 1.126, + "step": 32593 + }, + { + "epoch": 0.98, + "learning_rate": 4.296843031161291e-09, + "loss": 1.0098, + "step": 32594 + }, + { + "epoch": 0.98, + "learning_rate": 4.2825600290966055e-09, + "loss": 1.1636, + "step": 32595 + }, + { + "epoch": 0.98, + "learning_rate": 4.268300785060242e-09, + "loss": 1.1236, + "step": 32596 + }, + { + "epoch": 0.98, + "learning_rate": 4.254065299187371e-09, + "loss": 1.0424, + "step": 32597 + }, + { + "epoch": 0.98, + "learning_rate": 4.239853571613994e-09, + "loss": 1.0413, + "step": 32598 + }, + { + "epoch": 0.98, + "learning_rate": 4.225665602475004e-09, + "loss": 1.0682, + "step": 32599 + }, + { + "epoch": 0.98, + "learning_rate": 4.211501391905848e-09, + "loss": 1.1567, + "step": 32600 + }, + { + "epoch": 0.98, + "learning_rate": 4.1973609400411395e-09, + "loss": 1.068, + "step": 32601 + }, + { + "epoch": 0.98, + "learning_rate": 4.1832442470154945e-09, + "loss": 1.1434, + "step": 32602 + }, + { + "epoch": 0.98, + "learning_rate": 4.169151312963526e-09, + "loss": 1.1478, + "step": 32603 + }, + { + "epoch": 0.98, + "learning_rate": 4.155082138019018e-09, + "loss": 1.0905, + "step": 32604 + }, + { + "epoch": 0.98, + "learning_rate": 4.141036722316027e-09, + "loss": 1.0401, + "step": 32605 + }, + { + "epoch": 0.98, + "learning_rate": 4.127015065988338e-09, + "loss": 1.1451, + "step": 32606 + }, + { + "epoch": 0.98, + "learning_rate": 4.113017169169453e-09, + "loss": 1.0205, + "step": 32607 + }, + { + "epoch": 0.98, + "learning_rate": 4.0990430319928774e-09, + "loss": 1.0353, + "step": 32608 + }, + { + "epoch": 0.98, + "learning_rate": 4.085092654591005e-09, + "loss": 1.0972, + "step": 32609 + }, + { + "epoch": 0.98, + "learning_rate": 4.071166037097063e-09, + "loss": 1.1974, + "step": 32610 + }, + { + "epoch": 0.98, + "learning_rate": 4.057263179643445e-09, + "loss": 1.0593, + "step": 32611 + }, + { + "epoch": 0.98, + "learning_rate": 4.043384082362545e-09, + "loss": 1.1821, + "step": 32612 + }, + { + "epoch": 0.98, + "learning_rate": 4.029528745386757e-09, + "loss": 1.297, + "step": 32613 + }, + { + "epoch": 0.98, + "learning_rate": 4.015697168847643e-09, + "loss": 1.0175, + "step": 32614 + }, + { + "epoch": 0.98, + "learning_rate": 4.001889352877042e-09, + "loss": 0.9843, + "step": 32615 + }, + { + "epoch": 0.98, + "learning_rate": 3.988105297606515e-09, + "loss": 1.1321, + "step": 32616 + }, + { + "epoch": 0.98, + "learning_rate": 3.97434500316679e-09, + "loss": 1.0825, + "step": 32617 + }, + { + "epoch": 0.98, + "learning_rate": 3.9606084696894305e-09, + "loss": 1.0781, + "step": 32618 + }, + { + "epoch": 0.98, + "learning_rate": 3.946895697304609e-09, + "loss": 1.0476, + "step": 32619 + }, + { + "epoch": 0.98, + "learning_rate": 3.933206686143332e-09, + "loss": 1.0308, + "step": 32620 + }, + { + "epoch": 0.98, + "learning_rate": 3.91954143633605e-09, + "loss": 1.0921, + "step": 32621 + }, + { + "epoch": 0.98, + "learning_rate": 3.905899948012382e-09, + "loss": 1.0678, + "step": 32622 + }, + { + "epoch": 0.98, + "learning_rate": 3.8922822213022235e-09, + "loss": 1.1912, + "step": 32623 + }, + { + "epoch": 0.98, + "learning_rate": 3.8786882563354725e-09, + "loss": 1.1833, + "step": 32624 + }, + { + "epoch": 0.98, + "learning_rate": 3.8651180532414675e-09, + "loss": 1.303, + "step": 32625 + }, + { + "epoch": 0.98, + "learning_rate": 3.851571612149551e-09, + "loss": 1.061, + "step": 32626 + }, + { + "epoch": 0.98, + "learning_rate": 3.838048933188232e-09, + "loss": 1.0184, + "step": 32627 + }, + { + "epoch": 0.98, + "learning_rate": 3.824550016486572e-09, + "loss": 1.0865, + "step": 32628 + }, + { + "epoch": 0.98, + "learning_rate": 3.811074862173081e-09, + "loss": 1.1362, + "step": 32629 + }, + { + "epoch": 0.98, + "learning_rate": 3.797623470375711e-09, + "loss": 1.1071, + "step": 32630 + }, + { + "epoch": 0.98, + "learning_rate": 3.784195841222971e-09, + "loss": 1.1478, + "step": 32631 + }, + { + "epoch": 0.98, + "learning_rate": 3.770791974842536e-09, + "loss": 1.0986, + "step": 32632 + }, + { + "epoch": 0.98, + "learning_rate": 3.757411871361804e-09, + "loss": 1.0543, + "step": 32633 + }, + { + "epoch": 0.98, + "learning_rate": 3.744055530908175e-09, + "loss": 1.0584, + "step": 32634 + }, + { + "epoch": 0.98, + "learning_rate": 3.730722953609045e-09, + "loss": 1.1419, + "step": 32635 + }, + { + "epoch": 0.98, + "learning_rate": 3.717414139591258e-09, + "loss": 1.1889, + "step": 32636 + }, + { + "epoch": 0.98, + "learning_rate": 3.704129088981101e-09, + "loss": 0.972, + "step": 32637 + }, + { + "epoch": 0.98, + "learning_rate": 3.6908678019056953e-09, + "loss": 1.065, + "step": 32638 + }, + { + "epoch": 0.98, + "learning_rate": 3.6776302784907737e-09, + "loss": 1.0607, + "step": 32639 + }, + { + "epoch": 0.98, + "learning_rate": 3.664416518862901e-09, + "loss": 1.108, + "step": 32640 + }, + { + "epoch": 0.98, + "learning_rate": 3.6512265231472554e-09, + "loss": 1.0568, + "step": 32641 + }, + { + "epoch": 0.98, + "learning_rate": 3.6380602914695695e-09, + "loss": 1.1011, + "step": 32642 + }, + { + "epoch": 0.98, + "learning_rate": 3.6249178239552987e-09, + "loss": 1.1254, + "step": 32643 + }, + { + "epoch": 0.98, + "learning_rate": 3.6117991207296197e-09, + "loss": 1.0485, + "step": 32644 + }, + { + "epoch": 0.98, + "learning_rate": 3.5987041819171565e-09, + "loss": 1.1829, + "step": 32645 + }, + { + "epoch": 0.98, + "learning_rate": 3.585633007642808e-09, + "loss": 1.1196, + "step": 32646 + }, + { + "epoch": 0.98, + "learning_rate": 3.57258559803092e-09, + "loss": 1.1739, + "step": 32647 + }, + { + "epoch": 0.98, + "learning_rate": 3.5595619532058368e-09, + "loss": 1.1769, + "step": 32648 + }, + { + "epoch": 0.98, + "learning_rate": 3.546562073291071e-09, + "loss": 0.9977, + "step": 32649 + }, + { + "epoch": 0.98, + "learning_rate": 3.5335859584109676e-09, + "loss": 1.0135, + "step": 32650 + }, + { + "epoch": 0.98, + "learning_rate": 3.5206336086887614e-09, + "loss": 1.0948, + "step": 32651 + }, + { + "epoch": 0.98, + "learning_rate": 3.5077050242476872e-09, + "loss": 1.1271, + "step": 32652 + }, + { + "epoch": 0.98, + "learning_rate": 3.49480020521098e-09, + "loss": 1.0814, + "step": 32653 + }, + { + "epoch": 0.98, + "learning_rate": 3.4819191517013182e-09, + "loss": 1.1174, + "step": 32654 + }, + { + "epoch": 0.98, + "learning_rate": 3.4690618638416605e-09, + "loss": 1.1843, + "step": 32655 + }, + { + "epoch": 0.98, + "learning_rate": 3.4562283417538535e-09, + "loss": 1.0983, + "step": 32656 + }, + { + "epoch": 0.98, + "learning_rate": 3.443418585560576e-09, + "loss": 0.9296, + "step": 32657 + }, + { + "epoch": 0.98, + "learning_rate": 3.4306325953833985e-09, + "loss": 1.0596, + "step": 32658 + }, + { + "epoch": 0.98, + "learning_rate": 3.417870371344445e-09, + "loss": 1.0571, + "step": 32659 + }, + { + "epoch": 0.98, + "learning_rate": 3.4051319135647297e-09, + "loss": 1.1896, + "step": 32660 + }, + { + "epoch": 0.98, + "learning_rate": 3.3924172221658225e-09, + "loss": 1.1899, + "step": 32661 + }, + { + "epoch": 0.98, + "learning_rate": 3.3797262972687372e-09, + "loss": 1.1158, + "step": 32662 + }, + { + "epoch": 0.98, + "learning_rate": 3.367059138994211e-09, + "loss": 1.09, + "step": 32663 + }, + { + "epoch": 0.98, + "learning_rate": 3.35441574746298e-09, + "loss": 1.2325, + "step": 32664 + }, + { + "epoch": 0.98, + "learning_rate": 3.3417961227952268e-09, + "loss": 1.0806, + "step": 32665 + }, + { + "epoch": 0.98, + "learning_rate": 3.329200265111132e-09, + "loss": 0.9831, + "step": 32666 + }, + { + "epoch": 0.98, + "learning_rate": 3.3166281745306004e-09, + "loss": 1.1553, + "step": 32667 + }, + { + "epoch": 0.98, + "learning_rate": 3.3040798511732585e-09, + "loss": 1.1967, + "step": 32668 + }, + { + "epoch": 0.98, + "learning_rate": 3.2915552951587326e-09, + "loss": 1.09, + "step": 32669 + }, + { + "epoch": 0.98, + "learning_rate": 3.2790545066060943e-09, + "loss": 1.0671, + "step": 32670 + }, + { + "epoch": 0.98, + "learning_rate": 3.2665774856344144e-09, + "loss": 1.0367, + "step": 32671 + }, + { + "epoch": 0.98, + "learning_rate": 3.2541242323624878e-09, + "loss": 1.054, + "step": 32672 + }, + { + "epoch": 0.98, + "learning_rate": 3.24169474690883e-09, + "loss": 1.1054, + "step": 32673 + }, + { + "epoch": 0.98, + "learning_rate": 3.22928902939168e-09, + "loss": 1.0978, + "step": 32674 + }, + { + "epoch": 0.98, + "learning_rate": 3.216907079929277e-09, + "loss": 1.0309, + "step": 32675 + }, + { + "epoch": 0.98, + "learning_rate": 3.2045488986393037e-09, + "loss": 1.0515, + "step": 32676 + }, + { + "epoch": 0.98, + "learning_rate": 3.1922144856397217e-09, + "loss": 1.1605, + "step": 32677 + }, + { + "epoch": 0.98, + "learning_rate": 3.1799038410473826e-09, + "loss": 1.1091, + "step": 32678 + }, + { + "epoch": 0.98, + "learning_rate": 3.167616964980247e-09, + "loss": 1.2257, + "step": 32679 + }, + { + "epoch": 0.98, + "learning_rate": 3.155353857554888e-09, + "loss": 1.0551, + "step": 32680 + }, + { + "epoch": 0.98, + "learning_rate": 3.14311451888788e-09, + "loss": 1.0538, + "step": 32681 + }, + { + "epoch": 0.98, + "learning_rate": 3.1308989490957953e-09, + "loss": 1.0955, + "step": 32682 + }, + { + "epoch": 0.98, + "learning_rate": 3.118707148295208e-09, + "loss": 1.1013, + "step": 32683 + }, + { + "epoch": 0.98, + "learning_rate": 3.1065391166018586e-09, + "loss": 1.0082, + "step": 32684 + }, + { + "epoch": 0.98, + "learning_rate": 3.094394854131766e-09, + "loss": 1.0777, + "step": 32685 + }, + { + "epoch": 0.98, + "learning_rate": 3.0822743610003926e-09, + "loss": 1.0446, + "step": 32686 + }, + { + "epoch": 0.98, + "learning_rate": 3.0701776373234794e-09, + "loss": 1.1489, + "step": 32687 + }, + { + "epoch": 0.98, + "learning_rate": 3.058104683215657e-09, + "loss": 1.0818, + "step": 32688 + }, + { + "epoch": 0.98, + "learning_rate": 3.046055498792111e-09, + "loss": 1.1526, + "step": 32689 + }, + { + "epoch": 0.98, + "learning_rate": 3.0340300841677496e-09, + "loss": 1.027, + "step": 32690 + }, + { + "epoch": 0.98, + "learning_rate": 3.022028439456648e-09, + "loss": 1.0894, + "step": 32691 + }, + { + "epoch": 0.98, + "learning_rate": 3.0100505647734368e-09, + "loss": 1.1348, + "step": 32692 + }, + { + "epoch": 0.98, + "learning_rate": 2.9980964602316364e-09, + "loss": 1.2909, + "step": 32693 + }, + { + "epoch": 0.98, + "learning_rate": 2.9861661259456e-09, + "loss": 1.0248, + "step": 32694 + }, + { + "epoch": 0.98, + "learning_rate": 2.9742595620285696e-09, + "loss": 1.1171, + "step": 32695 + }, + { + "epoch": 0.98, + "learning_rate": 2.9623767685940665e-09, + "loss": 1.1752, + "step": 32696 + }, + { + "epoch": 0.98, + "learning_rate": 2.950517745755055e-09, + "loss": 1.1448, + "step": 32697 + }, + { + "epoch": 0.99, + "learning_rate": 2.9386824936245005e-09, + "loss": 1.0889, + "step": 32698 + }, + { + "epoch": 0.99, + "learning_rate": 2.926871012315091e-09, + "loss": 1.0824, + "step": 32699 + }, + { + "epoch": 0.99, + "learning_rate": 2.9150833019392365e-09, + "loss": 1.1677, + "step": 32700 + }, + { + "epoch": 0.99, + "learning_rate": 2.9033193626090694e-09, + "loss": 1.0873, + "step": 32701 + }, + { + "epoch": 0.99, + "learning_rate": 2.891579194436722e-09, + "loss": 1.1024, + "step": 32702 + }, + { + "epoch": 0.99, + "learning_rate": 2.8798627975340498e-09, + "loss": 1.1747, + "step": 32703 + }, + { + "epoch": 0.99, + "learning_rate": 2.8681701720123523e-09, + "loss": 1.123, + "step": 32704 + }, + { + "epoch": 0.99, + "learning_rate": 2.8565013179829295e-09, + "loss": 1.0046, + "step": 32705 + }, + { + "epoch": 0.99, + "learning_rate": 2.8448562355568033e-09, + "loss": 1.1218, + "step": 32706 + }, + { + "epoch": 0.99, + "learning_rate": 2.833234924845274e-09, + "loss": 0.9737, + "step": 32707 + }, + { + "epoch": 0.99, + "learning_rate": 2.821637385958531e-09, + "loss": 1.1271, + "step": 32708 + }, + { + "epoch": 0.99, + "learning_rate": 2.8100636190070418e-09, + "loss": 0.98, + "step": 32709 + }, + { + "epoch": 0.99, + "learning_rate": 2.7985136241012732e-09, + "loss": 1.0897, + "step": 32710 + }, + { + "epoch": 0.99, + "learning_rate": 2.7869874013505826e-09, + "loss": 1.1155, + "step": 32711 + }, + { + "epoch": 0.99, + "learning_rate": 2.775484950865437e-09, + "loss": 1.1077, + "step": 32712 + }, + { + "epoch": 0.99, + "learning_rate": 2.7640062727549155e-09, + "loss": 1.0744, + "step": 32713 + }, + { + "epoch": 0.99, + "learning_rate": 2.752551367128098e-09, + "loss": 1.0507, + "step": 32714 + }, + { + "epoch": 0.99, + "learning_rate": 2.7411202340946186e-09, + "loss": 1.0537, + "step": 32715 + }, + { + "epoch": 0.99, + "learning_rate": 2.7297128737627245e-09, + "loss": 0.9501, + "step": 32716 + }, + { + "epoch": 0.99, + "learning_rate": 2.718329286241217e-09, + "loss": 1.2564, + "step": 32717 + }, + { + "epoch": 0.99, + "learning_rate": 2.706969471638621e-09, + "loss": 1.1821, + "step": 32718 + }, + { + "epoch": 0.99, + "learning_rate": 2.695633430062905e-09, + "loss": 1.1156, + "step": 32719 + }, + { + "epoch": 0.99, + "learning_rate": 2.6843211616220386e-09, + "loss": 1.1915, + "step": 32720 + }, + { + "epoch": 0.99, + "learning_rate": 2.6730326664234364e-09, + "loss": 1.0839, + "step": 32721 + }, + { + "epoch": 0.99, + "learning_rate": 2.6617679445750664e-09, + "loss": 1.1377, + "step": 32722 + }, + { + "epoch": 0.99, + "learning_rate": 2.6505269961840663e-09, + "loss": 1.1266, + "step": 32723 + }, + { + "epoch": 0.99, + "learning_rate": 2.6393098213570168e-09, + "loss": 1.1127, + "step": 32724 + }, + { + "epoch": 0.99, + "learning_rate": 2.6281164202010545e-09, + "loss": 1.0921, + "step": 32725 + }, + { + "epoch": 0.99, + "learning_rate": 2.6169467928224835e-09, + "loss": 1.0608, + "step": 32726 + }, + { + "epoch": 0.99, + "learning_rate": 2.605800939327885e-09, + "loss": 1.0396, + "step": 32727 + }, + { + "epoch": 0.99, + "learning_rate": 2.5946788598235627e-09, + "loss": 1.0038, + "step": 32728 + }, + { + "epoch": 0.99, + "learning_rate": 2.583580554414711e-09, + "loss": 1.1472, + "step": 32729 + }, + { + "epoch": 0.99, + "learning_rate": 2.5725060232076326e-09, + "loss": 1.1957, + "step": 32730 + }, + { + "epoch": 0.99, + "learning_rate": 2.5614552663072447e-09, + "loss": 1.1996, + "step": 32731 + }, + { + "epoch": 0.99, + "learning_rate": 2.550428283819295e-09, + "loss": 1.1118, + "step": 32732 + }, + { + "epoch": 0.99, + "learning_rate": 2.5394250758481454e-09, + "loss": 1.1401, + "step": 32733 + }, + { + "epoch": 0.99, + "learning_rate": 2.528445642498989e-09, + "loss": 1.1232, + "step": 32734 + }, + { + "epoch": 0.99, + "learning_rate": 2.5174899838764646e-09, + "loss": 1.0806, + "step": 32735 + }, + { + "epoch": 0.99, + "learning_rate": 2.5065581000840998e-09, + "loss": 1.1951, + "step": 32736 + }, + { + "epoch": 0.99, + "learning_rate": 2.4956499912268117e-09, + "loss": 1.1475, + "step": 32737 + }, + { + "epoch": 0.99, + "learning_rate": 2.484765657408128e-09, + "loss": 1.1766, + "step": 32738 + }, + { + "epoch": 0.99, + "learning_rate": 2.473905098731577e-09, + "loss": 1.0806, + "step": 32739 + }, + { + "epoch": 0.99, + "learning_rate": 2.46306831530041e-09, + "loss": 0.9979, + "step": 32740 + }, + { + "epoch": 0.99, + "learning_rate": 2.4522553072181543e-09, + "loss": 1.1201, + "step": 32741 + }, + { + "epoch": 0.99, + "learning_rate": 2.4414660745875064e-09, + "loss": 1.0072, + "step": 32742 + }, + { + "epoch": 0.99, + "learning_rate": 2.4307006175111614e-09, + "loss": 1.2632, + "step": 32743 + }, + { + "epoch": 0.99, + "learning_rate": 2.419958936091815e-09, + "loss": 1.0059, + "step": 32744 + }, + { + "epoch": 0.99, + "learning_rate": 2.4092410304316085e-09, + "loss": 1.1726, + "step": 32745 + }, + { + "epoch": 0.99, + "learning_rate": 2.3985469006324036e-09, + "loss": 1.0747, + "step": 32746 + }, + { + "epoch": 0.99, + "learning_rate": 2.3878765467963414e-09, + "loss": 1.0398, + "step": 32747 + }, + { + "epoch": 0.99, + "learning_rate": 2.3772299690247302e-09, + "loss": 1.1367, + "step": 32748 + }, + { + "epoch": 0.99, + "learning_rate": 2.366607167418877e-09, + "loss": 1.1457, + "step": 32749 + }, + { + "epoch": 0.99, + "learning_rate": 2.356008142080091e-09, + "loss": 1.0748, + "step": 32750 + }, + { + "epoch": 0.99, + "learning_rate": 2.345432893109123e-09, + "loss": 1.0067, + "step": 32751 + }, + { + "epoch": 0.99, + "learning_rate": 2.3348814206067273e-09, + "loss": 1.0923, + "step": 32752 + }, + { + "epoch": 0.99, + "learning_rate": 2.3243537246733783e-09, + "loss": 1.0444, + "step": 32753 + }, + { + "epoch": 0.99, + "learning_rate": 2.3138498054092738e-09, + "loss": 1.1155, + "step": 32754 + }, + { + "epoch": 0.99, + "learning_rate": 2.3033696629146116e-09, + "loss": 1.223, + "step": 32755 + }, + { + "epoch": 0.99, + "learning_rate": 2.292913297288757e-09, + "loss": 1.2086, + "step": 32756 + }, + { + "epoch": 0.99, + "learning_rate": 2.2824807086313517e-09, + "loss": 0.9819, + "step": 32757 + }, + { + "epoch": 0.99, + "learning_rate": 2.272071897041761e-09, + "loss": 1.0792, + "step": 32758 + }, + { + "epoch": 0.99, + "learning_rate": 2.26168686261935e-09, + "loss": 1.0242, + "step": 32759 + }, + { + "epoch": 0.99, + "learning_rate": 2.2513256054623734e-09, + "loss": 0.9921, + "step": 32760 + }, + { + "epoch": 0.99, + "learning_rate": 2.240988125670196e-09, + "loss": 1.0677, + "step": 32761 + }, + { + "epoch": 0.99, + "learning_rate": 2.2306744233405176e-09, + "loss": 1.1472, + "step": 32762 + }, + { + "epoch": 0.99, + "learning_rate": 2.220384498572148e-09, + "loss": 1.065, + "step": 32763 + }, + { + "epoch": 0.99, + "learning_rate": 2.210118351462509e-09, + "loss": 1.0328, + "step": 32764 + }, + { + "epoch": 0.99, + "learning_rate": 2.199875982109856e-09, + "loss": 1.2087, + "step": 32765 + }, + { + "epoch": 0.99, + "learning_rate": 2.189657390611055e-09, + "loss": 1.0804, + "step": 32766 + }, + { + "epoch": 0.99, + "learning_rate": 2.1794625770638068e-09, + "loss": 1.0328, + "step": 32767 + }, + { + "epoch": 0.99, + "learning_rate": 2.1692915415652547e-09, + "loss": 1.0096, + "step": 32768 + }, + { + "epoch": 0.99, + "learning_rate": 2.1591442842119893e-09, + "loss": 1.0526, + "step": 32769 + }, + { + "epoch": 0.99, + "learning_rate": 2.149020805100599e-09, + "loss": 1.1413, + "step": 32770 + }, + { + "epoch": 0.99, + "learning_rate": 2.138921104327396e-09, + "loss": 1.1548, + "step": 32771 + }, + { + "epoch": 0.99, + "learning_rate": 2.12884518198897e-09, + "loss": 1.0594, + "step": 32772 + }, + { + "epoch": 0.99, + "learning_rate": 2.1187930381807996e-09, + "loss": 1.0617, + "step": 32773 + }, + { + "epoch": 0.99, + "learning_rate": 2.108764672998642e-09, + "loss": 1.1303, + "step": 32774 + }, + { + "epoch": 0.99, + "learning_rate": 2.0987600865379767e-09, + "loss": 1.2361, + "step": 32775 + }, + { + "epoch": 0.99, + "learning_rate": 2.088779278894004e-09, + "loss": 0.9827, + "step": 32776 + }, + { + "epoch": 0.99, + "learning_rate": 2.078822250161927e-09, + "loss": 1.1492, + "step": 32777 + }, + { + "epoch": 0.99, + "learning_rate": 2.068889000436669e-09, + "loss": 1.089, + "step": 32778 + }, + { + "epoch": 0.99, + "learning_rate": 2.0589795298123214e-09, + "loss": 1.1031, + "step": 32779 + }, + { + "epoch": 0.99, + "learning_rate": 2.0490938383832537e-09, + "loss": 1.0451, + "step": 32780 + }, + { + "epoch": 0.99, + "learning_rate": 2.039231926244112e-09, + "loss": 0.9561, + "step": 32781 + }, + { + "epoch": 0.99, + "learning_rate": 2.0293937934881548e-09, + "loss": 1.0874, + "step": 32782 + }, + { + "epoch": 0.99, + "learning_rate": 2.0195794402094737e-09, + "loss": 1.0676, + "step": 32783 + }, + { + "epoch": 0.99, + "learning_rate": 2.0097888665013276e-09, + "loss": 1.1261, + "step": 32784 + }, + { + "epoch": 0.99, + "learning_rate": 2.0000220724566977e-09, + "loss": 1.0959, + "step": 32785 + }, + { + "epoch": 0.99, + "learning_rate": 1.99027905816912e-09, + "loss": 1.0768, + "step": 32786 + }, + { + "epoch": 0.99, + "learning_rate": 1.9805598237307434e-09, + "loss": 1.0234, + "step": 32787 + }, + { + "epoch": 0.99, + "learning_rate": 1.9708643692345488e-09, + "loss": 1.0037, + "step": 32788 + }, + { + "epoch": 0.99, + "learning_rate": 1.961192694772407e-09, + "loss": 1.0569, + "step": 32789 + }, + { + "epoch": 0.99, + "learning_rate": 1.9515448004367443e-09, + "loss": 1.0892, + "step": 32790 + }, + { + "epoch": 0.99, + "learning_rate": 1.941920686319154e-09, + "loss": 1.113, + "step": 32791 + }, + { + "epoch": 0.99, + "learning_rate": 1.9323203525115076e-09, + "loss": 1.0422, + "step": 32792 + }, + { + "epoch": 0.99, + "learning_rate": 1.92274379910512e-09, + "loss": 1.261, + "step": 32793 + }, + { + "epoch": 0.99, + "learning_rate": 1.91319102619103e-09, + "loss": 0.9921, + "step": 32794 + }, + { + "epoch": 0.99, + "learning_rate": 1.9036620338602763e-09, + "loss": 1.0803, + "step": 32795 + }, + { + "epoch": 0.99, + "learning_rate": 1.8941568222033415e-09, + "loss": 1.1416, + "step": 32796 + }, + { + "epoch": 0.99, + "learning_rate": 1.8846753913109862e-09, + "loss": 1.1434, + "step": 32797 + }, + { + "epoch": 0.99, + "learning_rate": 1.8752177412734164e-09, + "loss": 1.1588, + "step": 32798 + }, + { + "epoch": 0.99, + "learning_rate": 1.86578387218056e-09, + "loss": 1.0052, + "step": 32799 + }, + { + "epoch": 0.99, + "learning_rate": 1.8563737841226226e-09, + "loss": 1.0939, + "step": 32800 + }, + { + "epoch": 0.99, + "learning_rate": 1.8469874771884222e-09, + "loss": 1.0578, + "step": 32801 + }, + { + "epoch": 0.99, + "learning_rate": 1.8376249514681644e-09, + "loss": 1.0856, + "step": 32802 + }, + { + "epoch": 0.99, + "learning_rate": 1.8282862070501118e-09, + "loss": 1.0179, + "step": 32803 + }, + { + "epoch": 0.99, + "learning_rate": 1.818971244023915e-09, + "loss": 1.0359, + "step": 32804 + }, + { + "epoch": 0.99, + "learning_rate": 1.8096800624778366e-09, + "loss": 1.0449, + "step": 32805 + }, + { + "epoch": 0.99, + "learning_rate": 1.8004126625006946e-09, + "loss": 1.1094, + "step": 32806 + }, + { + "epoch": 0.99, + "learning_rate": 1.7911690441801965e-09, + "loss": 1.1449, + "step": 32807 + }, + { + "epoch": 0.99, + "learning_rate": 1.7819492076046051e-09, + "loss": 1.1735, + "step": 32808 + }, + { + "epoch": 0.99, + "learning_rate": 1.772753152861628e-09, + "loss": 1.0289, + "step": 32809 + }, + { + "epoch": 0.99, + "learning_rate": 1.763580880038973e-09, + "loss": 1.1125, + "step": 32810 + }, + { + "epoch": 0.99, + "learning_rate": 1.7544323892237925e-09, + "loss": 1.0915, + "step": 32811 + }, + { + "epoch": 0.99, + "learning_rate": 1.7453076805032387e-09, + "loss": 1.0774, + "step": 32812 + }, + { + "epoch": 0.99, + "learning_rate": 1.736206753964187e-09, + "loss": 1.0709, + "step": 32813 + }, + { + "epoch": 0.99, + "learning_rate": 1.7271296096932344e-09, + "loss": 1.0799, + "step": 32814 + }, + { + "epoch": 0.99, + "learning_rate": 1.718076247776701e-09, + "loss": 1.1234, + "step": 32815 + }, + { + "epoch": 0.99, + "learning_rate": 1.7090466683009066e-09, + "loss": 1.0687, + "step": 32816 + }, + { + "epoch": 0.99, + "learning_rate": 1.7000408713516158e-09, + "loss": 1.0125, + "step": 32817 + }, + { + "epoch": 0.99, + "learning_rate": 1.691058857014871e-09, + "loss": 1.0692, + "step": 32818 + }, + { + "epoch": 0.99, + "learning_rate": 1.6821006253761596e-09, + "loss": 1.1587, + "step": 32819 + }, + { + "epoch": 0.99, + "learning_rate": 1.6731661765204133e-09, + "loss": 1.1519, + "step": 32820 + }, + { + "epoch": 0.99, + "learning_rate": 1.6642555105331192e-09, + "loss": 0.986, + "step": 32821 + }, + { + "epoch": 0.99, + "learning_rate": 1.6553686274986548e-09, + "loss": 1.0167, + "step": 32822 + }, + { + "epoch": 0.99, + "learning_rate": 1.6465055275019514e-09, + "loss": 1.1545, + "step": 32823 + }, + { + "epoch": 0.99, + "learning_rate": 1.637666210627109e-09, + "loss": 1.2226, + "step": 32824 + }, + { + "epoch": 0.99, + "learning_rate": 1.6288506769585044e-09, + "loss": 1.0765, + "step": 32825 + }, + { + "epoch": 0.99, + "learning_rate": 1.6200589265799594e-09, + "loss": 1.1653, + "step": 32826 + }, + { + "epoch": 0.99, + "learning_rate": 1.6112909595752958e-09, + "loss": 1.1585, + "step": 32827 + }, + { + "epoch": 0.99, + "learning_rate": 1.6025467760277802e-09, + "loss": 1.1305, + "step": 32828 + }, + { + "epoch": 0.99, + "learning_rate": 1.5938263760209571e-09, + "loss": 1.0206, + "step": 32829 + }, + { + "epoch": 0.99, + "learning_rate": 1.5851297596372605e-09, + "loss": 0.9833, + "step": 32830 + }, + { + "epoch": 0.99, + "learning_rate": 1.5764569269602348e-09, + "loss": 1.0361, + "step": 32831 + }, + { + "epoch": 0.99, + "learning_rate": 1.5678078780717587e-09, + "loss": 1.0941, + "step": 32832 + }, + { + "epoch": 0.99, + "learning_rate": 1.559182613054544e-09, + "loss": 1.1262, + "step": 32833 + }, + { + "epoch": 0.99, + "learning_rate": 1.5505811319907471e-09, + "loss": 1.163, + "step": 32834 + }, + { + "epoch": 0.99, + "learning_rate": 1.542003434962247e-09, + "loss": 1.0958, + "step": 32835 + }, + { + "epoch": 0.99, + "learning_rate": 1.5334495220503676e-09, + "loss": 0.9916, + "step": 32836 + }, + { + "epoch": 0.99, + "learning_rate": 1.5249193933367102e-09, + "loss": 1.1051, + "step": 32837 + }, + { + "epoch": 0.99, + "learning_rate": 1.5164130489025986e-09, + "loss": 1.019, + "step": 32838 + }, + { + "epoch": 0.99, + "learning_rate": 1.5079304888288015e-09, + "loss": 1.1089, + "step": 32839 + }, + { + "epoch": 0.99, + "learning_rate": 1.4994717131963654e-09, + "loss": 1.0121, + "step": 32840 + }, + { + "epoch": 0.99, + "learning_rate": 1.4910367220855038e-09, + "loss": 1.113, + "step": 32841 + }, + { + "epoch": 0.99, + "learning_rate": 1.4826255155767077e-09, + "loss": 1.1696, + "step": 32842 + }, + { + "epoch": 0.99, + "learning_rate": 1.4742380937499135e-09, + "loss": 1.0948, + "step": 32843 + }, + { + "epoch": 0.99, + "learning_rate": 1.465874456685057e-09, + "loss": 1.1561, + "step": 32844 + }, + { + "epoch": 0.99, + "learning_rate": 1.4575346044617966e-09, + "loss": 1.1322, + "step": 32845 + }, + { + "epoch": 0.99, + "learning_rate": 1.4492185371595135e-09, + "loss": 0.9749, + "step": 32846 + }, + { + "epoch": 0.99, + "learning_rate": 1.440926254857311e-09, + "loss": 0.9479, + "step": 32847 + }, + { + "epoch": 0.99, + "learning_rate": 1.4326577576340151e-09, + "loss": 1.0287, + "step": 32848 + }, + { + "epoch": 0.99, + "learning_rate": 1.4244130455684512e-09, + "loss": 1.0435, + "step": 32849 + }, + { + "epoch": 0.99, + "learning_rate": 1.416192118739168e-09, + "loss": 1.0645, + "step": 32850 + }, + { + "epoch": 0.99, + "learning_rate": 1.407994977224436e-09, + "loss": 1.0635, + "step": 32851 + }, + { + "epoch": 0.99, + "learning_rate": 1.3998216211022486e-09, + "loss": 1.0594, + "step": 32852 + }, + { + "epoch": 0.99, + "learning_rate": 1.391672050450321e-09, + "loss": 1.0491, + "step": 32853 + }, + { + "epoch": 0.99, + "learning_rate": 1.3835462653463693e-09, + "loss": 1.0195, + "step": 32854 + }, + { + "epoch": 0.99, + "learning_rate": 1.3754442658678314e-09, + "loss": 1.1389, + "step": 32855 + }, + { + "epoch": 0.99, + "learning_rate": 1.3673660520915899e-09, + "loss": 1.1413, + "step": 32856 + }, + { + "epoch": 0.99, + "learning_rate": 1.359311624094528e-09, + "loss": 1.0491, + "step": 32857 + }, + { + "epoch": 0.99, + "learning_rate": 1.3512809819532513e-09, + "loss": 1.0213, + "step": 32858 + }, + { + "epoch": 0.99, + "learning_rate": 1.3432741257446424e-09, + "loss": 1.0526, + "step": 32859 + }, + { + "epoch": 0.99, + "learning_rate": 1.3352910555447519e-09, + "loss": 1.0887, + "step": 32860 + }, + { + "epoch": 0.99, + "learning_rate": 1.327331771429352e-09, + "loss": 1.0437, + "step": 32861 + }, + { + "epoch": 0.99, + "learning_rate": 1.3193962734744935e-09, + "loss": 1.2697, + "step": 32862 + }, + { + "epoch": 0.99, + "learning_rate": 1.311484561755394e-09, + "loss": 1.1853, + "step": 32863 + }, + { + "epoch": 0.99, + "learning_rate": 1.3035966363475483e-09, + "loss": 1.0664, + "step": 32864 + }, + { + "epoch": 0.99, + "learning_rate": 1.2957324973261742e-09, + "loss": 1.0668, + "step": 32865 + }, + { + "epoch": 0.99, + "learning_rate": 1.2878921447659343e-09, + "loss": 1.0996, + "step": 32866 + }, + { + "epoch": 0.99, + "learning_rate": 1.280075578741491e-09, + "loss": 1.048, + "step": 32867 + }, + { + "epoch": 0.99, + "learning_rate": 1.2722827993275066e-09, + "loss": 1.1638, + "step": 32868 + }, + { + "epoch": 0.99, + "learning_rate": 1.2645138065978113e-09, + "loss": 0.9456, + "step": 32869 + }, + { + "epoch": 0.99, + "learning_rate": 1.2567686006265123e-09, + "loss": 1.1543, + "step": 32870 + }, + { + "epoch": 0.99, + "learning_rate": 1.2490471814874395e-09, + "loss": 1.1736, + "step": 32871 + }, + { + "epoch": 0.99, + "learning_rate": 1.2413495492538675e-09, + "loss": 1.0098, + "step": 32872 + }, + { + "epoch": 0.99, + "learning_rate": 1.233675703999071e-09, + "loss": 1.0602, + "step": 32873 + }, + { + "epoch": 0.99, + "learning_rate": 1.2260256457966025e-09, + "loss": 1.1417, + "step": 32874 + }, + { + "epoch": 0.99, + "learning_rate": 1.2183993747186263e-09, + "loss": 1.2054, + "step": 32875 + }, + { + "epoch": 0.99, + "learning_rate": 1.2107968908381395e-09, + "loss": 1.1113, + "step": 32876 + }, + { + "epoch": 0.99, + "learning_rate": 1.2032181942273068e-09, + "loss": 1.1285, + "step": 32877 + }, + { + "epoch": 0.99, + "learning_rate": 1.1956632849585703e-09, + "loss": 1.0187, + "step": 32878 + }, + { + "epoch": 0.99, + "learning_rate": 1.1881321631035393e-09, + "loss": 1.1263, + "step": 32879 + }, + { + "epoch": 0.99, + "learning_rate": 1.1806248287341004e-09, + "loss": 0.9998, + "step": 32880 + }, + { + "epoch": 0.99, + "learning_rate": 1.173141281921586e-09, + "loss": 1.1085, + "step": 32881 + }, + { + "epoch": 0.99, + "learning_rate": 1.1656815227373276e-09, + "loss": 1.0099, + "step": 32882 + }, + { + "epoch": 0.99, + "learning_rate": 1.1582455512521019e-09, + "loss": 1.0617, + "step": 32883 + }, + { + "epoch": 0.99, + "learning_rate": 1.1508333675372407e-09, + "loss": 1.0092, + "step": 32884 + }, + { + "epoch": 0.99, + "learning_rate": 1.1434449716626884e-09, + "loss": 1.0851, + "step": 32885 + }, + { + "epoch": 0.99, + "learning_rate": 1.1360803636992212e-09, + "loss": 1.171, + "step": 32886 + }, + { + "epoch": 0.99, + "learning_rate": 1.1287395437165061e-09, + "loss": 1.1313, + "step": 32887 + }, + { + "epoch": 0.99, + "learning_rate": 1.121422511785042e-09, + "loss": 0.9343, + "step": 32888 + }, + { + "epoch": 0.99, + "learning_rate": 1.1141292679739402e-09, + "loss": 1.1863, + "step": 32889 + }, + { + "epoch": 0.99, + "learning_rate": 1.1068598123528673e-09, + "loss": 1.0486, + "step": 32890 + }, + { + "epoch": 0.99, + "learning_rate": 1.0996141449909348e-09, + "loss": 1.0574, + "step": 32891 + }, + { + "epoch": 0.99, + "learning_rate": 1.0923922659569763e-09, + "loss": 1.2819, + "step": 32892 + }, + { + "epoch": 0.99, + "learning_rate": 1.085194175320381e-09, + "loss": 1.0824, + "step": 32893 + }, + { + "epoch": 0.99, + "learning_rate": 1.0780198731488723e-09, + "loss": 1.0333, + "step": 32894 + }, + { + "epoch": 0.99, + "learning_rate": 1.070869359511284e-09, + "loss": 0.9579, + "step": 32895 + }, + { + "epoch": 0.99, + "learning_rate": 1.06374263447534e-09, + "loss": 1.0368, + "step": 32896 + }, + { + "epoch": 0.99, + "learning_rate": 1.056639698109041e-09, + "loss": 0.9908, + "step": 32897 + }, + { + "epoch": 0.99, + "learning_rate": 1.049560550480111e-09, + "loss": 1.0493, + "step": 32898 + }, + { + "epoch": 0.99, + "learning_rate": 1.0425051916557182e-09, + "loss": 1.0934, + "step": 32899 + }, + { + "epoch": 0.99, + "learning_rate": 1.035473621703309e-09, + "loss": 1.0508, + "step": 32900 + }, + { + "epoch": 0.99, + "learning_rate": 1.0284658406894965e-09, + "loss": 1.1174, + "step": 32901 + }, + { + "epoch": 0.99, + "learning_rate": 1.0214818486811718e-09, + "loss": 1.0583, + "step": 32902 + }, + { + "epoch": 0.99, + "learning_rate": 1.0145216457446705e-09, + "loss": 1.0852, + "step": 32903 + }, + { + "epoch": 0.99, + "learning_rate": 1.007585231946606e-09, + "loss": 1.109, + "step": 32904 + }, + { + "epoch": 0.99, + "learning_rate": 1.0006726073527595e-09, + "loss": 1.1584, + "step": 32905 + }, + { + "epoch": 0.99, + "learning_rate": 9.937837720289112e-10, + "loss": 1.1946, + "step": 32906 + }, + { + "epoch": 0.99, + "learning_rate": 9.869187260405644e-10, + "loss": 1.1096, + "step": 32907 + }, + { + "epoch": 0.99, + "learning_rate": 9.800774694532223e-10, + "loss": 1.0681, + "step": 32908 + }, + { + "epoch": 0.99, + "learning_rate": 9.732600023321104e-10, + "loss": 1.0684, + "step": 32909 + }, + { + "epoch": 0.99, + "learning_rate": 9.664663247416218e-10, + "loss": 1.1252, + "step": 32910 + }, + { + "epoch": 0.99, + "learning_rate": 9.596964367472594e-10, + "loss": 1.1495, + "step": 32911 + }, + { + "epoch": 0.99, + "learning_rate": 9.529503384128612e-10, + "loss": 1.0907, + "step": 32912 + }, + { + "epoch": 0.99, + "learning_rate": 9.462280298025427e-10, + "loss": 1.0656, + "step": 32913 + }, + { + "epoch": 0.99, + "learning_rate": 9.395295109806967e-10, + "loss": 1.0991, + "step": 32914 + }, + { + "epoch": 0.99, + "learning_rate": 9.328547820111612e-10, + "loss": 1.0484, + "step": 32915 + }, + { + "epoch": 0.99, + "learning_rate": 9.262038429569408e-10, + "loss": 1.0553, + "step": 32916 + }, + { + "epoch": 0.99, + "learning_rate": 9.19576693881874e-10, + "loss": 1.1709, + "step": 32917 + }, + { + "epoch": 0.99, + "learning_rate": 9.12973334848688e-10, + "loss": 1.035, + "step": 32918 + }, + { + "epoch": 0.99, + "learning_rate": 9.063937659206656e-10, + "loss": 1.1105, + "step": 32919 + }, + { + "epoch": 0.99, + "learning_rate": 8.998379871599794e-10, + "loss": 1.0562, + "step": 32920 + }, + { + "epoch": 0.99, + "learning_rate": 8.933059986290793e-10, + "loss": 1.0479, + "step": 32921 + }, + { + "epoch": 0.99, + "learning_rate": 8.867978003906929e-10, + "loss": 1.0377, + "step": 32922 + }, + { + "epoch": 0.99, + "learning_rate": 8.803133925058827e-10, + "loss": 1.2173, + "step": 32923 + }, + { + "epoch": 0.99, + "learning_rate": 8.738527750370984e-10, + "loss": 1.231, + "step": 32924 + }, + { + "epoch": 0.99, + "learning_rate": 8.674159480456801e-10, + "loss": 1.2141, + "step": 32925 + }, + { + "epoch": 0.99, + "learning_rate": 8.610029115929674e-10, + "loss": 1.1369, + "step": 32926 + }, + { + "epoch": 0.99, + "learning_rate": 8.546136657397452e-10, + "loss": 1.0313, + "step": 32927 + }, + { + "epoch": 0.99, + "learning_rate": 8.482482105467982e-10, + "loss": 1.0765, + "step": 32928 + }, + { + "epoch": 0.99, + "learning_rate": 8.419065460751885e-10, + "loss": 1.0853, + "step": 32929 + }, + { + "epoch": 0.99, + "learning_rate": 8.355886723845908e-10, + "loss": 1.1735, + "step": 32930 + }, + { + "epoch": 0.99, + "learning_rate": 8.292945895357896e-10, + "loss": 1.0782, + "step": 32931 + }, + { + "epoch": 0.99, + "learning_rate": 8.230242975884595e-10, + "loss": 1.0622, + "step": 32932 + }, + { + "epoch": 0.99, + "learning_rate": 8.167777966025525e-10, + "loss": 1.1707, + "step": 32933 + }, + { + "epoch": 0.99, + "learning_rate": 8.105550866369105e-10, + "loss": 1.0694, + "step": 32934 + }, + { + "epoch": 0.99, + "learning_rate": 8.04356167751208e-10, + "loss": 1.0637, + "step": 32935 + }, + { + "epoch": 0.99, + "learning_rate": 7.981810400042867e-10, + "loss": 1.0619, + "step": 32936 + }, + { + "epoch": 0.99, + "learning_rate": 7.92029703455266e-10, + "loss": 1.0787, + "step": 32937 + }, + { + "epoch": 0.99, + "learning_rate": 7.859021581624327e-10, + "loss": 1.08, + "step": 32938 + }, + { + "epoch": 0.99, + "learning_rate": 7.797984041840733e-10, + "loss": 1.1805, + "step": 32939 + }, + { + "epoch": 0.99, + "learning_rate": 7.737184415781973e-10, + "loss": 1.0162, + "step": 32940 + }, + { + "epoch": 0.99, + "learning_rate": 7.676622704030912e-10, + "loss": 1.104, + "step": 32941 + }, + { + "epoch": 0.99, + "learning_rate": 7.61629890716209e-10, + "loss": 1.1526, + "step": 32942 + }, + { + "epoch": 0.99, + "learning_rate": 7.556213025747272e-10, + "loss": 1.2235, + "step": 32943 + }, + { + "epoch": 0.99, + "learning_rate": 7.496365060360999e-10, + "loss": 1.1776, + "step": 32944 + }, + { + "epoch": 0.99, + "learning_rate": 7.436755011572261e-10, + "loss": 1.0201, + "step": 32945 + }, + { + "epoch": 0.99, + "learning_rate": 7.377382879950046e-10, + "loss": 1.0609, + "step": 32946 + }, + { + "epoch": 0.99, + "learning_rate": 7.318248666057793e-10, + "loss": 1.1028, + "step": 32947 + }, + { + "epoch": 0.99, + "learning_rate": 7.259352370458939e-10, + "loss": 1.1349, + "step": 32948 + }, + { + "epoch": 0.99, + "learning_rate": 7.200693993714147e-10, + "loss": 1.2382, + "step": 32949 + }, + { + "epoch": 0.99, + "learning_rate": 7.142273536381306e-10, + "loss": 1.1058, + "step": 32950 + }, + { + "epoch": 0.99, + "learning_rate": 7.084090999018301e-10, + "loss": 1.1109, + "step": 32951 + }, + { + "epoch": 0.99, + "learning_rate": 7.026146382177467e-10, + "loss": 1.121, + "step": 32952 + }, + { + "epoch": 0.99, + "learning_rate": 6.968439686411144e-10, + "loss": 1.0289, + "step": 32953 + }, + { + "epoch": 0.99, + "learning_rate": 6.910970912266113e-10, + "loss": 1.0922, + "step": 32954 + }, + { + "epoch": 0.99, + "learning_rate": 6.853740060291936e-10, + "loss": 1.0816, + "step": 32955 + }, + { + "epoch": 0.99, + "learning_rate": 6.796747131035398e-10, + "loss": 1.1216, + "step": 32956 + }, + { + "epoch": 0.99, + "learning_rate": 6.739992125034956e-10, + "loss": 1.1234, + "step": 32957 + }, + { + "epoch": 0.99, + "learning_rate": 6.683475042831844e-10, + "loss": 1.0356, + "step": 32958 + }, + { + "epoch": 0.99, + "learning_rate": 6.627195884967297e-10, + "loss": 1.0616, + "step": 32959 + }, + { + "epoch": 0.99, + "learning_rate": 6.571154651971445e-10, + "loss": 1.1823, + "step": 32960 + }, + { + "epoch": 0.99, + "learning_rate": 6.515351344382747e-10, + "loss": 1.2091, + "step": 32961 + }, + { + "epoch": 0.99, + "learning_rate": 6.459785962731336e-10, + "loss": 1.1525, + "step": 32962 + }, + { + "epoch": 0.99, + "learning_rate": 6.404458507544565e-10, + "loss": 1.0505, + "step": 32963 + }, + { + "epoch": 0.99, + "learning_rate": 6.34936897934979e-10, + "loss": 1.0203, + "step": 32964 + }, + { + "epoch": 0.99, + "learning_rate": 6.294517378671594e-10, + "loss": 0.9507, + "step": 32965 + }, + { + "epoch": 0.99, + "learning_rate": 6.239903706031781e-10, + "loss": 1.0104, + "step": 32966 + }, + { + "epoch": 0.99, + "learning_rate": 6.185527961952153e-10, + "loss": 1.1522, + "step": 32967 + }, + { + "epoch": 0.99, + "learning_rate": 6.131390146948968e-10, + "loss": 1.2462, + "step": 32968 + }, + { + "epoch": 0.99, + "learning_rate": 6.077490261535702e-10, + "loss": 1.1328, + "step": 32969 + }, + { + "epoch": 0.99, + "learning_rate": 6.023828306228607e-10, + "loss": 1.0892, + "step": 32970 + }, + { + "epoch": 0.99, + "learning_rate": 5.970404281535613e-10, + "loss": 1.0588, + "step": 32971 + }, + { + "epoch": 0.99, + "learning_rate": 5.917218187967422e-10, + "loss": 1.1003, + "step": 32972 + }, + { + "epoch": 0.99, + "learning_rate": 5.86427002603196e-10, + "loss": 1.162, + "step": 32973 + }, + { + "epoch": 0.99, + "learning_rate": 5.811559796228827e-10, + "loss": 1.1757, + "step": 32974 + }, + { + "epoch": 0.99, + "learning_rate": 5.759087499063176e-10, + "loss": 1.0225, + "step": 32975 + }, + { + "epoch": 0.99, + "learning_rate": 5.706853135031831e-10, + "loss": 1.1467, + "step": 32976 + }, + { + "epoch": 0.99, + "learning_rate": 5.654856704634392e-10, + "loss": 1.065, + "step": 32977 + }, + { + "epoch": 0.99, + "learning_rate": 5.60309820836491e-10, + "loss": 1.0529, + "step": 32978 + }, + { + "epoch": 0.99, + "learning_rate": 5.551577646717432e-10, + "loss": 1.0012, + "step": 32979 + }, + { + "epoch": 0.99, + "learning_rate": 5.500295020180457e-10, + "loss": 0.9911, + "step": 32980 + }, + { + "epoch": 0.99, + "learning_rate": 5.449250329242484e-10, + "loss": 1.1876, + "step": 32981 + }, + { + "epoch": 0.99, + "learning_rate": 5.398443574389234e-10, + "loss": 0.998, + "step": 32982 + }, + { + "epoch": 0.99, + "learning_rate": 5.34787475610643e-10, + "loss": 1.0225, + "step": 32983 + }, + { + "epoch": 0.99, + "learning_rate": 5.297543874874245e-10, + "loss": 1.1251, + "step": 32984 + }, + { + "epoch": 0.99, + "learning_rate": 5.247450931170072e-10, + "loss": 1.0544, + "step": 32985 + }, + { + "epoch": 0.99, + "learning_rate": 5.197595925474086e-10, + "loss": 1.1492, + "step": 32986 + }, + { + "epoch": 0.99, + "learning_rate": 5.147978858258129e-10, + "loss": 1.0798, + "step": 32987 + }, + { + "epoch": 0.99, + "learning_rate": 5.098599729994047e-10, + "loss": 1.084, + "step": 32988 + }, + { + "epoch": 0.99, + "learning_rate": 5.049458541153684e-10, + "loss": 1.0396, + "step": 32989 + }, + { + "epoch": 0.99, + "learning_rate": 5.000555292206111e-10, + "loss": 1.1268, + "step": 32990 + }, + { + "epoch": 0.99, + "learning_rate": 4.951889983614844e-10, + "loss": 1.1436, + "step": 32991 + }, + { + "epoch": 0.99, + "learning_rate": 4.903462615843401e-10, + "loss": 1.1479, + "step": 32992 + }, + { + "epoch": 0.99, + "learning_rate": 4.855273189352527e-10, + "loss": 1.1349, + "step": 32993 + }, + { + "epoch": 0.99, + "learning_rate": 4.807321704602963e-10, + "loss": 1.0587, + "step": 32994 + }, + { + "epoch": 0.99, + "learning_rate": 4.759608162047125e-10, + "loss": 1.118, + "step": 32995 + }, + { + "epoch": 0.99, + "learning_rate": 4.712132562142979e-10, + "loss": 1.1384, + "step": 32996 + }, + { + "epoch": 0.99, + "learning_rate": 4.664894905340168e-10, + "loss": 1.0479, + "step": 32997 + }, + { + "epoch": 0.99, + "learning_rate": 4.6178951920911043e-10, + "loss": 1.2314, + "step": 32998 + }, + { + "epoch": 0.99, + "learning_rate": 4.5711334228398797e-10, + "loss": 1.1695, + "step": 32999 + }, + { + "epoch": 0.99, + "learning_rate": 4.5246095980361336e-10, + "loss": 1.0592, + "step": 33000 + }, + { + "epoch": 0.99, + "learning_rate": 4.478323718115629e-10, + "loss": 1.2285, + "step": 33001 + }, + { + "epoch": 0.99, + "learning_rate": 4.4322757835252304e-10, + "loss": 1.0247, + "step": 33002 + }, + { + "epoch": 0.99, + "learning_rate": 4.386465794703476e-10, + "loss": 1.1958, + "step": 33003 + }, + { + "epoch": 0.99, + "learning_rate": 4.340893752080577e-10, + "loss": 1.056, + "step": 33004 + }, + { + "epoch": 0.99, + "learning_rate": 4.2955596560978476e-10, + "loss": 1.1659, + "step": 33005 + }, + { + "epoch": 0.99, + "learning_rate": 4.250463507179947e-10, + "loss": 1.2729, + "step": 33006 + }, + { + "epoch": 0.99, + "learning_rate": 4.2056053057598636e-10, + "loss": 1.1271, + "step": 33007 + }, + { + "epoch": 0.99, + "learning_rate": 4.160985052265032e-10, + "loss": 1.0479, + "step": 33008 + }, + { + "epoch": 0.99, + "learning_rate": 4.1166027471173375e-10, + "loss": 0.9899, + "step": 33009 + }, + { + "epoch": 0.99, + "learning_rate": 4.072458390744216e-10, + "loss": 1.1198, + "step": 33010 + }, + { + "epoch": 0.99, + "learning_rate": 4.0285519835592256e-10, + "loss": 1.0875, + "step": 33011 + }, + { + "epoch": 0.99, + "learning_rate": 3.9848835259870264e-10, + "loss": 1.2603, + "step": 33012 + }, + { + "epoch": 0.99, + "learning_rate": 3.9414530184384016e-10, + "loss": 1.0491, + "step": 33013 + }, + { + "epoch": 0.99, + "learning_rate": 3.898260461329684e-10, + "loss": 1.0337, + "step": 33014 + }, + { + "epoch": 0.99, + "learning_rate": 3.8553058550688804e-10, + "loss": 1.1464, + "step": 33015 + }, + { + "epoch": 0.99, + "learning_rate": 3.8125892000695497e-10, + "loss": 1.0603, + "step": 33016 + }, + { + "epoch": 0.99, + "learning_rate": 3.770110496734147e-10, + "loss": 1.0554, + "step": 33017 + }, + { + "epoch": 0.99, + "learning_rate": 3.7278697454706803e-10, + "loss": 1.2672, + "step": 33018 + }, + { + "epoch": 0.99, + "learning_rate": 3.685866946678829e-10, + "loss": 1.0544, + "step": 33019 + }, + { + "epoch": 0.99, + "learning_rate": 3.6441021007582733e-10, + "loss": 1.0002, + "step": 33020 + }, + { + "epoch": 0.99, + "learning_rate": 3.6025752081059184e-10, + "loss": 1.1223, + "step": 33021 + }, + { + "epoch": 0.99, + "learning_rate": 3.561286269118669e-10, + "loss": 1.118, + "step": 33022 + }, + { + "epoch": 0.99, + "learning_rate": 3.5202352841906537e-10, + "loss": 1.068, + "step": 33023 + }, + { + "epoch": 0.99, + "learning_rate": 3.479422253710452e-10, + "loss": 1.1216, + "step": 33024 + }, + { + "epoch": 0.99, + "learning_rate": 3.43884717806664e-10, + "loss": 1.0424, + "step": 33025 + }, + { + "epoch": 0.99, + "learning_rate": 3.398510057647797e-10, + "loss": 1.1321, + "step": 33026 + }, + { + "epoch": 0.99, + "learning_rate": 3.35841089283695e-10, + "loss": 1.1277, + "step": 33027 + }, + { + "epoch": 0.99, + "learning_rate": 3.3185496840143496e-10, + "loss": 1.1323, + "step": 33028 + }, + { + "epoch": 0.99, + "learning_rate": 3.2789264315602477e-10, + "loss": 1.1749, + "step": 33029 + }, + { + "epoch": 1.0, + "learning_rate": 3.2395411358521203e-10, + "loss": 1.243, + "step": 33030 + }, + { + "epoch": 1.0, + "learning_rate": 3.2003937972618915e-10, + "loss": 1.2122, + "step": 33031 + }, + { + "epoch": 1.0, + "learning_rate": 3.161484416169813e-10, + "loss": 1.0864, + "step": 33032 + }, + { + "epoch": 1.0, + "learning_rate": 3.1228129929394834e-10, + "loss": 1.0714, + "step": 33033 + }, + { + "epoch": 1.0, + "learning_rate": 3.084379527940051e-10, + "loss": 1.1368, + "step": 33034 + }, + { + "epoch": 1.0, + "learning_rate": 3.0461840215378903e-10, + "loss": 1.0422, + "step": 33035 + }, + { + "epoch": 1.0, + "learning_rate": 3.008226474099374e-10, + "loss": 0.9588, + "step": 33036 + }, + { + "epoch": 1.0, + "learning_rate": 2.970506885982549e-10, + "loss": 1.1442, + "step": 33037 + }, + { + "epoch": 1.0, + "learning_rate": 2.9330252575482386e-10, + "loss": 1.0621, + "step": 33038 + }, + { + "epoch": 1.0, + "learning_rate": 2.8957815891517136e-10, + "loss": 1.0429, + "step": 33039 + }, + { + "epoch": 1.0, + "learning_rate": 2.858775881148246e-10, + "loss": 0.9027, + "step": 33040 + }, + { + "epoch": 1.0, + "learning_rate": 2.8220081338903306e-10, + "loss": 1.1396, + "step": 33041 + }, + { + "epoch": 1.0, + "learning_rate": 2.785478347727688e-10, + "loss": 1.1773, + "step": 33042 + }, + { + "epoch": 1.0, + "learning_rate": 2.7491865230072636e-10, + "loss": 1.1185, + "step": 33043 + }, + { + "epoch": 1.0, + "learning_rate": 2.713132660078777e-10, + "loss": 1.0284, + "step": 33044 + }, + { + "epoch": 1.0, + "learning_rate": 2.67731675927807e-10, + "loss": 1.1274, + "step": 33045 + }, + { + "epoch": 1.0, + "learning_rate": 2.641738820952089e-10, + "loss": 1.1525, + "step": 33046 + }, + { + "epoch": 1.0, + "learning_rate": 2.606398845439451e-10, + "loss": 1.0217, + "step": 33047 + }, + { + "epoch": 1.0, + "learning_rate": 2.5712968330704466e-10, + "loss": 1.2305, + "step": 33048 + }, + { + "epoch": 1.0, + "learning_rate": 2.5364327841864713e-10, + "loss": 1.15, + "step": 33049 + }, + { + "epoch": 1.0, + "learning_rate": 2.501806699117815e-10, + "loss": 1.2404, + "step": 33050 + }, + { + "epoch": 1.0, + "learning_rate": 2.467418578189218e-10, + "loss": 1.1283, + "step": 33051 + }, + { + "epoch": 1.0, + "learning_rate": 2.433268421733748e-10, + "loss": 1.0721, + "step": 33052 + }, + { + "epoch": 1.0, + "learning_rate": 2.3993562300733685e-10, + "loss": 0.9764, + "step": 33053 + }, + { + "epoch": 1.0, + "learning_rate": 2.365682003532821e-10, + "loss": 1.0529, + "step": 33054 + }, + { + "epoch": 1.0, + "learning_rate": 2.332245742431294e-10, + "loss": 1.031, + "step": 33055 + }, + { + "epoch": 1.0, + "learning_rate": 2.2990474470879765e-10, + "loss": 1.0429, + "step": 33056 + }, + { + "epoch": 1.0, + "learning_rate": 2.2660871178192822e-10, + "loss": 1.0901, + "step": 33057 + }, + { + "epoch": 1.0, + "learning_rate": 2.2333647549360738e-10, + "loss": 1.1597, + "step": 33058 + }, + { + "epoch": 1.0, + "learning_rate": 2.2008803587519888e-10, + "loss": 1.0881, + "step": 33059 + }, + { + "epoch": 1.0, + "learning_rate": 2.1686339295778903e-10, + "loss": 1.0688, + "step": 33060 + }, + { + "epoch": 1.0, + "learning_rate": 2.1366254677163135e-10, + "loss": 1.018, + "step": 33061 + }, + { + "epoch": 1.0, + "learning_rate": 2.104854973478121e-10, + "loss": 1.2083, + "step": 33062 + }, + { + "epoch": 1.0, + "learning_rate": 2.0733224471602974e-10, + "loss": 1.0297, + "step": 33063 + }, + { + "epoch": 1.0, + "learning_rate": 2.0420278890653787e-10, + "loss": 1.1017, + "step": 33064 + }, + { + "epoch": 1.0, + "learning_rate": 2.0109712994903497e-10, + "loss": 1.0924, + "step": 33065 + }, + { + "epoch": 1.0, + "learning_rate": 1.9801526787321946e-10, + "loss": 1.1724, + "step": 33066 + }, + { + "epoch": 1.0, + "learning_rate": 1.949572027082347e-10, + "loss": 1.1212, + "step": 33067 + }, + { + "epoch": 1.0, + "learning_rate": 1.9192293448322407e-10, + "loss": 1.1407, + "step": 33068 + }, + { + "epoch": 1.0, + "learning_rate": 1.8891246322733092e-10, + "loss": 1.104, + "step": 33069 + }, + { + "epoch": 1.0, + "learning_rate": 1.859257889691435e-10, + "loss": 1.1549, + "step": 33070 + }, + { + "epoch": 1.0, + "learning_rate": 1.8296291173697244e-10, + "loss": 1.097, + "step": 33071 + }, + { + "epoch": 1.0, + "learning_rate": 1.8002383155885094e-10, + "loss": 1.097, + "step": 33072 + }, + { + "epoch": 1.0, + "learning_rate": 1.7710854846308966e-10, + "loss": 1.0566, + "step": 33073 + }, + { + "epoch": 1.0, + "learning_rate": 1.7421706247716662e-10, + "loss": 0.9356, + "step": 33074 + }, + { + "epoch": 1.0, + "learning_rate": 1.713493736288374e-10, + "loss": 1.0332, + "step": 33075 + }, + { + "epoch": 1.0, + "learning_rate": 1.6850548194530249e-10, + "loss": 1.0674, + "step": 33076 + }, + { + "epoch": 1.0, + "learning_rate": 1.6568538745376229e-10, + "loss": 1.0486, + "step": 33077 + }, + { + "epoch": 1.0, + "learning_rate": 1.6288909018058464e-10, + "loss": 1.0601, + "step": 33078 + }, + { + "epoch": 1.0, + "learning_rate": 1.6011659015297e-10, + "loss": 1.1611, + "step": 33079 + }, + { + "epoch": 1.0, + "learning_rate": 1.5736788739728613e-10, + "loss": 0.9528, + "step": 33080 + }, + { + "epoch": 1.0, + "learning_rate": 1.5464298193906825e-10, + "loss": 1.2121, + "step": 33081 + }, + { + "epoch": 1.0, + "learning_rate": 1.5194187380496162e-10, + "loss": 1.058, + "step": 33082 + }, + { + "epoch": 1.0, + "learning_rate": 1.492645630205014e-10, + "loss": 1.1078, + "step": 33083 + }, + { + "epoch": 1.0, + "learning_rate": 1.4661104961066764e-10, + "loss": 1.0491, + "step": 33084 + }, + { + "epoch": 1.0, + "learning_rate": 1.4398133360155052e-10, + "loss": 1.0687, + "step": 33085 + }, + { + "epoch": 1.0, + "learning_rate": 1.41375415017575e-10, + "loss": 1.1108, + "step": 33086 + }, + { + "epoch": 1.0, + "learning_rate": 1.387932938837211e-10, + "loss": 1.0651, + "step": 33087 + }, + { + "epoch": 1.0, + "learning_rate": 1.3623497022441368e-10, + "loss": 1.1031, + "step": 33088 + }, + { + "epoch": 1.0, + "learning_rate": 1.3370044406435523e-10, + "loss": 1.0941, + "step": 33089 + }, + { + "epoch": 1.0, + "learning_rate": 1.3118971542741553e-10, + "loss": 1.1021, + "step": 33090 + }, + { + "epoch": 1.0, + "learning_rate": 1.2870278433774196e-10, + "loss": 1.1927, + "step": 33091 + }, + { + "epoch": 1.0, + "learning_rate": 1.262396508186492e-10, + "loss": 1.2183, + "step": 33092 + }, + { + "epoch": 1.0, + "learning_rate": 1.2380031489400702e-10, + "loss": 1.0851, + "step": 33093 + }, + { + "epoch": 1.0, + "learning_rate": 1.2138477658657498e-10, + "loss": 1.1129, + "step": 33094 + }, + { + "epoch": 1.0, + "learning_rate": 1.1899303591966783e-10, + "loss": 1.1331, + "step": 33095 + }, + { + "epoch": 1.0, + "learning_rate": 1.1662509291604506e-10, + "loss": 1.1087, + "step": 33096 + }, + { + "epoch": 1.0, + "learning_rate": 1.142809475979112e-10, + "loss": 1.0806, + "step": 33097 + }, + { + "epoch": 1.0, + "learning_rate": 1.1196059998802578e-10, + "loss": 1.1583, + "step": 33098 + }, + { + "epoch": 1.0, + "learning_rate": 1.096640501083157e-10, + "loss": 0.9465, + "step": 33099 + }, + { + "epoch": 1.0, + "learning_rate": 1.0739129798070792e-10, + "loss": 1.0785, + "step": 33100 + }, + { + "epoch": 1.0, + "learning_rate": 1.0514234362657417e-10, + "loss": 1.1268, + "step": 33101 + }, + { + "epoch": 1.0, + "learning_rate": 1.0291718706756382e-10, + "loss": 1.1449, + "step": 33102 + }, + { + "epoch": 1.0, + "learning_rate": 1.0071582832449356e-10, + "loss": 1.0773, + "step": 33103 + }, + { + "epoch": 1.0, + "learning_rate": 9.853826741901274e-11, + "loss": 1.1072, + "step": 33104 + }, + { + "epoch": 1.0, + "learning_rate": 9.638450437138291e-11, + "loss": 1.1156, + "step": 33105 + }, + { + "epoch": 1.0, + "learning_rate": 9.425453920186567e-11, + "loss": 1.0998, + "step": 33106 + }, + { + "epoch": 1.0, + "learning_rate": 9.214837193155524e-11, + "loss": 1.0825, + "step": 33107 + }, + { + "epoch": 1.0, + "learning_rate": 9.006600257960296e-11, + "loss": 1.0976, + "step": 33108 + }, + { + "epoch": 1.0, + "learning_rate": 8.800743116627042e-11, + "loss": 1.1541, + "step": 33109 + }, + { + "epoch": 1.0, + "learning_rate": 8.597265771126406e-11, + "loss": 1.096, + "step": 33110 + }, + { + "epoch": 1.0, + "learning_rate": 8.396168223373524e-11, + "loss": 1.1036, + "step": 33111 + }, + { + "epoch": 1.0, + "learning_rate": 8.19745047528353e-11, + "loss": 1.1827, + "step": 33112 + }, + { + "epoch": 1.0, + "learning_rate": 8.00111252877156e-11, + "loss": 0.9734, + "step": 33113 + }, + { + "epoch": 1.0, + "learning_rate": 7.807154385669479e-11, + "loss": 1.1946, + "step": 33114 + }, + { + "epoch": 1.0, + "learning_rate": 7.615576047836914e-11, + "loss": 0.9805, + "step": 33115 + }, + { + "epoch": 1.0, + "learning_rate": 7.426377517133488e-11, + "loss": 1.0746, + "step": 33116 + }, + { + "epoch": 1.0, + "learning_rate": 7.239558795307799e-11, + "loss": 1.1457, + "step": 33117 + }, + { + "epoch": 1.0, + "learning_rate": 7.055119884163964e-11, + "loss": 1.1096, + "step": 33118 + }, + { + "epoch": 1.0, + "learning_rate": 6.87306078545058e-11, + "loss": 1.1057, + "step": 33119 + }, + { + "epoch": 1.0, + "learning_rate": 6.693381500916252e-11, + "loss": 1.1655, + "step": 33120 + }, + { + "epoch": 1.0, + "learning_rate": 6.516082032254067e-11, + "loss": 1.1645, + "step": 33121 + }, + { + "epoch": 1.0, + "learning_rate": 6.341162381157118e-11, + "loss": 0.972, + "step": 33122 + }, + { + "epoch": 1.0, + "learning_rate": 6.168622549290737e-11, + "loss": 1.0839, + "step": 33123 + }, + { + "epoch": 1.0, + "learning_rate": 5.998462538292504e-11, + "loss": 1.1168, + "step": 33124 + }, + { + "epoch": 1.0, + "learning_rate": 5.830682349799999e-11, + "loss": 1.0378, + "step": 33125 + }, + { + "epoch": 1.0, + "learning_rate": 5.665281985395288e-11, + "loss": 1.0155, + "step": 33126 + }, + { + "epoch": 1.0, + "learning_rate": 5.502261446632684e-11, + "loss": 1.0825, + "step": 33127 + }, + { + "epoch": 1.0, + "learning_rate": 5.341620735122011e-11, + "loss": 1.1794, + "step": 33128 + }, + { + "epoch": 1.0, + "learning_rate": 5.183359852334313e-11, + "loss": 1.1109, + "step": 33129 + }, + { + "epoch": 1.0, + "learning_rate": 5.027478799796148e-11, + "loss": 1.0938, + "step": 33130 + }, + { + "epoch": 1.0, + "learning_rate": 4.873977579006317e-11, + "loss": 0.9793, + "step": 33131 + }, + { + "epoch": 1.0, + "learning_rate": 4.722856191435865e-11, + "loss": 1.1646, + "step": 33132 + }, + { + "epoch": 1.0, + "learning_rate": 4.574114638472571e-11, + "loss": 1.0902, + "step": 33133 + }, + { + "epoch": 1.0, + "learning_rate": 4.427752921559725e-11, + "loss": 1.0601, + "step": 33134 + }, + { + "epoch": 1.0, + "learning_rate": 4.283771042112861e-11, + "loss": 1.1811, + "step": 33135 + }, + { + "epoch": 1.0, + "learning_rate": 4.142169001464247e-11, + "loss": 1.2047, + "step": 33136 + }, + { + "epoch": 1.0, + "learning_rate": 4.0029468010016614e-11, + "loss": 1.1036, + "step": 33137 + }, + { + "epoch": 1.0, + "learning_rate": 3.866104442001861e-11, + "loss": 1.0632, + "step": 33138 + }, + { + "epoch": 1.0, + "learning_rate": 3.731641925824869e-11, + "loss": 1.1048, + "step": 33139 + }, + { + "epoch": 1.0, + "learning_rate": 3.599559253691931e-11, + "loss": 1.1401, + "step": 33140 + }, + { + "epoch": 1.0, + "learning_rate": 3.4698564269075583e-11, + "loss": 1.081, + "step": 33141 + }, + { + "epoch": 1.0, + "learning_rate": 3.3425334466652413e-11, + "loss": 1.1409, + "step": 33142 + }, + { + "epoch": 1.0, + "learning_rate": 3.217590314213981e-11, + "loss": 1.2343, + "step": 33143 + }, + { + "epoch": 1.0, + "learning_rate": 3.0950270307472664e-11, + "loss": 1.1107, + "step": 33144 + }, + { + "epoch": 1.0, + "learning_rate": 2.9748435973753206e-11, + "loss": 1.0673, + "step": 33145 + }, + { + "epoch": 1.0, + "learning_rate": 2.85704001531939e-11, + "loss": 0.9727, + "step": 33146 + }, + { + "epoch": 1.0, + "learning_rate": 2.7416162856341855e-11, + "loss": 1.0475, + "step": 33147 + }, + { + "epoch": 1.0, + "learning_rate": 2.628572409457686e-11, + "loss": 1.1937, + "step": 33148 + }, + { + "epoch": 1.0, + "learning_rate": 2.517908387844603e-11, + "loss": 1.2767, + "step": 33149 + }, + { + "epoch": 1.0, + "learning_rate": 2.409624221849649e-11, + "loss": 1.1508, + "step": 33150 + }, + { + "epoch": 1.0, + "learning_rate": 2.3037199125275354e-11, + "loss": 1.0529, + "step": 33151 + }, + { + "epoch": 1.0, + "learning_rate": 2.2001954608774634e-11, + "loss": 1.0743, + "step": 33152 + }, + { + "epoch": 1.0, + "learning_rate": 2.0990508678708778e-11, + "loss": 1.0549, + "step": 33153 + }, + { + "epoch": 1.0, + "learning_rate": 2.0002861344792233e-11, + "loss": 1.2216, + "step": 33154 + }, + { + "epoch": 1.0, + "learning_rate": 1.9039012616461904e-11, + "loss": 1.148, + "step": 33155 + }, + { + "epoch": 1.0, + "learning_rate": 1.809896250259957e-11, + "loss": 1.1783, + "step": 33156 + }, + { + "epoch": 1.0, + "learning_rate": 1.7182711012642128e-11, + "loss": 1.08, + "step": 33157 + }, + { + "epoch": 1.0, + "learning_rate": 1.6290258155193804e-11, + "loss": 1.0224, + "step": 33158 + }, + { + "epoch": 1.0, + "learning_rate": 1.5421603938303718e-11, + "loss": 1.0767, + "step": 33159 + }, + { + "epoch": 1.0, + "learning_rate": 1.4576748370853655e-11, + "loss": 1.0325, + "step": 33160 + }, + { + "epoch": 1.0, + "learning_rate": 1.3755691460337617e-11, + "loss": 1.0644, + "step": 33161 + }, + { + "epoch": 1.0, + "learning_rate": 1.2958433215082278e-11, + "loss": 1.2864, + "step": 33162 + }, + { + "epoch": 1.0, + "learning_rate": 1.2184973642304088e-11, + "loss": 1.0948, + "step": 33163 + }, + { + "epoch": 1.0, + "learning_rate": 1.1435312749497052e-11, + "loss": 1.0555, + "step": 33164 + }, + { + "epoch": 1.0, + "learning_rate": 1.070945054387762e-11, + "loss": 1.1112, + "step": 33165 + }, + { + "epoch": 1.0, + "learning_rate": 1.000738703210713e-11, + "loss": 1.1691, + "step": 33166 + }, + { + "epoch": 1.0, + "learning_rate": 9.329122221124476e-12, + "loss": 1.0519, + "step": 33167 + }, + { + "epoch": 1.0, + "learning_rate": 8.67465611731344e-12, + "loss": 1.0447, + "step": 33168 + }, + { + "epoch": 1.0, + "learning_rate": 8.04398872678025e-12, + "loss": 1.0714, + "step": 33169 + }, + { + "epoch": 1.0, + "learning_rate": 7.437120055631131e-12, + "loss": 1.0355, + "step": 33170 + }, + { + "epoch": 1.0, + "learning_rate": 6.854050109694754e-12, + "loss": 0.9724, + "step": 33171 + }, + { + "epoch": 1.0, + "learning_rate": 6.294778894522236e-12, + "loss": 1.0798, + "step": 33172 + }, + { + "epoch": 1.0, + "learning_rate": 5.759306415387134e-12, + "loss": 1.0808, + "step": 33173 + }, + { + "epoch": 1.0, + "learning_rate": 5.247632677285452e-12, + "loss": 1.0862, + "step": 33174 + }, + { + "epoch": 1.0, + "learning_rate": 4.7597576852131956e-12, + "loss": 1.0765, + "step": 33175 + }, + { + "epoch": 1.0, + "learning_rate": 4.29568144388881e-12, + "loss": 1.0955, + "step": 33176 + }, + { + "epoch": 1.0, + "learning_rate": 3.855403957475634e-12, + "loss": 0.932, + "step": 33177 + }, + { + "epoch": 1.0, + "learning_rate": 3.438925230414558e-12, + "loss": 1.0955, + "step": 33178 + }, + { + "epoch": 1.0, + "learning_rate": 3.0462452665913633e-12, + "loss": 1.2332, + "step": 33179 + }, + { + "epoch": 1.0, + "learning_rate": 2.6773640696142744e-12, + "loss": 1.018, + "step": 33180 + }, + { + "epoch": 1.0, + "learning_rate": 2.3322816430915163e-12, + "loss": 1.024, + "step": 33181 + }, + { + "epoch": 1.0, + "learning_rate": 2.010997990631314e-12, + "loss": 1.1562, + "step": 33182 + }, + { + "epoch": 1.0, + "learning_rate": 1.7135131147316687e-12, + "loss": 1.1175, + "step": 33183 + }, + { + "epoch": 1.0, + "learning_rate": 1.439827018445694e-12, + "loss": 1.0069, + "step": 33184 + }, + { + "epoch": 1.0, + "learning_rate": 1.189939704548948e-12, + "loss": 1.0455, + "step": 33185 + }, + { + "epoch": 1.0, + "learning_rate": 9.638511752618762e-13, + "loss": 1.2671, + "step": 33186 + }, + { + "epoch": 1.0, + "learning_rate": 7.615614325273691e-13, + "loss": 1.2811, + "step": 33187 + }, + { + "epoch": 1.0, + "learning_rate": 5.830704788434283e-13, + "loss": 1.2257, + "step": 33188 + }, + { + "epoch": 1.0, + "learning_rate": 4.2837831532027697e-13, + "loss": 1.047, + "step": 33189 + }, + { + "epoch": 1.0, + "learning_rate": 2.974849439008054e-13, + "loss": 1.0248, + "step": 33190 + }, + { + "epoch": 1.0, + "learning_rate": 1.9039036541768086e-13, + "loss": 1.1207, + "step": 33191 + }, + { + "epoch": 1.0, + "learning_rate": 1.0709458125868211e-13, + "loss": 1.1119, + "step": 33192 + }, + { + "epoch": 1.0, + "learning_rate": 4.759759170136491e-14, + "loss": 1.1302, + "step": 33193 + }, + { + "epoch": 1.0, + "learning_rate": 1.1899397855952288e-14, + "loss": 1.1273, + "step": 33194 + }, + { + "epoch": 1.0, + "learning_rate": 0.0, + "loss": 1.1128, + "step": 33195 + }, + { + "epoch": 1.0, + "step": 33195, + "total_flos": 7183881258045440.0, + "train_loss": 1.1314439481955585, + "train_runtime": 84160.343, + "train_samples_per_second": 12.621, + "train_steps_per_second": 0.394 + } + ], + "max_steps": 33195, + "num_train_epochs": 1, + "total_flos": 7183881258045440.0, + "trial_name": null, + "trial_params": null +}